package Business::ISBN;
use strict;
=encoding utf8
=head1 NAME
Business::ISBN - work with International Standard Book Numbers
=head1 SYNOPSIS
use Business::ISBN;
# 10 digit ISBNs
$isbn10 = Business::ISBN->new('1565922573');
$isbn10 = Business::ISBN->new('1-56592-257-3');
# 13 digit ISBNs
$isbn13 = Business::ISBN->new('978-0-596-52724-2');
# convert
$isbn10 = $isbn13->as_isbn10; # for the 978 prefixes
$isbn13 = $isbn10->as_isbn13;
# maybe you don't care what it is as long as everything works
$isbn = Business::ISBN->new( $ARGV[0] );
#print the ISBN with hyphens at usual positions
print $isbn->as_string;
#print the ISBN with hyphens at specified positions.
#this not does affect the default positions
print $isbn->as_string([]);
#print the group code or publisher code
print $isbn->group_code;
print $isbn->publisher_code;
#check to see if the ISBN is valid
$isbn->is_valid;
#fix the ISBN checksum. BEWARE: the error might not be
#in the checksum!
$isbn->fix_checksum;
# create an EAN13 barcode in PNG format
$isbn->png_barcode;
=head1 DESCRIPTION
This modules handles International Standard Book Numbers, including
ISBN-10 and ISBN-13.
=cut
# # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #
# # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #
# # Boring set up stuff
use subs qw(
_common_format
INVALID_GROUP_CODE
INVALID_PUBLISHER_CODE
BAD_CHECKSUM
GOOD_ISBN
BAD_ISBN
);
use vars qw( $VERSION @ISA @EXPORT_OK %EXPORT_TAGS $debug %group_data
$MAX_GROUP_CODE_LENGTH %ERROR_TEXT );
use Carp qw(carp croak cluck);
use base qw(Exporter);
use Business::ISBN::Data 20120719.001; # now a separate module
# ugh, hack
*group_data = *Business::ISBN::country_data;
sub _group_data { $group_data{ $_[1] } }
sub _max_group_code_length { $Business::ISBN::MAX_COUNTRY_CODE_LENGTH };
sub _max_publisher_code_length {
$_[0]->_max_length
- $_[0]->_prefix_length # prefix
- $_[0]->_group_code_length # group
- 1 # article
- 1; # checksum
};
sub _publisher_ranges {
my $self = shift;
[ @{ $self->_group_data( $self->group_code )->[1] } ];
}
my $debug = 0;
BEGIN {
@EXPORT_OK = qw(
INVALID_GROUP_CODE INVALID_PUBLISHER_CODE
BAD_CHECKSUM GOOD_ISBN BAD_ISBN
INVALID_PREFIX
%ERROR_TEXT
valid_isbn_checksum
);
%EXPORT_TAGS = (
'all' => \@EXPORT_OK,
);
};
$VERSION = "2.06";
sub INVALID_PREFIX () { -4 };
sub INVALID_GROUP_CODE () { -2 };
sub INVALID_PUBLISHER_CODE () { -3 };
sub BAD_CHECKSUM () { -1 };
sub GOOD_ISBN () { 1 };
sub BAD_ISBN () { 0 };
%ERROR_TEXT = (
0 => "Bad ISBN",
1 => "Good ISBN",
-1 => "Bad ISBN checksum",
-2 => "Invalid group code",
-3 => "Invalid publisher code",
-4 => "Invalid prefix (must be 978 or 979)",
);
use Business::ISBN10;
use Business::ISBN13;
=head2 Function interface
=over 4
=item valid_isbn_checksum( ISBN10 | ISBN13 )
This function is exportable on demand, and works for either 10
or 13 character ISBNs).
use Business::ISBN qw( valid_isbn_checksum );
Returns 1 if the ISBN is a valid ISBN with the right checksum.
Returns 0 if the ISBN has valid prefix and publisher codes, but an
invalid checksum.
Returns undef if the ISBN does not validate for any other reason.
=back
=cut
sub valid_isbn_checksum {
my $isbn = shift;
my $obj = Business::ISBN->new( $isbn );
return unless defined $obj;
return 1 if $obj->is_valid_checksum == GOOD_ISBN;
return 0 if $obj->is_valid_checksum == BAD_CHECKSUM;
return;
}
=head2 Object interface
=over 4
=item new($isbn)
The constructor accepts a scalar representing the ISBN.
The string representing the ISBN may contain characters other than
C<[0-9xX]>, although these will be removed in the internal
representation. The resulting string must look like an ISBN - the
first nine characters must be digits and the tenth character must be a
digit, 'x', or 'X'.
The constructor attempts to determine the group code and the publisher
code. If these data cannot be determined, the constructor sets C<<
$obj->error >> to something other than C<GOOD_ISBN>. An object is
still returned and it is up to the program to check C<< $obj->error >>
for one of five values (which may be exported on demand). The actual
values of these symbolic versions are the same as those from previous
versions of this module which used literal values.
Business::ISBN::INVALID_PUBLISHER_CODE
Business::ISBN::INVALID_GROUP_CODE
Business::ISBN::BAD_CHECKSUM
Business::ISBN::GOOD_ISBN
Business::ISBN::BAD_ISBN
If you have one of these values and want to turn it into a string, you
can use the C<%Business::ISBN::ERROR_TEXT> hash, which is exportable
by asking for it explicitly in the import list.
use Business::ISBN qw(%ERROR_TEXT);
The string passed as the ISBN need not be a valid ISBN as long as it
superficially looks like one. This allows one to use the
C<fix_checksum()> method. Despite the disclaimer in the discussion of
that method, the author has found it extremely useful. One should
check the validity of the ISBN with C<is_valid()> rather than relying
on the return value of the constructor. If all one wants to do is
check the validity of an ISBN, one can skip the object-oriented
interface and use the C<valid_isbn_checksum()> function which is
exportable on demand.
If the constructor decides it cannot create an object, it returns
C<undef>. It may do this if the string passed as the ISBN cannot be
munged to the internal format meaning that it does not even come close
to looking like an ISBN.
=cut
# # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #
# # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #
sub new {
my $class = shift;
my $input_data = shift;
my $common_data = _common_format $input_data;
return unless $common_data;
my $self = {
input_isbn => $input_data,
common_data => $common_data
};
my $isbn = do {
if( length( $common_data ) == 10 ) {
bless $self, 'Business::ISBN10';
}
elsif( length( $common_data ) == 13 ) {
bless $self, 'Business::ISBN13';
}
else {
return BAD_ISBN;
}
};
$self->_init( $common_data );
$self->_parse_isbn( $common_data );
return $isbn;
}
=back
=head2 Instance methods
=over 4
=item input_isbn
Returns the starting ISBN. Since you may insert hyphens or fix
checksums, you might want to see the original data.
=cut
sub input_isbn { $_[0]->{'input_isbn'} }
=item common_data
Returns the starting ISBN after normalization, which removes anything
that isn't a digit or a valid checksum character.
=cut
sub common_data { $_[0]->{'common_data'} }
=item isbn
Returns the current value of ISBN, even if it has an invalid checksum.
This is the raw data so it doesn't have the hyphens. If you want
hyphenation, try C<as_string>.
The C<isbn> method should be the same as C<as_string( [] )>.
=cut
sub isbn { $_[0]->{'isbn'} }
=item error
Return the error code for the reason the ISBN isn't valid. The return
value is a key in %ERROR_TEXT.
=cut
sub error { $_[0]->{'valid'} }
=item is_valid
Return true if the ISBN is valid, meaning that it has a valid prefix
(for ISBN-13), group code, and publisher code; and its checksum
validates.
=cut
sub is_valid { $_[0]->{'valid'} eq GOOD_ISBN }
=item type
Returns either C<ISBN10> or C<ISBN13>.
=cut
sub type { $_[0]->{'type'} }
=item prefix
Returns the prefix for the ISBN. This is currently either 978 or 979
for ISBN-13. It returns the empty string (so, a defined value) for
ISBN-10.
=cut
sub prefix { $_[0]->{'prefix'} }
sub _prefix_length { length $_[0]->{'prefix'} }
=item group_code
Returns the group code for the ISBN. This is the numerical version,
for example, '0' for the English group. The valid group codes come
from C<Business::ISBN::Data>.
=cut
sub group_code { $_[0]->{'group_code'} }
=item group
Returns the group name for the ISBN. This is the string version. For
instance, 'English' for the '0' group. The names come from
C<Business::ISBN::Data>.
=cut
sub group { $_[0]->_group_data( $_[0]->group_code )->[0] }
sub _group_code_length {
length(
defined $_[0]->{'group_code'} ? $_[0]->{'group_code'} : ''
);
}
=item publisher_code
Returns the publisher code for the ISBN. This is the numeric version,
for instance '596' for O'Reilly Media.
=cut
sub publisher_code { $_[0]->{'publisher_code'} }
sub _publisher_code_length {
length(
defined $_[0]->{'publisher_code'} ? $_[0]->{'publisher_code'} : ''
);
}
=item article_code
Returns the article code for the ISBN. This is the numeric version that
uniquely identifies the item.
=cut
sub article_code { $_[0]->{'article_code'} }
=item checksum
Returns the checksum code for the ISBN. This checksum may not be valid since
you can create an object an fix the checksum later with C<fix_checksum>.
=cut
sub checksum { $_[0]->{'checksum'} }
sub _checksum_pos { length( $_[0]->isbn ) - 1 }
=item is_valid_checksum
Returns C<Business::ISBN::GOOD_ISBN> for valid checksums and
C<Business::ISBN::BAD_CHECKSUM> otherwise. This does not guarantee
that the rest of the ISBN is actually assigned to a book.
=cut
sub is_valid_checksum {
my $self = shift;
cluck "is_valid_checksum: Didn't get object!" unless ref $self;
no warnings 'uninitialized';
return GOOD_ISBN if $self->checksum eq $self->_checksum;
return BAD_CHECKSUM;
}
=item fix_checksum
Checks the checksum and modifies the ISBN to set it correctly if needed.
=cut
sub fix_checksum {
my $self = shift;
my $last_char = substr($self->isbn, $self->_checksum_pos, 1);
my $checksum = $self->_checksum;
my $isbn = $self->isbn;
substr($isbn, $self->_checksum_pos, 1) = $checksum;
$self->_set_isbn( $isbn );
$self->_set_checksum( $checksum );
$self->_check_validity;
return 0 if $last_char eq $checksum;
return 1;
}
=item as_string(), as_string([])
Return the ISBN as a string. This function takes an
optional anonymous array (or array reference) that specifies
the placement of hyphens in the string. An empty anonymous array
produces a string with no hyphens. An empty argument list
automatically hyphenates the ISBN based on the discovered
group and publisher codes. An ISBN that is not valid may
produce strange results.
The positions specified in the passed anonymous array
are only used for one method use and do not replace
the values specified by the constructor. The method
assumes that you know what you are doing and will attempt
to use the least three positions specified. If you pass
an anonymous array of several positions, the list will
be sorted and the lowest three positions will be used.
Positions less than 1 and greater than 12 are silently
ignored.
A terminating 'x' is changed to 'X'.
=cut
sub as_string {
my $self = shift;
my $array_ref = shift;
#this allows one to override the positions settings from the
#constructor
$array_ref = $self->_hyphen_positions unless ref $array_ref eq ref [];
# print STDERR Data::Dumper->Dump( [$array_ref], [qw(array_ref)] );
# print STDERR Data::Dumper->Dump( [$self], [qw(self)] );
return unless $self->is_valid eq GOOD_ISBN;
my $isbn = $self->isbn;
foreach my $position ( sort { $b <=> $a } @$array_ref ) {
next if $position > 12 or $position < 1;
substr($isbn, $position, 0) = '-';
}
return $isbn;
}
=item as_isbn10
Returns a new ISBN object. If the object is already ISBN-10, this method
clones it. If it is an ISBN-13 with the prefix 978, it returns the ISBN-10
equivalent. For all other cases it returns undef.
=cut
sub as_isbn10 {
croak "as_isbn10() must be implemented in Business::ISBN subclass"
}
=item as_isbn13
Returns a new ISBN object. If the object is already ISBN-13, this method
clones it. If it is an ISBN-10, it returns the ISBN-13 equivalent with the
978 prefix.
=cut
sub as_isbn13 {
croak "as_isbn13() must be implemented in Business::ISBN subclass"
}
=item xisbn
In scalar context, returns an anonymous array of related ISBNs using xISBN.
In list context, returns a list.
This feature requires C<LWP::Simple>.
=cut
sub xisbn {
my $self = shift;
my $data = $self->_get_xisbn;
$data =~ tr/x/X/;
my @isbns = $data =~ m|<isbn>(.*?)</isbn>|ig;
shift @isbns;
wantarray ? @isbns : \@isbns;
}
sub _get_xisbn {
my $self = shift;
eval "use LWP::Simple";
if( $@ ) { carp "You need LWP::Simple to use xisbn()"; return; }
my $data = LWP::Simple::get( $self->_xisbn_url );
carp "Could not fetch xISBN data" unless defined $data;
return $data;
}
sub _xisbn_url {
my $self = shift;
my $isbn = $self->as_string([]);
return "http://xisbn.worldcat.org/xid/isbn/$isbn";
}
=item png_barcode
Returns image data in PNG format for the barcode for the ISBN. This
works with ISBN-10 and ISBN-13. The ISBN-10s are automaically converted
to ISBN-13.
This requires C<GD::Barcode::EAN13>.
=cut
sub png_barcode {
my $self = shift;
my $ean = $self->as_isbn13->as_string([]);
eval "use GD::Barcode::EAN13";
if( $@ )
{
carp "Need GD::Barcode::EAN13 to use png_barcode!";
return;
}
my $image = GD::Barcode::EAN13->new($ean)->plot->png;
return $image;
}
=back
=cut
sub _set_isbn { $_[0]->{'isbn'} = $_[1]; }
sub _set_is_valid { $_[0]->{'valid'} = $_[1]; }
sub _set_prefix
{
croak "_set_prefix() must be implemented in Business::ISBN subclass"
}
sub _set_group_code { $_[0]->{'group_code'} = $_[1]; }
sub _set_group_code_string { $_[0]->{'group_code_string'} = $_[1]; }
sub _set_publisher_code { $_[0]->{'publisher_code'} = $_[1]; }
sub _set_publisher_code_string { $_[0]->{'publisher_code_string'} = $_[1]; }
sub _set_article_code { $_[0]->{'article_code'} = $_[1]; }
sub _set_checksum { $_[0]->{'checksum'} = $_[1]; }
sub _set_type {
croak "_set_type() must be implemented in Business::ISBN subclass"
}
# # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #
# # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # # #
# # internal methods. you don't get to use this one.
sub _common_format {
#we want uppercase X's
my $data = uc shift;
#get rid of everything except decimal digits and X
$data =~ s/[^0-9X]//g;
return $1 if $data =~ m/
\A #anchor at start
(
(?:\d\d\d)?
\d{9}[0-9X]
)
\z #anchor at end
/x;
return;
}
sub _init {
my $self = shift;
my $common_data = shift;
my $class = ref $self =~ m/.*::(.*)/g;
$self->_set_type;
$self->_set_isbn( $common_data );
# we don't know if we have a valid group code yet
# so let's assume that we don't
$self->_set_is_valid( INVALID_GROUP_CODE );
}
{
my @methods = (
[ qw( prefix ), INVALID_PREFIX ],
[ qw( group_code ), INVALID_GROUP_CODE ],
[ qw( publisher_code ), INVALID_PUBLISHER_CODE ],
[ qw( article_code ), BAD_ISBN ],
[ qw( checksum ), BAD_CHECKSUM ],
);
sub _parse_isbn {
my $self = shift;
foreach my $pair ( @methods )
{
my( $method, $error_code ) = @$pair;
my $parser = "_parse_$method";
my $result = $self->$parser;
unless( defined $result )
{
$self->_set_is_valid( $error_code );
#print STDERR "Got bad result for $method [$$self{isbn}]\n";
return;
}
$method = "_set_$method";
$self->$method( $result );
}
$self->_set_is_valid( $self->is_valid_checksum );
return $self;
}
}
sub _parse_group_code {
my $self = shift;
my $trial; # try this to see what we get
my $group_code_length = 0;
my $count = 1;
GROUP_CODE:
while( defined( $trial= substr($self->isbn, $self->_prefix_length, $count++) ) )
{
if( defined $self->_group_data( $trial ) )
{
return $trial;
last GROUP_CODE;
}
# if we've past the point of finding a group
# code we're pretty much stuffed.
return if $count > $self->_max_group_code_length;
}
return; #failed if I got this far
}
sub _parse_publisher_code {
my $self = shift;
my $pairs = $self->_publisher_ranges;
# get the longest possible publisher code
# I'll try substrs of this to get the real one
my $longest = substr(
$self->isbn,
$self->_prefix_length + $self->_group_code_length,
$self->_max_publisher_code_length,
);
#print STDERR "Trying to parse publisher: longest [$longest]\n";
while( @$pairs ) {
my $lower = shift @$pairs;
my $upper = shift @$pairs;
my $trial = substr( $longest, 0, length $lower );
#print STDERR "Trying [$trial] with $lower <-> $upper [$$self{isbn}]\n";
# this has to be a sring comparison because there are
# possibly leading 0s
if( $trial ge $lower and $trial le $upper )
{
#print STDERR "Returning $trial\n";
return $trial;
}
}
return; #failed if I got this far
}
sub _parse_article_code {
my $self = shift;
my $head = $self->_prefix_length +
$self->_group_code_length +
$self->_publisher_code_length;
my $length = length( $self->isbn ) - $head - 1;
substr( $self->isbn, $head, $length );
}
sub _parse_checksum {
my $self = shift;
substr( $self->isbn, -1, 1 );
}
sub _check_validity {
my $self = shift;
if( $self->is_valid_checksum eq GOOD_ISBN and
defined $self->group_code and
defined $self->publisher_code and
defined $self->prefix
) {
$self->_set_is_valid( GOOD_ISBN );
return GOOD_ISBN;
}
else {
$self->_set_is_valid( INVALID_PUBLISHER_CODE )
unless defined $self->publisher_code;
$self->_set_is_valid( INVALID_GROUP_CODE )
unless defined $self->group_code;
$self->_set_is_valid( INVALID_PREFIX )
unless defined $self->prefix;
return;
}
}
sub _hyphen_positions {
croak "hyphen_positions() must be implemented in Business::ISBN subclass"
}
1;
__END__
=head1 BUGS
=head1 TO DO
* i would like to create the bar codes with the price extension
=head1 SOURCE AVAILABILITY
This source is in Github:
https://github.com/briandfoy/business--isbn
=head1 AUTHOR
brian d foy C<< <bdfoy@cpan.org> >>
=head1 COPYRIGHT AND LICENSE
Copyright (c) 2001-2013, brian d foy, All Rights Reserved.
You may redistribute this under the same terms as Perl itself.
=head1 CREDITS
Thanks to Mark W. Eichin C<< <eichin@thok.org> >> for suggestions and
discussions on EAN support.
Thanks to Andy Lester C<< <andy@petdance.com> >> for lots of bug fixes
and testing.
Ed Summers C<< <esummers@cpan.org> >> has volunteered to help with
this module.
=cut