1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
|
# isbn.py - functions for handling ISBNs
#
# Copyright (C) 2010-2017 Arthur de Jong
#
# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
#
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
# 02110-1301 USA
"""ISBN (International Standard Book Number).
The ISBN is the International Standard Book Number, used to identify books
and similar publications. Numbers can either have 10 digits (in ISBN-10
format) or 13 digits (in ISBN-13, EAN compatible format).
An ISBN has the following components:
* 3-digit (only in ISBN-13) Bookland code
* 1 to 5-digit group identifier (identifies country or language)
* 1 to 7-digit publisher code
* 1 to 8-digit item number (identifies the book)
* a check digit
More information:
* https://en.wikipedia.org/wiki/International_Standard_Book_Number
* https://www.isbn-international.org/range_file_generation
This module also offers functions for converting to ISBN-13 and formatting
based on how the number should be split into a bookland code, group
identifier, publisher code, item number and check digit.
>>> validate('978-9024538270')
'9789024538270'
>>> validate('978-9024538271')
Traceback (most recent call last):
...
InvalidChecksum: ...
>>> compact('1-85798-218-5')
'1857982185'
>>> format('9780471117094')
'978-0-471-11709-4'
>>> format('1857982185')
'1-85798-218-5'
>>> isbn_type('1-85798-218-5')
'ISBN10'
>>> isbn_type('978-0-471-11709-4')
'ISBN13'
>>> to_isbn13('1-85798-218-5')
'978-1-85798-218-3'
>>> to_isbn10('978-1-85798-218-3')
'1-85798-218-5'
"""
from stdnum import ean
from stdnum.exceptions import *
from stdnum.util import clean
def compact(number, convert=False):
    """Return the ISBN in its minimal representation.

    The number is handed to clean() together with the separator characters
    (space and dash), after which surrounding whitespace is stripped and the
    result is upper-cased. A result of 9 characters is padded on the left
    with a '0' to make it 10 characters long. If the convert parameter is
    True the result is additionally passed through to_isbn13()."""
    minimal = clean(number, ' -').strip().upper()
    if len(minimal) == 9:
        # 9-character numbers are treated as 10-digit ones that are
        # missing their leading zero
        minimal = '0' + minimal
    return to_isbn13(minimal) if convert else minimal
def _calc_isbn10_check_digit(number):
    """Return the ISBN-10 check digit for the given string of digits.

    The number passed should not include the check digit itself. Every digit
    is multiplied by its 1-based position and the sum is taken modulo 11; a
    remainder of 10 is represented by the character 'X'."""
    total = 0
    for weight, digit in enumerate(number, 1):
        total += weight * int(digit)
    remainder = total % 11
    if remainder == 10:
        return 'X'
    return str(remainder)
def validate(number, convert=False):
    """Validate the ISBN and return it in compact form.

    Both legacy 10-digit and 13-digit numbers are accepted. Only the format,
    the length, the check digit and (for 13-digit numbers) the 978/979
    prefix are verified; the group and publisher are not checked (use
    split() for that). If the convert parameter is True the validated
    number is returned in ISBN-13 format.

    Raises InvalidFormat if anything but the last character is a non-digit,
    InvalidLength if the compact number is not 10 or 13 characters long,
    InvalidChecksum if the ISBN-10 check digit does not match and
    InvalidComponent if a 13-digit number does not start with 978 or 979.
    13-digit numbers are also passed to ean.validate()."""
    number = compact(number, convert=False)
    length = len(number)
    # the last character may be an 'X' so only the part before it is tested
    if not number[:-1].isdigit():
        raise InvalidFormat()
    if length not in (10, 13):
        raise InvalidLength()
    if length == 10:
        expected = _calc_isbn10_check_digit(number[:-1])
        if expected != number[-1]:
            raise InvalidChecksum()
    else:
        ean.validate(number)
        if not number.startswith(('978', '979')):
            raise InvalidComponent()
    return to_isbn13(number) if convert else number
def isbn_type(number):
    """Determine which kind of ISBN was passed.

    Returns 'ISBN10' or 'ISBN13' for numbers accepted by validate() and
    None for numbers that fail validation."""
    try:
        validated = validate(number, convert=False)
    except ValidationError:
        return None
    # validate() only lets numbers of length 10 or 13 through
    return 'ISBN10' if len(validated) == 10 else 'ISBN13'
def is_valid(number):
    """Return whether the number is a valid ISBN.

    This is the non-raising counterpart of validate(): it returns False when
    validate() raises a ValidationError. As with validate(), the group and
    publisher are not checked (use split() for that)."""
    try:
        validated = validate(number)
    except ValidationError:
        return False
    return bool(validated)
def to_isbn13(number):
    """Convert the number to ISBN-13 format.

    The number may be passed with or without separators; the separator
    style found in the number (space or dash) is also used to attach the
    '978' prefix. Numbers that are already 13 digits long are returned
    unchanged (apart from stripping surrounding whitespace). Numbers of 9
    digits are first padded with a leading zero to 10 digits.

    The number is not validated here; the old check digit is simply replaced
    by the one returned by ean.calc_check_digit() for the prefixed number."""
    number = number.strip()
    min_number = clean(number, ' -')
    if len(min_number) == 13:
        return number  # nothing to do, already ISBN-13
    if len(min_number) == 9:
        # convert from 9 to 10 digits; the compact form has to be padded as
        # well because the check digit below is calculated from it
        number = '0' + number
        min_number = '0' + min_number
    # put new check digit in place
    number = number[:-1] + ean.calc_check_digit('978' + min_number[:-1])
    # add prefix using the same separator as the rest of the number
    if ' ' in number:
        return '978 ' + number
    elif '-' in number:
        return '978-' + number
    else:
        return '978' + number
def to_isbn10(number):
    """Convert the number to ISBN-10 format.

    Numbers whose compact form is 10 characters long are returned unchanged
    (apart from stripping surrounding whitespace). Other numbers must be a
    valid ISBN-13 starting with 978; the prefix is removed and the check
    digit is recalculated. The separator style found in the number (space
    or dash) is kept.

    Raises InvalidFormat if the number is not a valid ISBN-13 and
    InvalidComponent if it does not start with 978."""
    number = number.strip()
    min_number = compact(number, convert=False)
    if len(min_number) == 10:
        return number  # nothing to do, already ISBN-10
    if isbn_type(min_number) != 'ISBN13':
        raise InvalidFormat('Not a valid ISBN13.')
    if not number.startswith('978'):
        raise InvalidComponent('Does not use 978 Bookland prefix.')
    # the ISBN-10 check digit is calculated over the digits between the
    # prefix and the old check digit
    check = _calc_isbn10_check_digit(min_number[3:-1])
    # drop the prefix and old check digit plus any separators left dangling
    body = number[3:-1].strip().strip('-')
    # append the new check digit with the separator in use (space first)
    for sep in (' ', '-'):
        if sep in body:
            return body + sep + check
    return body + check
def split(number, convert=False):
    """Split the ISBN into its components.

    Returns a 5-tuple of EAN.UCC prefix, group prefix, registrant, item
    number and check digit. Components that could not be determined are
    returned as empty strings. For numbers in ISBN-10 format the returned
    EAN.UCC prefix is empty (the lookup itself is done with a '978' prefix).
    If the convert parameter is True the number is converted to ISBN-13
    format first."""
    from stdnum import numdb
    number = compact(number, convert)
    # ISBN-10 numbers are looked up as if they had the 978 prefix
    is_isbn10 = len(number) == 10
    if is_isbn10:
        number = '978' + number
    # look up everything but the check digit
    parts = numdb.get('isbn').split(number[:-1])
    # the last part is always the item number, whatever else was found
    itemnr = parts.pop() if parts else ''
    # the remaining parts are in order; pad with empty strings if missing
    leading = list(parts) + ['', '', '']
    prefix, group, publisher = leading[:3]
    if is_isbn10:
        prefix = ''
    return (prefix, group, publisher, itemnr, number[-1])
def format(number, separator='-', convert=False):
    """Reformat the number to the standard presentation format.

    The non-empty components returned by split() (EAN.UCC prefix if any,
    group prefix, registrant, item number and check digit) are joined with
    the specified separator. Passing an empty separator should give the same
    result as compact(), though less efficiently. If the convert parameter
    is True the number is converted to ISBN-13 format first."""
    components = split(number, convert)
    # filter(None, ...) drops the components that came back empty
    return separator.join(filter(None, components))
|