1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
|
#!/usr/bin/env python3
# update/gs1_ai.py - script to get GS1 application identifiers
#
# Copyright (C) 2019-2023 Arthur de Jong
#
# This library is free software; you can redistribute it and/or
# modify it under the terms of the GNU Lesser General Public
# License as published by the Free Software Foundation; either
# version 2.1 of the License, or (at your option) any later version.
#
# This library is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
# Lesser General Public License for more details.
#
# You should have received a copy of the GNU Lesser General Public
# License along with this library; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
# 02110-1301 USA
"""This script downloads GS1 application identifiers from the GS1 web site."""
import datetime
import json
import re
import lxml.html
import requests
# URL of the GS1 web page that lists the application identifiers
download_url = 'https://www.gs1.org/standards/barcodes/application-identifiers'
# Value of the User-Agent header that is sent along with the download
user_agent = (
    'Mozilla/5.0 (compatible; python-stdnum updater; '
    '+https://arthurdejong.org/python-stdnum/)')
def fetch_ais():
    """Download application identifiers from the GS1 website.

    The page at ``download_url`` is fetched and the first
    ``<script type="application/ld+json">`` element in it is parsed as JSON.
    For every entry in the ``@graph`` list of that document a tuple is
    yielded with, in order: the AI, the format, the FNC1 requirement value,
    the English name and the English description.

    This is a generator, so the download only happens once iteration starts.

    Raises requests.HTTPError if the server answers with an error status.
    """
    headers = {
        'User-Agent': user_agent,
    }
    response = requests.get(download_url, headers=headers, timeout=30)
    # Fail with a clear HTTP error instead of trying to parse an error page
    # (which would otherwise surface as an unrelated IndexError below).
    response.raise_for_status()
    document = lxml.html.document_fromstring(response.content)
    element = document.findall('.//script[@type="application/ld+json"]')[0]
    for entry in json.loads(element.text)['@graph']:
        yield (
            entry['skos:prefLabel'].strip(),  # AI
            # the first three characters are dropped; presumably these are
            # the part describing the AI itself (e.g. "N2+") - TODO confirm
            entry['gs1meta:formatAIvalue'].strip()[3:],  # format
            entry['gs1meta:requiresFNC1'],  # require FNC1
            # name and description are lists of language-tagged values,
            # only the first English one is used
            [x['@value'] for x in entry['schema:name'] if x['@language'] == 'en'][0].strip(),
            [x['@value'] for x in entry['schema:description'] if x['@language'] == 'en'][0].strip())
def group_ai_ranges():
    """Collapse runs of application identifiers with equal properties.

    The tuples from fetch_ais() are sorted and walked in order. Successive
    entries for which everything except the AI itself is equal are merged
    into one range. For every range a tuple is yielded that consists of the
    first AI of the range followed by the complete last entry of the range
    (so: first AI, last AI, format, require FNC1, name, description).

    Note that when fetch_ais() produces nothing a single tuple that only
    contains None values is yielded.
    """
    range_start = None
    previous = (None, None, None, None, None)
    for current in sorted(fetch_ais()):
        if current[1:] == previous[1:]:
            # same properties as the previous entry: extend the range
            previous = current
            continue
        # properties changed: emit the finished range (if any was started)
        if range_start:
            yield (range_start,) + tuple(previous)
        range_start = current[0]
        previous = current
    # emit the range that was still open when the input ran out
    yield (range_start,) + tuple(previous)
if __name__ == '__main__':
    # Print the data file to stdout, starting with a header that records
    # where and when the information was obtained.
    print('# generated from %s' % download_url)
    # datetime.utcnow() is deprecated since Python 3.12; take an aware UTC
    # timestamp instead and drop the tzinfo so the printed format is unchanged
    now = datetime.datetime.now(datetime.timezone.utc).replace(tzinfo=None)
    print('# on %s' % now)
    for ai1, ai2, ai_format, require_fnc1, name, description in group_ai_ranges():
        # Guess the value type from the format and the description text,
        # falling back to a plain string.
        lowered = description.lower()
        _type = 'str'
        if re.match(r'^(N[68]\[?\+)?N[0-9]*[.]*[0-9]+\]?$', ai_format) and 'date' in lowered:
            _type = 'date'
        elif re.match(r'^N[.]*[0-9]+$', ai_format) and 'count' in lowered:
            _type = 'int'
        ai = ai1
        if ai1 != ai2:
            if len(ai1) == 4:
                # A range of four-digit AIs is written as its three-digit
                # prefix and typed as decimal (presumably the fourth digit
                # encodes the position of the decimal point - TODO confirm).
                ai = ai1[:3]
                _type = 'decimal'
            else:
                # any other range is written as "first-last"
                ai = '%s-%s' % (ai1, ai2)
        print('%s format="%s" type="%s"%s name="%s" description="%s"' % (
            ai, ai_format, _type,
            ' fnc1="1"' if require_fnc1 else '',
            name, description))
|