[sword-svn] r524 - trunk/versification
greg.hellings at crosswire.org
greg.hellings at crosswire.org
Wed Apr 4 19:29:48 MST 2018
Author: greg.hellings
Date: 2018-04-04 19:29:48 -0700 (Wed, 04 Apr 2018)
New Revision: 524
Modified:
trunk/versification/av11n.py
Log:
Use argparser.
Modified: trunk/versification/av11n.py
===================================================================
--- trunk/versification/av11n.py 2018-04-05 02:29:41 UTC (rev 523)
+++ trunk/versification/av11n.py 2018-04-05 02:29:48 UTC (rev 524)
@@ -9,12 +9,15 @@
# special as for ordering.
#
# Invoke simply by calling the program and the file name.
+import argparse
import io
import logging
# in normal state level should be debug.WARNING, debug.INFO and debug.DEBUG
# give additional information.
-logging.basicConfig(format='%(levelname)s:%(funcName)s:%(message)s',
- level=logging.WARNING)
+logging.basicConfig(format='%(levelname)s:%(message)s',
+ level=logging.INFO)
+log = logging.getLogger('versification')
+
import re
import sys
try:
@@ -22,40 +25,54 @@
except ImportError:
import xml.etree.ElementTree as ET
-VERSEID_RE = re.compile(r'^.+\..+\..+$')
+OSIS_NS = 'http://www.bibletechnologies.net/2003/OSIS/namespace'
+VERSEID_RE = re.compile(r'^(.+\.\d+\.\d+).*$')
# Inform the user that we need the SWORD extension
try:
import Sword
except ImportError:
- logging.exception(
+ log.exception(
"You do not have the SWORD library installed. Please install it.")
sys.exit(1)
-# Without the name of a file, we cannot proceed any further
-if len(sys.argv) < 2 or sys.argv[1] == '--help':
- print >>sys.stderr, "Usage: %s <OSISfile>" % sys.argv[0]
- sys.exit(1)
+arg_parser = argparse.ArgumentParser(
+ description='Compare OSIS file with available v11ns.')
+arg_parser.add_argument('--verbose', '-v', action='count')
+arg_parser.add_argument('filename', nargs=1)
+
+
+args = arg_parser.parse_args()
+
+if args.verbose:
+ log.setLevel = logging.DEBUG
+
+log.debug('args = %s', args)
+
# Open the file
-logging.debug('Opening %s' % (sys.argv[1],))
+log.debug('Opening %s' % args.filename[0])
-tree = ET.parse(io.open(sys.argv[1], encoding='utf8')).getroot()
+tree = ET.parse(io.open(args.filename[0], encoding='utf8')).getroot()
# Get the list of versifications
-logging.debug('Fetching a list of v11ns')
+log.debug('Fetching a list of v11ns')
vmgr = Sword.VersificationMgr.getSystemVersificationMgr()
av11ns = vmgr.getVersificationSystems()
+log.debug('av11ns = %s', av11ns)
# Get the list of all osisIDs
-logging.debug('Fetching a list of OSIS IDs')
+log.debug('Fetching a list of OSIS IDs')
ids = set()
-for item in tree.iter():
+for item in tree.iter('{%s}verse' % OSIS_NS):
if 'osisID' in item.attrib:
- ids.add(item.attrib['osisID'])
+ ids.add(item.attrib['osisID'].split('!')[0])
+log.debug('ids = len(%d)', len(ids))
# Iterate each versification scheme
for v11n in av11ns:
- print('Checking %s' % v11n.c_str())
+ v11n_name = v11n.c_str()
+ print('\nChecking %s:\n%s' %
+ (v11n_name, (len(v11n_name) + 10) * '-'))
# Construct a list of the IDs in this versification
key = Sword.VerseKey()
key.setVersificationSystem(v11n.c_str())
@@ -85,36 +102,42 @@
inNT = False
# Now iterate the ones we have in this file
for osisid in ids:
- logging.debug('Checking key %s', osisid)
+# log.debug('Checking key %s', osisid)
if osisid in otkeyList:
otkeyList.remove(osisid)
elif osisid in ntkeyList:
ntkeyList.remove(osisid)
inNT = True
- elif VERSEID_RE.match(osisid) and inNT:
- ntextraKeys.append(osisid)
- elif VERSEID_RE.match(osisid) and not inNT:
- otextraKeys.append(osisid)
- # Ignore it if not VERSEID_RE.match()
+ else:
+ verse_match = VERSEID_RE.match(osisid)
+ if verse_match and inNT:
+ ntextraKeys.append(verse_match.group(1))
+ elif verse_match and not inNT:
+ otextraKeys.append(verse_match.group(1))
+ # Ignore it if not VERSEID_RE.match()
# Now let's see what is left over
# Sets in Python cannot be ordered
keyList = list(otkeyList.union(ntkeyList))
keyList.sort()
if len(keyList) > 0:
- logging.info('\tThe following IDs don’t appear in your file:\n%s',
- str("\n".join(keyList)))
+ if len(keyList) < 100:
+ log.info('\tThe following IDs don’t appear in your file:\n%s',
+ str(", ".join(keyList)))
print ('\tThere are %d OT IDs and %d NT IDs ' +
- 'in v11n which arn’t in your file.') \
+ 'in v11n which aren’t in your file.') \
% (len(otkeyList), len(ntkeyList))
else:
print '\tYour file has all the references in this v11n'
# Now let's see if you had extra
if len(otextraKeys + ntextraKeys) > 0:
- logging.info(
- '\tThe following IDs don’t appear in v11n:\n%s',
- str("\n".join(keyList)))
+ # It doesn't make sense to print out lists longer than 100
+ # they cannot be read anyway
+ if len(keyList) < 100:
+ log.info(
+ '\tThe following IDs don’t appear in v11n:\n%s',
+ str(", ".join(keyList)))
print ('\tThere are %d OT IDs and %d NT IDs ' +
'in your file which don’t appear in v11n.') \
% (len(otextraKeys), len(ntextraKeys))
More information about the sword-cvs
mailing list