summaryrefslogtreecommitdiffstats
path: root/versification/v11nmax.py
blob: 99b2e204647eb54d0952a715cff32555cca524ec (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
#!/usr/bin/env python

import re, sys
from collections import Counter
import datetime

# A v11n name and at least one canon file are required; otherwise show the
# usage text and stop.
if len(sys.argv) < 3:
    usageLines = [
        'Usage: ' + sys.argv[0] + ' <v11n name> <canon.h-style file(s)>',
        '',
        'This utility takes a number of canon_*.h-style v11n definitions and',
        '  combines them into a single larger v11n system that maximizes the',
        '  chapters-per-book and verses-per-chapter present within its',
        '  constituent v11ns. Book order is determined by the order in which',
        '  the script encounters each Bible book.',
        '',
        'For example, to create the versification system "Max" from the',
        '  files contained in the directory ./canon, you might invoke:',
        '      ' + sys.argv[0] + ' Max ./canon/canon*.h',
        '',
    ]
    # Written through sys.stdout rather than the print statement so the same
    # bytes are produced whether or not print is a function.
    sys.stdout.write('\n'.join(usageLines) + '\n')
    # sys.exit() instead of the site-provided exit() helper, which is not
    # guaranteed to be installed; the exit status is unchanged.
    sys.exit()

# Command line: the name of the combined system, then the input canon files.
v11n, files = sys.argv[1], sys.argv[2:]

# State accumulated across every input file.
bookName = {}      # book id -> book name, from the first file listing the book
OTbookList = []    # book ids first seen in an otbooks[] table, in that order
NTbookList = []    # book ids first seen in an ntbooks[] table, in that order
bible = {}         # book id -> Counter of chapter number -> max verse count

# Patterns for the parts of a canon_*.h file that matter here.
#
# This is not robust. It assumes that [on]tbooks[] precedes vm[] and
# that all of the verse counts in vm[] are part of books listed in
# [on]tbooks[]. In general, it assumes canon files that look like what
# we include in the library and generate from v11nsys.pl.
commentRe = re.compile(r'//.*')
otBooksRe = re.compile(r'struct sbook otbooks.*?\[\]')
ntBooksRe = re.compile(r'struct sbook ntbooks.*?\[\]')
vmRe = re.compile(r'int vm.*?\[\]')
endRe = re.compile(r'};')
bookRe = re.compile(r'{"(.+?)", "(.+?)", ".+?", (\d+)},')
countRe = re.compile(r'(\d+),?')

for fn in files:
    # Read the whole file and release the handle straight away.
    with open(fn) as canonFile:
        canonLines = canonFile.readlines()

    # Which array the parser is currently inside: None, 'ot', 'nt' or 'vm'.
    section = None

    vmArray = []            # every verse count of this file, in file order
    localOTbookList = []    # (book id, chapter count) pairs of this file
    localNTbookList = []

    for line in canonLines:
        # Drop // comments and trailing whitespace; skip what is left empty.
        line = commentRe.sub('', line).rstrip()
        if not line:
            continue

        if otBooksRe.search(line):
            section = 'ot'
        elif ntBooksRe.search(line):
            section = 'nt'
        elif vmRe.search(line):
            section = 'vm'
        elif section and endRe.search(line):
            section = None
        elif section in ('ot', 'nt'):
            match = bookRe.search(line)
            if match:
                name = match.group(1)
                bookId = match.group(2)
                chapterCount = int(match.group(3))
                # A book keeps the name and testament of the first file that
                # mentions it; bible gains a key exactly when a book is
                # registered, so it doubles as the "already seen" set.
                if bookId not in bible:
                    if section == 'ot':
                        OTbookList.append(bookId)
                    else:
                        NTbookList.append(bookId)
                    bookName[bookId] = name
                    bible[bookId] = Counter()
                if section == 'ot':
                    localOTbookList.append((bookId, chapterCount))
                else:
                    localNTbookList.append((bookId, chapterCount))
        elif section == 'vm':
            vmArray.extend(int(n) for n in countRe.findall(line))

    # Hand the flat vm[] counts out to this file's books in table order.
    offset = 0
    for book, chapters in localOTbookList + localNTbookList:
        verseCounts = vmArray[offset:offset + chapters]
        if len(verseCounts) < chapters:
            raise IndexError(fn + ': vm[] has too few verse counts for ' + book)
        offset += chapters
        for chapter, verses in enumerate(verseCounts, 1):
            # update the master dictionary with the max of its current value
            # and the verse count for that chapter in the current v11n
            bible[book][chapter] = max(bible[book][chapter], verses)
            

# Write the combined versification to canon_<name>.h in the current
# directory, in the same layout as the canon files read above.
v11nLower = v11n.lower()
v11nUpper = v11n.upper()
bannerRule = '/******************************************************************************\n'

# The with-statement guarantees the header file is flushed and closed even
# if one of the writes fails.
with open('canon_' + v11nLower + '.h', 'w') as canonMax:
    # print header stuff
    canonMax.writelines([
        bannerRule,
        ' *\n',
        ' *  canon_' + v11nLower + '.h - Versification data for the ' + v11n + ' system\n',
        ' *\n',
        ' * $Id$\n',
        ' *\n',
        ' * Copyright ' + str(datetime.date.today().year) + ' CrossWire Bible Society (http://www.crosswire.org)\n',
        ' *\tCrossWire Bible Society\n',
        ' *\tP. O. Box 2528\n',
        ' *\tTempe, AZ  85280-2528\n',
        ' *\n',
        ' * This program is free software; you can redistribute it and/or modify it\n',
        ' * under the terms of the GNU General Public License as published by the\n',
        ' * Free Software Foundation version 2.\n',
        ' *\n',
        ' * This program is distributed in the hope that it will be useful, but\n',
        ' * WITHOUT ANY WARRANTY; without even the implied warranty of\n',
        ' * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU\n',
        ' * General Public License for more details.\n',
        ' */\n',
        '\n',
        '#ifndef CANON_' + v11nUpper + '_H\n',
        '#define CANON_' + v11nUpper + '_H\n',
        '\n',
        'SWORD_NAMESPACE_START\n',
        '\n',
        '\n',
        '// Versification system: ' + v11n + '\n',
        '// Book order: ' + ' '.join(OTbookList + NTbookList) + '\n',
        '\n',
        '\n',
    ])

    # print otbooks and ntbooks
    canonMax.writelines([
        bannerRule,
        ' * [on]tbooks_' + v11nLower + ' - initialize static instance for all canonical\n',
        ' *\t\t text names and chapmax\n',
        ' */\n',
    ])

    # Both testaments share one table layout; an empty testament is omitted.
    for testament, bookList in (('ot', OTbookList), ('nt', NTbookList)):
        if not bookList:
            continue
        canonMax.write('struct sbook ' + testament + 'books_' + v11nLower + '[] = {\n')
        for book in bookList:
            # The chapter count is the number of chapters recorded for the book.
            canonMax.write('  {"' + bookName[book] + '", "' + book + '", "' + book + '", ' + str(len(bible[book])) + '},\n')
        canonMax.write('  {"", "", "", 0}\n')
        canonMax.write('};\n')
        canonMax.write('\n')

    # print vm
    canonMax.writelines([
        bannerRule,
        ' *\tMaximum verses per chapter\n',
        ' */\n',
    ])
    canonMax.write('int vm_' + v11nLower + '[] = {\n')

    for book in OTbookList + NTbookList:
        canonMax.write('  // ' + bookName[book] + '\n')
        chapterTotal = len(bible[book])
        verseCountString = ', '.join(
            str(bible[book][ch]) for ch in range(1, chapterTotal + 1))
        # Break the list after every tenth count so rows stay short.
        verseCountString = re.sub(r'(([0-9]+, ){9}[0-9]+,) ', r'\1\n  ', verseCountString)
        canonMax.write('  ' + verseCountString + ',\n')

    canonMax.write('};\n')
    canonMax.write('\n')

    # print footer stuff
    canonMax.write('SWORD_NAMESPACE_END\n')
    canonMax.write('#endif\n')