1 |
6620
|
aaronmk
|
#!/usr/bin/env python
|
2 |
|
|
# Translates a data dictionary spreadsheet to Redmine formatting
|
3 |
|
|
|
4 |
|
|
import csv
|
5 |
|
|
import re
|
6 |
|
|
import sys
|
7 |
|
|
|
8 |
|
|
# Spreadsheet format
|
9 |
|
|
# Separator between the individual source URLs listed in one spreadsheet cell;
# used both to split the sources cell and to re-join the translated sources
source_sep = ', '
|
10 |
|
|
|
11 |
|
|
##### URLs
|
12 |
|
|
|
13 |
6636
|
aaronmk
|
# Regex fragment matching one parenthesized URL comment, e.g. "(1:name)".
# The group is non-capturing so the fragment can be repeated or embedded in a
# larger pattern without adding capture groups. Nested parentheses are not
# supported: the comment ends at the first ")".
url_comment_re = r'(?:\([^)]*\))'
|
14 |
|
|
|
15 |
6620
|
aaronmk
|
def simplify_url(url):
    '''Returns url with every parenthesized comment removed.

    Each "(" up to the nearest following ")" is deleted, parentheses included.
    '''
    comment_pattern = r'\(.*?\)'
    return re.sub(comment_pattern, r'', url)
|
16 |
|
|
|
17 |
6635
|
aaronmk
|
def url_comment_text(comment):
    '''Extracts the text of a single parenthesized URL comment.

    A comment looks like "(text)" or "(N:text)". The surrounding parentheses,
    an optional leading run of digits and an optional colon are dropped.

    comment: the comment including its parentheses. A falsy value ('' or None)
        is returned unchanged.
    Returns the remaining comment text (possibly '').
    Raises ValueError if comment is not a single parenthesized comment.
    '''
    if not comment: return comment

    match = re.match(r'^\(\d*:?(.*?)\)$', comment)
    # Raise explicitly instead of asserting: asserts are stripped under -O,
    # which would turn a malformed comment into an AttributeError on None
    if match is None:
        raise ValueError('Not a parenthesized URL comment: '+repr(comment))
    return match.group(1)
|
24 |
|
|
|
25 |
6620
|
aaronmk
|
def url_term(url):
    '''Prefixes any provider in the URL to the term name, to create a namespace.
    Each hierarchical component of the provider is stored in a URL comment.

    The provider components are the comments at the very start of the URL. The
    term name is the longest trailing run of word characters, ":" and "-".
    Components whose text is empty are skipped.

    Example: '(1:TDWG)(2:DwC)http://host/terms/name' -> 'TDWG:DwC:name'

    url: the source URL, optionally starting with parenthesized comments.
    Returns the provider components and the term name joined with ":".
    Raises ValueError if the URL does not end in a term name.
    '''
    match = re.match(r'^('+url_comment_re+r'*).*?([\w:-]+)$', url)
    # Raise explicitly instead of asserting: asserts are stripped under -O
    if match is None:
        raise ValueError('Cannot find a term name in URL: '+repr(url))
    provider_str, term = match.groups()

    # Build a real list: on Python 3 filter() returns an iterator, which
    # cannot be concatenated with a list
    texts = [url_comment_text(comment)
        for comment in re.findall(url_comment_re, provider_str)]
    provider = [text for text in texts if text]

    return ':'.join(provider+[term])
|
36 |
6620
|
aaronmk
|
|
37 |
|
|
##### Redmine
|
38 |
|
|
|
39 |
6632
|
aaronmk
|
def redmine_bold(text):
    '''Returns text wrapped in "*" on both sides (Redmine bold markup)'''
    marker = '*'
    return marker + text + marker
|
40 |
|
|
|
41 |
6620
|
aaronmk
|
def redmine_url(text, url):
    '''Formats text as a Redmine link pointing to url.

    text: the link label. It is not escaped.
    url: the link target. When falsy ('' or None), no link is created.
    Returns '"text":url', or just text when there is no url.
    '''
    if not url: return text
    return '"'+text+'":'+url
|
44 |
|
|
|
45 |
|
|
def source2redmine_url(url):
    '''Formats a source URL as a Redmine link labeled with its namespaced term.

    The label comes from url_term(url) and the link target is the URL with its
    comments removed by simplify_url().

    url: the source URL, optionally containing parenthesized comments.
    Returns the Redmine link, or '' when url is falsy ('' or None).
    '''
    if not url: return ''
    return redmine_url(url_term(url), simplify_url(url))
|
48 |
6620
|
aaronmk
|
|
49 |
|
|
class RedmineTableWriter:
    '''Formats rows as a Redmine table'''

    def __init__(self, stream):
        '''stream: object with a write() method that receives the output'''
        self.stream = stream

    def writerow(self, row):
        '''Writes one table row as "|cell|cell|...|" followed by a newline.

        row: iterable of strings, one per cell. Cells are written as-is,
            without escaping. An empty row is written as "|".
        '''
        # The empty strings at both ends make join() emit the leading and
        # trailing "|". list() lets any iterable of cells be passed, not just
        # a list.
        cells = ['']+list(row)+['']
        self.stream.write('|'.join(cells)+'\n')
|
57 |
|
|
|
58 |
6673
|
aaronmk
|
class RedmineDictWriter:
    '''Formats rows as Redmine sections containing a table'''

    def __init__(self, term_col, header, stream):
        '''
        term_col: index of the column whose value becomes the section heading
        header: list of column names, including the term column
        stream: object with a write() method that receives the output
        '''
        # Work on a copy so the caller's header list is not modified
        header = list(header)
        header.pop(term_col) # the term is the heading, not a table row

        self.term_col = term_col
        self.header = header
        self.stream = stream

    def writerow(self, row):
        '''Writes one spreadsheet row as an "h3." section followed by a table.

        The value in the term column becomes the heading. Every other column
        becomes one table row of the form |*column name*|value|.

        row: list of strings, in the same column order as the header passed to
            the constructor. Raises IndexError if it has fewer columns.
        '''
        # Work on a copy so the caller's row is not modified
        row = list(row)
        term = row.pop(self.term_col)
        self.stream.write('\nh3. '+term+'\n\n')

        table = RedmineTableWriter(self.stream)
        # With the term column removed from both, header and row line up again
        for i, col_name in enumerate(self.header):
            table.writerow([redmine_bold(col_name), row[i]])
|
75 |
6620
|
aaronmk
|
|
76 |
6673
|
aaronmk
|
|
77 |
6620
|
aaronmk
|
def main():
    '''Translates the CSV spreadsheet on stdin to Redmine markup on stdout.

    Command line: <spreadsheet term_col# sources_col# >redmine
    Both column numbers are 0-based indexes into each CSV row. The first CSV
    row is the header. For every following row, the term cell becomes a link to
    the first source and each entry of the sources cell becomes a link.

    Exits with a usage message if the arguments are missing or not integers.
    '''
    try:
        _prog_name, term_col, sources_col = sys.argv
        # Converted inside the try so non-integer arguments also print the
        # usage message instead of a traceback
        term_col, sources_col = int(term_col), int(sources_col)
    except ValueError: raise SystemExit('Usage: '+sys.argv[0]
        +' <spreadsheet term_col# sources_col# >redmine')

    # Translate input
    reader = csv.reader(sys.stdin)
    # next() works on both Python 2.6+ and 3, unlike reader.next()
    header = next(reader, None)
    if header is None: return # empty input: nothing to translate
    writer = RedmineDictWriter(term_col, header, sys.stdout)
    for row in reader:
        if not row: continue # csv.reader yields [] for blank lines

        term = row[term_col]
        sources = row[sources_col].split(source_sep)

        # The term links to its first source, with URL comments stripped
        row[term_col] = redmine_url(term, simplify_url(sources[0]))
        row[sources_col] = source_sep.join(map(source2redmine_url, sources))

        writer.writerow(row)
|
95 |
6620
|
aaronmk
|
|
96 |
|
|
# Script entry point. There is no __name__ guard, so this runs whenever the
# file is executed or imported.
main()
|