3 import urllib, re, sys, optparse, os.path, datetime
4 import sqlite3 as dbapi2
# Base URL of the Launchpad blueprints site; blueprint paths scraped from
# the listing pages are appended to this.
blueprints_base_url = 'https://blueprints.launchpad.net'

# Work item states the tracker accepts; get_workitems() reports any other
# state as an error.
valid_states = set(['todo', 'done', 'postponed'])
def get_db(dbpath):
    '''Open/initialize database.

    This creates the database, and the work_items table in it, if they do
    not exist yet.

    dbpath: path of the SQLite database file.

    Return the open database connection.
    '''
    db = dbapi2.connect(dbpath)

    # IF NOT EXISTS rather than testing for the file on disk: this also
    # initializes a pre-created empty file and is a no-op on a database
    # that already has the table
    cur = db.cursor()
    cur.execute('''CREATE TABLE IF NOT EXISTS work_items (
        blueprint VARCHAR(255) NOT NULL,
        workitem VARCHAR(255) NOT NULL,
        status VARCHAR(20) NOT NULL,
        date TIMESTAMP NOT NULL)''')
    db.commit()

    return db
def parse_argv():
    '''Parse CLI arguments.

    A database path is always required. A release name and a blueprint
    name pattern are required only in import mode, i. e. when none of
    --dump, --text or --csv is given. Missing options are reported through
    optparse's error(), which exits the program.

    Return (options, args) tuple.
    '''
    optparser = optparse.OptionParser()
    optparser.add_option('-d', '--database',
        help='Path to database', dest='database', metavar='PATH')
    optparser.add_option('-r', '--release',
        help='Release name', dest='release')
    optparser.add_option('-p', '--pattern', metavar='REGEX',
        help='Regex pattern for blueprint name', dest='pattern')
    optparser.add_option('-D', '--dump', action='store_true', default=False,
        help='Dump database', dest='dump')
    optparser.add_option('-t', '--text', action='store_true', default=False,
        help='Print work item summary in text format', dest='text')
    # help text used to be a copy of the --text one
    optparser.add_option('-c', '--csv', action='store_true', default=False,
        help='Print work item summary in CSV format', dest='csv')
    optparser.add_option('--from', metavar='YYYY-MM-DD',
        help='Generate CSV data from this day on', dest='from_date')
    optparser.add_option('--to', metavar='YYYY-MM-DD',
        help='Generate CSV data until this day', dest='to_date')

    (opts, args) = optparser.parse_args()

    if not opts.database:
        optparser.error('No database given')
    # release and pattern are only needed for importing from Launchpad
    if not opts.dump and not opts.text and not opts.csv:
        if not opts.release:
            optparser.error('No release given')
        if not opts.pattern:
            optparser.error('No pattern given')

    return (opts, args)
def get_blueprints(url, name_pattern):
    '''Return a list of blueprint URLs for the current release.

    url: address of the page that lists the release's blueprints.
    name_pattern: regular expression that blueprint names have to start
        with; it is interpolated into the link regex unescaped.

    The page is scanned line by line; at most one blueprint link is picked
    up per line.
    '''
    blueprint_name_filter = re.compile(
        r'href="(/ubuntu/\+spec/%s[^"]+)"' % name_pattern)

    result = []
    page = urllib.urlopen(url)
    try:
        for line in page:
            m = blueprint_name_filter.search(line)
            if m:
                # links on the page are site-relative
                result.append(blueprints_base_url + m.group(1))
    finally:
        page.close()

    return result
def get_workitems(blueprint_url):
    '''Collect work items from a particular blueprint URL.

    The page is scanned for a "Work items:" line; every following line of
    the form "description: state" is a work item, up to the first empty
    line or the end of the paragraph. Malformed lines and states which are
    not in valid_states are reported on stderr and skipped.

    This will return a list of ('item', 'status') pairs.
    '''
    work_items_re = re.compile(r'(<p>|^)work items:\s*<br />', re.I)

    found_workitems = False
    result = []
    page = urllib.urlopen(blueprint_url)
    try:
        for l in page:
            if not found_workitems:
                # still looking for the start of the work item list
                if work_items_re.search(l):
                    found_workitems = True
                continue

            l = l.replace('<br />', '').replace('</div>', '').strip()

            # ends with empty line
            if l.endswith('</p>') or not l:
                break

            # split at the last colon, the description may contain colons
            try:
                (desc, state) = l.rsplit(':', 1)
            except ValueError:
                sys.stderr.write('ERROR: invalid work item format: ' + l + '\n')
                continue

            state = state.strip().lower()
            # NOTE(review): the original may have mapped some states here
            # (e. g. a default for an empty one) -- confirm against upstream

            if state not in valid_states:
                sys.stderr.write(
                    'ERROR: invalid state "%s" for work item "%s"\n' % (
                    state, desc))
                continue

            result.append((desc, state))
    finally:
        page.close()

    return result
def dump(db):
    '''Dump database contents.

    Print one line per work_items record to stdout, in the form
    "date [blueprint]<TAB>workitem: status".
    '''
    cur = db.cursor()
    # name the columns so that the unpacking below does not depend on the
    # column order of the table
    cur.execute('SELECT blueprint, workitem, status, date FROM work_items')
    for (blueprint, workitem, status, date) in cur:
        print('%s [%s]\t%s: %s' % (date, blueprint, workitem, status))
def add_work_item(db, blueprint, item, status):
    '''Add work item to database.

    db: open database connection.
    blueprint: name of the blueprint the item belongs to.
    item: work item description.
    status: work item state.

    The record is stamped with SQLite's current date. This does not commit;
    the caller has to call db.commit().
    '''
    cur = db.cursor()
    # explicit column list, so the values cannot end up in the wrong
    # columns if the table layout differs from the CREATE TABLE order
    cur.execute('INSERT INTO work_items (blueprint, workitem, status, date) '
                'VALUES (?, ?, ?, date(CURRENT_TIMESTAMP))',
                (blueprint, item, status))
def import_lp(db, name_pattern, release):
    '''Collect blueprint work items from Launchpad into DB.

    db: open database connection.
    name_pattern: regular expression for the blueprint names to consider.
    release: name of the release whose blueprint list is read.

    Every work item of every matching blueprint is added as a new record
    and the result is committed. Blueprints without any work items are
    reported on stderr.
    '''
    # use the release argument, not the global command line options; also,
    # only a single slash between host and path
    blueprints = get_blueprints('%s/ubuntu/%s/+specs' % (blueprints_base_url,
        release), name_pattern)

    for bp in blueprints:
        # last URL component is the blueprint name
        bpname = bp.split('/')[-1]
        work_items = get_workitems(bp)
        if not work_items:
            sys.stderr.write('WARNING: %s has no work items\n' % bpname)
        for (item, status) in work_items:
            add_work_item(db, bpname, item, status)

    # add_work_item() only executes the INSERTs
    db.commit()
def workitems_over_time(db, states=None):
    '''Calculate work item development over time.

    db: open database connection.
    states: iterable of the states to count; defaults to valid_states.

    Return date -> state -> count mapping. A state without any work items
    on a date has no entry in that date's mapping.
    '''
    if states is None:
        states = valid_states

    data = {}
    cur = db.cursor()
    for s in states:
        cur.execute('SELECT date, count(*) FROM work_items '
                    'WHERE status=? GROUP BY date', (s,))
        # read all rows before the cursor is reused for the next state
        for (date, num) in cur.fetchall():
            data.setdefault(date, {})[s] = num

    return data
def blueprint_status(db):
    '''Determine current blueprint status.

    "Current" means the records of the most recent date in the database.

    Return blueprint -> [todo, done, postponed] mapping. An empty database
    gives an empty mapping.
    '''
    cur = db.cursor()

    # last date
    cur.execute('SELECT max(date) FROM work_items')
    (last_date,) = cur.fetchone()

    data = {}
    # Fixed tuple instead of the valid_states set: the list positions have
    # to follow the documented order, and a set has no defined order.
    for (index, s) in enumerate(('todo', 'done', 'postponed')):
        cur.execute('SELECT blueprint, count(workitem) FROM work_items '
                    'WHERE status = ? AND date = ? GROUP BY blueprint',
                    (s, last_date))
        for (bp, num) in cur.fetchall():
            data.setdefault(bp, [0, 0, 0])[index] = num

    return data
def text(db):
    '''Print work item status as text.

    Prints the per-date state counts first, followed by the completion
    ratio of every blueprint. Postponed items count as completed.
    '''
    data = workitems_over_time(db)

    # NOTE(review): header and per-date line format are inferred; confirm
    # against upstream
    print('History:')
    for d in sorted(data.keys()):
        print('%s %s' % (d, data[d]))

    print('\nBlueprint status:')
    data = blueprint_status(db)
    # sorted, so that the output order is stable between runs
    for (bp, (todo, done, postponed)) in sorted(data.items()):
        completed = postponed + done
        total = todo + done + postponed
        # + 0.5 rounds to the nearest full percent
        print('%s: %i/%i (%i%%)' % (bp, completed, total,
            int(float(completed)/total*100 + 0.5)))
def csv(db, from_date, to_date):
    '''Print work item status as csv.

    db: open database connection.
    from_date: first day to print as 'YYYY-MM-DD' string; if empty or None,
        start at the first date in the database.
    to_date: last day to print as 'YYYY-MM-DD' string; if empty or None,
        stop at the last date in the database.

    Prints one "MM/DD/YYYY,todo,done,postponed" line for every day in the
    range, including both ends. Days without records get zero counts.
    Nothing is printed if a bound is missing and the database is empty.
    '''
    def _fromstr(s):
        '''Convert YYYY-MM-DD string to datetime.date'''

        (y, m, d) = s.split('-')
        return datetime.date(int(y), int(m), int(d))

    data = workitems_over_time(db)

    dates = sorted(data.keys())

    # an empty database has no first/last date to fall back to
    if not dates and not (from_date and to_date):
        return

    f = _fromstr(from_date or dates[0])
    t = _fromstr(to_date or dates[-1])

    d = f
    while d <= t:
        # database dates are YYYY-MM-DD strings
        entry = data.get(d.isoformat(), {})
        print('%02i/%02i/%i,%i,%i,%i' % (d.month, d.day, d.year,
            entry.get('todo', 0), entry.get('done', 0),
            entry.get('postponed', 0)))
        d += datetime.timedelta(days=1)
#
# main
#

if __name__ == '__main__':
    (opts, args) = parse_argv()

    db = get_db(opts.database)

    # NOTE(review): dump() and text() are assumed to be the names of the
    # functions behind --dump and --text; confirm against upstream
    if opts.dump:
        dump(db)
    elif opts.text:
        text(db)
    elif opts.csv:
        csv(db, opts.from_date, opts.to_date)
    else:
        # no report mode given: import current state from Launchpad
        import_lp(db, opts.pattern, opts.release)
        # make sure the new records are stored; this does no harm if
        # import_lp() already committed
        db.commit()