2 # emacs: -*- mode: python; py-indent-offset: 4; indent-tabs-mode: nil -*-
3 # vi: set ft=python sts=4 ts=4 sw=4 et:
8 from datetime import datetime
16 'etch': 'Debian GNU/Linux 4.0 (etch)',
17 'lenny': 'Debian GNU/Linux 5.0 (lenny)',
18 'squeeze': 'Debian GNU/Linux 6.0 (squeeze)',
19 'wheezy': 'Debian testing (wheezy)',
20 'sid': 'Debian unstable (sid)',
21 'hardy': 'Ubuntu 08.04 LTS "Hardy Heron" (hardy)',
22 'jaunty': 'Ubuntu 09.04 "Jaunty Jackalope" (jaunty)',
23 'karmic': 'Ubuntu 09.10 "Karmic Koala" (karmic)',
24 'lucid': 'Ubuntu 10.04 LTS "Lucid Lynx" (lucid)',
25 'maverick': 'Ubuntu 10.10 "Maverick Meerkat" (maverick)',
26 'natty': 'Ubuntu 11.04 "Natty Narwhal" (natty)',
27 'oneiric': 'Ubuntu 11.10 "Oneiric Ocelot" (oneiric)',
28 'precise': 'Ubuntu 12.04 LTS "Precise Pangolin" (precise)',
29 'quantal': 'Ubuntu 12.10 "Quantal Quetzal" (quantal)',
30 'raring': 'Ubuntu 13.04 "Raring Ringtail" (raring)',
31 'saucy': 'Ubuntu 13.10 "Saucy Salamander" (saucy)',
35 sys.stderr.write('E: %s\n' % msg)
38 sys.stderr.write("I: %s\n" % msg)
# Recognizes paths containing "popcon-<YYYY>-<M>-<D>"; group 1 captures the
# date string.  A raw string keeps the \d escapes intact for the regex engine,
# and the dot of the ".gz" suffix is escaped so it only matches a literal dot.
file_regex = re.compile(r'.*popcon-(\d{4}-\d{1,2}-\d{1,2})(|\.gz)')
def read_popcon_stats(filename, read_packages=True):
    """Parse one popcon statistics file into a dictionary.

    Every line is split at its first ':' into a key and a value part; both
    parts are stripped and lower-cased before they are interpreted.

    Parameters
    ----------
    filename : str
      File to read.  It is opened via `fileinput.hook_compressed`.
    read_packages : bool, optional
      Whether 'package' lines get parsed into the result.

    Returns
    -------
    dict
      'submissions' -> int (None if no such line was seen),
      'release' and 'architecture' -> {name: count},
      'package' -> {name: (vote, old, recent, nofiles)}.

    Raises
    ------
    ValueError
      If a 'package' line cannot be split into exactly five fields, or if
      a line carries a key this function does not know about.
    """
    info("Reading %s" % filename)
    # NOTE(review): only the 'submissions' slot of this initialiser was
    # visible during review; the three dict-valued slots are the ones the
    # loop below writes into -- confirm that no further keys are expected.
    entry = dict(submissions=None,
                 package={},
                 release={},
                 architecture={})
    stats = fileinput.FileInput(filename,
                                openhook=fileinput.hook_compressed)
    try:
        for line in stats:
            key, values = [x.strip().lower() for x in line.split(':', 1)]
            if key == 'package':  # most probable
                if not read_packages:
                    # NOTE(review): assumes unwanted package lines are
                    # simply skipped (not treated as end of useful data)
                    # -- TODO confirm
                    continue
                try:
                    pkg, vote, old, recent, nofiles = values.split()
                except ValueError:
                    raise ValueError("Failed to split %s" % values)
                entry[key][pkg] = tuple(
                    int(x) for x in (vote, old, recent, nofiles))
            elif key in ('release', 'architecture'):
                kvalue, value = values.split()
                entry[key][kvalue] = int(value)
            elif key == 'submissions':
                entry[key] = int(values)
            else:
                # The message must contain a %s placeholder: without one the
                # formatting itself fails with TypeError and the offending
                # line is never reported.
                raise ValueError("Do not know how to handle line %s" % line)
    finally:
        # release the underlying file handle on error paths as well
        stats.close()
    return entry
68 if __name__ == '__main__':
72 timestamps = sets.Set()
74 for f in sys.argv[1:]:
75 file_reg = file_regex.match(f)
77 error("Failed to recognize filename %s" % f)
80 date = time.strptime(file_reg.groups()[0], '%Y-%m-%d')
81 entry = read_popcon_stats(f, read_packages=False)
83 date_int = int(time.mktime(date)*1000)
84 # Let's coarsen a bit -- to a week which makes sense anyways
85 # since popcon submissions are spread over a week for balanced
88 coarsen = coarsen_days*24*3600*1000
89 # coarsen and place marker at the end of the duration
90 # but not later than today
91 date_int = min((date_int//coarsen + 1)*coarsen,
93 for version, count in entry['release'].iteritems():
94 if not version in popcon_versions:
95 popcon_versions[version] = {}
96 popcon_ = popcon_versions[version]
97 popcon_[date_int] = count + popcon_.get(date_int, 0)
98 timestamps.add(date_int)
100 versions = sorted([x for x in popcon_versions.keys() if not 'ubuntu' in x]) + \
101 sorted([x for x in popcon_versions.keys() if 'ubuntu' in x])
103 # we need to make sure that for every date we have an entry for
104 # every version, otherwise d3 pukes because of ... d3.v2.js:expand
106 'values': [[date, popcon_versions[k].get(date, 0)/coarsen_days]
107 for date in sorted(list(timestamps))]}
109 print json.dumps(export)