3 """ Various statistical pr0nography fun and games """
4 # Copyright (C) 2000, 2001, 2002, 2003, 2006 James Troup <james@nocrew.org>
6 # This program is free software; you can redistribute it and/or modify
7 # it under the terms of the GNU General Public License as published by
8 # the Free Software Foundation; either version 2 of the License, or
9 # (at your option) any later version.
11 # This program is distributed in the hope that it will be useful,
12 # but WITHOUT ANY WARRANTY; without even the implied warranty of
13 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
14 # GNU General Public License for more details.
16 # You should have received a copy of the GNU General Public License
17 # along with this program; if not, write to the Free Software
18 # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
20 ################################################################################
22 # <aj> can we change the standards instead?
24 # <aj> whatever we're not conforming to
25 # <aj> if there's no written standard, why don't we declare linux as
26 # the defacto standard
29 # [aj's attempt to avoid ABI changes for released architecture(s)]
31 ################################################################################
35 from daklib import utils
36 from daklib import database
38 ################################################################################
43 ################################################################################
# Print the command-line help for `dak stats`: the -h/--help option and the
# three supported MODEs (arch-space, pkg-nums, daily-install).
#
# exit_code defaults to 0.
# NOTE(review): the end of the help string and any use of exit_code are not
# visible in this listing -- presumably the process exits with it; confirm.
45 def usage(exit_code=0):
46 print """Usage: dak stats MODE
49 -h, --help show this help and exit.
51 The following MODEs are available:
53 arch-space - displays space used by each architecture
54 pkg-nums - displays the number of packages by suite/architecture
55 daily-install - displays daily install stats suitable for graphing
59 ################################################################################
# Run two size queries against the module-level projectB connection.
#
# The first joins files, binaries and architecture and sums f.size grouped by
# architecture name (a.arch_string).
# NOTE(review): each result is bound to q, but the statement that consumes it
# is not visible in this listing -- presumably it is printed; confirm.
61 def per_arch_space_use():
62 q = projectB.query("""
63 SELECT a.arch_string as Architecture, sum(f.size)
64 FROM files f, binaries b, architecture a
65 WHERE a.id=b.architecture AND f.id=b.file
66 GROUP BY a.arch_string""")
# Second query: total size of the rows in files whose filename matches the
# diff.gz / tar.gz / dsc pattern.
# NOTE(review): the '.' characters in the pattern are unescaped, so as a
# regular expression they match any character rather than a literal dot.
68 q = projectB.query("SELECT sum(size) FROM files WHERE filename ~ '.(diff.gz|tar.gz|dsc)$'")
71 ################################################################################
# Summarise per-date install activity from a '|'-separated log file and print
# one "date packages size" line per date.
#
# NOTE(review): the statements that create `stats` and that bind `program`,
# `action` and `date` from the split fields, as well as the loop header that
# drives the final output, are not visible in this listing.
73 def daily_install_stats():
# The input file name is hard-coded.
75 f = utils.open_file("2001-11")
76 for line in f.readlines():
77 split = line.strip().split('|')
# Only entries written by "katie" or "process-accepted" are considered ...
79 if program != "katie" and program != "process-accepted":
# ... and of those only the "installing changes" and "installed" actions.
82 if action != "installing changes" and action != "installed":
# First time this date is seen: start its counters at zero.
85 if not stats.has_key(date):
87 stats[date]["packages"] = 0
88 stats[date]["size"] = 0.0
# An "installing changes" entry counts as one package; an "installed" entry
# adds the numeric value of the sixth field to the date's size total.
89 if action == "installing changes":
90 stats[date]["packages"] += 1
91 elif action == "installed":
92 stats[date]["size"] += float(split[5])
# The accumulated size is divided by 1024 twice and truncated to an int
# (presumably bytes -> MiB; confirm the unit of the logged value).
97 packages = stats[date]["packages"]
98 size = int(stats[date]["size"] / 1024.0 / 1024.0)
99 print "%s %s %s" % (date, packages, size)
101 ################################################################################
# cmp-style comparator for two suite names (used with list.sort in
# number_of_packages). Each name is looked up in the module-level Cnf as
# "Suite::<name>::Priority", converted to int, and the two values are compared
# with cmp(), so the result is negative, zero or positive.
# NOTE(review): the fallback used when a suite has no Priority entry is not
# visible in this listing -- confirm the default value.
111 def suite_sort(a, b):
112 if Cnf.has_key("Suite::%s::Priority" % (a)):
113 a_priority = int(Cnf["Suite::%s::Priority" % (a)])
116 if Cnf.has_key("Suite::%s::Priority" % (b)):
117 b_priority = int(Cnf["Suite::%s::Priority" % (b)])
120 return cmp(a_priority, b_priority)
def output_format(suite):
    """Abbreviate a suite name to the first letter of each "-"-separated word.

    For example "proposed-updates" becomes "p-u" and "unstable" becomes "u".

    An empty word (from an empty name, or a leading, trailing or doubled
    "-") contributes an empty string instead of raising IndexError.
    """
    # word[:1] equals word[0] for non-empty words and "" for empty ones.
    return "-".join([word[:1] for word in suite.split("-")])
128 # Obvious query with GROUP BY and mapped names -> 50 seconds
129 # GROUP BY but ids instead of suite/architecture names -> 28 seconds
130 # Simple query -> 14 seconds
131 # Simple query into large dictionary + processing -> 21 seconds
132 # Simple query into large pre-created dictionary + processing -> 18 seconds
# Build a text table of package counts with one row per architecture and one
# column per suite, using the module-level projectB connection.
#
# NOTE(review): several statements of this function are not visible in this
# listing (creation of arches/arch_ids/suites/suite_ids/d/suite_arches/
# suite_id_list, the unpacking of the suite and architecture rows, the branch
# taken when an architecture is not part of a suite, and whatever is finally
# done with `output`). The comments below describe only the visible lines.
134 def number_of_packages():
140 # Build up suite mapping
141 q = projectB.query("SELECT id, suite_name FROM suite")
142 suite_ql = q.getresult()
# suite_ids maps suite name -> suite id.
146 suite_ids[name] = sid
147 # Build up architecture mapping
148 q = projectB.query("SELECT id, arch_string FROM architecture")
149 for i in q.getresult():
153 # Pre-create the dictionary
# d[suite_id][arch_id] holds the running count, starting at 0 for every
# suite/architecture pair.
154 for suite_id in suites.keys():
156 for arch_id in arches.keys():
157 d[suite_id][arch_id] = 0
158 # Get the raw data for binaries
159 q = projectB.query("""
160 SELECT ba.suite, b.architecture
161 FROM binaries b, bin_associations ba
162 WHERE b.id = ba.bin""")
163 # Simultate 'GROUP by suite, architecture' with a dictionary
# One result row per binary/suite association; each row adds 1 to its cell.
164 for i in q.getresult():
165 (suite_id, arch_id) = i
166 d[suite_id][arch_id] = d[suite_id][arch_id] + 1
167 # Get the raw data for source
# Source counts are stored under the id of the architecture named "source".
168 arch_id = arch_ids["source"]
169 q = projectB.query("""
170 SELECT suite, count(suite) FROM src_associations GROUP BY suite;""")
171 for i in q.getresult():
172 (suite_id, count) = i
173 d[suite_id][arch_id] = d[suite_id][arch_id] + count
# Order the suite names with the suite_sort comparator.
176 suite_list = suites.values()
177 suite_list.sort(suite_sort)
# For each suite, record which architectures
# database.get_suite_architectures() returns for it; suite_arches[suite_id]
# is used as a set (the "" values are never read in the visible code).
180 for suite in suite_list:
181 suite_id = suite_ids[suite]
182 suite_arches[suite_id] = {}
183 for arch in database.get_suite_architectures(suite_id):
184 suite_arches[suite_id][arch] = ""
185 suite_id_list.append(suite_id)
# Column headings are the abbreviated suite names from output_format();
# longest() is defined outside this listing and supplies the column widths.
186 output_list = [ output_format(i) for i in suite_list ]
187 longest_suite = longest(output_list)
188 arch_list = arches.values()
190 longest_arch = longest(arch_list)
# Header row: a blank architecture column, then each suite heading centred,
# followed by a rule of dashes as long as the header built so far.
192 output = (" "*longest_arch) + " |"
193 for suite in output_list:
194 output = output + suite.center(longest_suite)+" |"
195 output = output + "\n"+(len(output)*"-")+"\n"
# arch_list and longest_arch are computed a second time here.
197 arch_list = arches.values()
199 longest_arch = longest(arch_list)
# One row per architecture: the centred name, then a right-justified cell per
# suite in suite_id_list order.
200 for arch in arch_list:
201 arch_id = arch_ids[arch]
202 output = output + arch.center(longest_arch)+" |"
203 for suite_id in suite_id_list:
# The count is shown only when the suite includes this architecture.
204 if suite_arches[suite_id].has_key(arch):
205 count = repr(d[suite_id][arch_id])
208 output = output + count.rjust(longest_suite)+" |"
209 output = output + "\n"
212 ################################################################################
# Command-line handling and mode dispatch for `dak stats`.
# NOTE(review): the enclosing `def` line, the loop binding `i`, the conditions
# guarding the warnings, and the bodies of most branches are not visible in
# this listing -- presumably this is the body of the script's entry-point
# function; confirm.
217 Cnf = utils.get_conf()
# The only option is -h/--help, stored under Stats::Options::Help.
218 Arguments = [('h',"help","Stats::Options::Help")]
# Give each option key an empty-string value if it is not already set.
220 if not Cnf.has_key("Stats::Options::%s" % (i)):
221 Cnf["Stats::Options::%s" % (i)] = ""
# args receives the return value of ParseCommandLine; below it is indexed as
# the MODE argument list.
223 args = apt_pkg.ParseCommandLine(Cnf, Arguments, sys.argv)
225 Options = Cnf.SubTree("Stats::Options")
230 utils.warn("dak stats requires a MODE argument")
233 utils.warn("dak stats accepts only one MODE argument")
# MODE matching is case-insensitive: the argument is lower-cased first.
235 mode = args[0].lower()
# Connect using the DB::Name, DB::Host and DB::Port configuration entries and
# hand the connection to the database helper module.
237 projectB = pg.connect(Cnf["DB::Name"], Cnf["DB::Host"], int(Cnf["DB::Port"]))
238 database.init(Cnf, projectB)
# Dispatch on the requested mode; any other value produces a warning.
240 if mode == "arch-space":
242 elif mode == "pkg-nums":
244 elif mode == "daily-install":
245 daily_install_stats()
247 utils.warn("unknown mode '%s'" % (mode))
250 ################################################################################
252 if __name__ == '__main__':