Left: | ||
Right: |
OLD | NEW |
---|---|
1 # coding: utf-8 | 1 # coding: utf-8 |
2 | 2 |
3 # This file is part of the Adblock Plus web scripts, | 3 # This file is part of the Adblock Plus web scripts, |
4 # Copyright (C) 2006-2013 Eyeo GmbH | 4 # Copyright (C) 2006-2013 Eyeo GmbH |
5 # | 5 # |
6 # Adblock Plus is free software: you can redistribute it and/or modify | 6 # Adblock Plus is free software: you can redistribute it and/or modify |
7 # it under the terms of the GNU General Public License version 3 as | 7 # it under the terms of the GNU General Public License version 3 as |
8 # published by the Free Software Foundation. | 8 # published by the Free Software Foundation. |
9 # | 9 # |
10 # Adblock Plus is distributed in the hope that it will be useful, | 10 # Adblock Plus is distributed in the hope that it will be useful, |
11 # but WITHOUT ANY WARRANTY; without even the implied warranty of | 11 # but WITHOUT ANY WARRANTY; without even the implied warranty of |
12 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | 12 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
13 # GNU General Public License for more details. | 13 # GNU General Public License for more details. |
14 # | 14 # |
15 # You should have received a copy of the GNU General Public License | 15 # You should have received a copy of the GNU General Public License |
16 # along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>. | 16 # along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>. |
17 | 17 |
18 import os, re, subprocess, urllib | 18 import os, sys, re, codecs, subprocess, urllib, simplejson, traceback |
Sebastian Noack
2013/08/26 16:05:22
Since Python 2.6 you can use the built-in "json" m
Wladimir Palant
2013/08/27 07:34:28
I am aware of that of course. However, simplejson
Wladimir Palant
2013/08/27 11:59:47
Reply by Sebastian:
That is strange since the ori
Wladimir Palant
2013/08/27 12:42:01
I did. However, looking at http://www.tablix.org/~
| |
19 import sitescripts.stats.common as common | |
19 from sitescripts.utils import get_config, setupStderr | 20 from sitescripts.utils import get_config, setupStderr |
20 from ConfigParser import SafeConfigParser, NoOptionError | |
21 from StringIO import StringIO | |
22 | 21 |
23 def readStatsFile(path): | 22 def read_stats_file(path): |
24 result = SafeConfigParser() | 23 match = re.search(r"^ssh://(\w+)@([^/:]+)(?::(\d+))?", path) |
25 match = re.search(r'^ssh://(\w+)@([^/:]+)(?::(\d+))?', path) | |
26 if match: | 24 if match: |
27 command = ['ssh', '-q', '-o' 'NumberOfPasswordPrompts 0', '-T', '-k', '-l', match.group(1), match.group(2)] | 25 command = ["ssh", "-q", "-o", "NumberOfPasswordPrompts 0", "-T", "-k", "-l", match.group(1), match.group(2)] |
28 if match.group(3): | 26 if match.group(3): |
29 command[1:1] = ['-P', match.group(3)] | 27 command[1:1] = ["-P", match.group(3)] |
30 data = subprocess.check_output(command) | 28 data = subprocess.check_output(command) |
31 result.readfp(StringIO(data)) | 29 return simplejson.loads(data.decode("utf-8")) |
32 elif path.startswith('http://') or path.startswith('https://'): | 30 elif path.startswith("http://") or path.startswith("https://"): |
33 result.readfp(urllib.urlopen(path)) | 31 return simplejson.load(urllib.urlopen(path).read().decode("utf-8")) |
34 elif os.path.exists(path): | 32 elif os.path.exists(path): |
35 result.read(path) | 33 with codecs.open(path, "rb", encoding="utf-8") as file: |
36 return result | 34 return simplejson.load(file) |
37 | 35 |
38 def getStatsFiles(): | 36 raise IOError("Path '%s' not recognized" % path) |
37 | |
38 def get_stats_files(mirrors): | |
39 config = get_config() | 39 config = get_config() |
40 | 40 |
41 for option in config.options('subscriptionStats'): | 41 if len(mirrors) > 0: |
42 match = re.search(r'^mirror_(.*)', option, re.I) | 42 options = map(lambda m: "mirror_" + m, mirrors) |
43 if match: | 43 else: |
44 yield (match.group(1), config.get('subscriptionStats', option)) | 44 options = filter(lambda o: o.startswith("mirror_"), config.options("stats")) |
45 for option in options: | |
46 if config.has_option("stats", option): | |
47 value = config.get("stats", option) | |
48 if " " in value: | |
49 yield re.split(r"\s+", value, 1) | |
Sebastian Noack
2013/08/26 16:05:22
Did you know that value.split(None, 1) would do th
Wladimir Palant
2013/08/27 07:34:28
No, I didn't. Fixed.
| |
50 else: | |
51 print >>sys.stderr, "Option '%s' has invalid value: '%s'" % (option, value) | |
52 else: | |
53 print >>sys.stderr, "Option '%s' not found in the configuration" % option | |
45 | 54 |
46 def mergeStatsFile(mirrorName, config1, config2): | 55 def merge_objects(object1, object2): |
47 def increaseOption(section, option, increase): | 56 for key, value in object2.iteritems(): |
48 if config1.has_option(section, option): | 57 if key in object1: |
49 oldval = config1.getint(section, option) | 58 if isinstance(value, int): |
50 config1.set(section, option, str(oldval + increase)) | 59 object1[key] += value |
60 else: | |
61 merge_objects(object1[key], object2[key]) | |
51 else: | 62 else: |
52 config1.set(section, option, str(increase)) | 63 object1[key] = value |
53 | 64 |
54 for section in config2.sections(): | 65 def merge_stats_file(server_type, data): |
55 if not config1.has_section(section): | 66 base_dir = os.path.join(get_config().get("stats", "dataDirectory"), common.filename_encode(server_type)) |
56 config1.add_section(section) | 67 for month, month_data in data.iteritems(): |
57 for option in config2.options(section): | 68 for name, file_data in month_data.iteritems(): |
58 increase = config2.getint(section, option) | 69 path = os.path.join(base_dir, common.filename_encode(month), common.filename_encode(name + ".json")) |
59 increaseOption(section, option, increase) | 70 if os.path.exists(path): |
71 with codecs.open(path, "rb", encoding="utf-8") as file: | |
72 existing = simplejson.load(file) | |
73 else: | |
74 existing = {} | |
60 | 75 |
61 match = re.search(r'^(\S+) (hits|bandwidth)$', option, re.I) | 76 merge_objects(existing, file_data) |
62 if match: | |
63 increaseOption(section, '%s %s mirror %s' % (match.group(1), match.group(2), mirrorName), increase) | |
64 | 77 |
65 if __name__ == '__main__': | 78 dir = os.path.dirname(path) |
79 if not os.path.exists(dir): | |
80 os.makedirs(dir) | |
81 | |
82 with codecs.open(path, "wb", encoding="utf-8") as file: | |
83 simplejson.dump(existing, file, indent=2, sort_keys=True) | |
84 | |
85 def merge_mirror_stats(mirrors): | |
86 for server_type, path in get_stats_files(mirrors): | |
87 try: | |
88 merge_stats_file(server_type, read_stats_file(path)) | |
89 except: | |
90 print >>sys.stderr, "Unable to merge stats for '%s'" % path | |
91 traceback.print_exc() | |
92 | |
93 if __name__ == "__main__": | |
66 setupStderr() | 94 setupStderr() |
67 | 95 merge_mirror_stats(sys.argv[1:]) |
68 result = readStatsFile(get_config().get('subscriptionStats', 'mainFile')) | |
69 for (mirrorName, statsFile) in getStatsFiles(): | |
70 mergeStatsFile(mirrorName, result, readStatsFile(statsFile)) | |
71 file = open(get_config().get('subscriptionStats', 'mainFile'), 'wb') | |
72 result.write(file) | |
OLD | NEW |