| Index: mozharness/abb/transform_locales.py |
| diff --git a/mozharness/abb/transform_locales.py b/mozharness/abb/transform_locales.py |
| new file mode 100644 |
| index 0000000000000000000000000000000000000000..650b4d5fb8c22eee7236b3cc1422a9d9dd206922 |
| --- /dev/null |
| +++ b/mozharness/abb/transform_locales.py |
| @@ -0,0 +1,182 @@ |
| +# This file is part of Adblock Plus |
| +# Copyright (C) 2006-2015 Eyeo GmbH |
| +# |
| +# Adblock Plus is free software: you can redistribute it and/or modify |
| +# it under the terms of the GNU General Public License version 3 as |
| +# published by the Free Software Foundation. |
| +# |
| +# Adblock Plus is distributed in the hope that it will be useful, |
| +# but WITHOUT ANY WARRANTY; without even the implied warranty of |
| +# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| +# GNU General Public License for more details. |
| +# |
| +# You should have received a copy of the GNU General Public License |
| +# along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>. |
| + |
| +import os |
| +import re |
| + |
| +_LOCALE_RE = re.compile("^[a-z]{2}(-[A-Z]{2})?$") |
| +_SEARCH_PROPS_RE = re.compile("^browser\.search\." |
| + "(defaultenginename|order\.).*$") |
| +_SHORTNAME_RE = re.compile("^<ShortName>.*</ShortName>$") |
| + |
| +_SEARCHPLUGINS_PATH = os.path.join("browser", "searchplugins") |
| +_LIST_TXT_PATH = os.path.join(_SEARCHPLUGINS_PATH, "list.txt") |
| +_REGION_PROPS_PATH = os.path.join("browser", "region.properties") |
| + |
| +_DEFAULT_LOCALE = "en-US" |
| + |
| +_SEARCH_ENGINE_ORDER = { |
| + "en-US": ["duckduckgo", |
| + "yahoo", |
| + "google", |
| + "wikipedia", |
| + "amazon" |
| + ], |
| + "zh-CN": ["baidu", |
| + "duckduckgo", |
| + "yahoo", |
| + "google", |
| + "wikipedia", |
| + "amazon" |
| + ] |
| +} |
| + |
| + |
| +def _get_shortname_from_id(needle, engine_ids, engine_names): |
| + """Fuzzy finds needle in engine_ids and returns ShortName""" |
| + regex = re.compile("^%s.*$" % needle) |
| + for engine in engine_ids: |
| + if regex.match(engine.lower()): |
|
Felix Dahlke
2015/09/21 20:46:31
Sorry for not realising this earlier, but wouldn't
René Jeschke
2015/09/22 10:52:02
Done.
|
| + return engine_names[engine] |
| + return None |
| + |
| + |
| +def _write_lines(filename, lines): |
| + """Writes lines into file appending \\n""" |
| + with open(filename, "w") as fd: |
| + for l in lines: |
| + fd.write("%s\n" % l) |
| + |
| + |
def _transform_locale(locale, path, logger):
    """Restrict a locale's search engines to the whitelist and reorder them.

    Two files below path are rewritten in place:
    - browser/searchplugins/list.txt keeps only the engine IDs that start
      with a whitelisted prefix
    - browser/region.properties loses its browser.search.defaultenginename
      and browser.search.order.* lines and gets new ones appended, built
      from the engines' ShortNames in whitelist order

    locale -- locale code; selects the whitelist (falling back to the
              default locale's) and is used in log messages
    path -- root directory of the locale's files
    logger -- object providing info() and fatal(). fatal() is expected to
              abort; in case it does not, the function returns right after
              calling it and leaves the files untouched.
    """
    logger.info("Processing locale '%s'..." % locale)

    # Check for list.txt existence
    list_file_path = os.path.join(path, _LIST_TXT_PATH)
    if not os.path.exists(list_file_path):
        logger.fatal("Missing 'list.txt' for locale '%s'" % locale)
        return

    # Check for region.properties existence
    region_file_path = os.path.join(path, _REGION_PROPS_PATH)
    if not os.path.exists(region_file_path):
        logger.fatal("Missing 'region.properties' for locale '%s'" % locale)
        return

    # Whitelist entries are literal ID prefixes, so compare them as plain
    # text instead of interpolating them into a regular expression
    whitelist = _SEARCH_ENGINE_ORDER.get(locale,
                                         _SEARCH_ENGINE_ORDER[_DEFAULT_LOCALE])
    prefixes = tuple(whitelist)

    # Read engine IDs from list.txt, discard engines not on whitelist
    engine_ids = []
    with open(list_file_path, "r") as fd:
        for line in fd:
            line = line.strip()
            if not line:
                continue
            if line.lower().startswith(prefixes):
                engine_ids.append(line)
            else:
                logger.info("Removing '%s'" % line)

    # Make sure we still have search engines left
    if not engine_ids:
        logger.fatal("No search engines left over for '%s'" % locale)
        return

    # 'Parse' XML to get matching 'ShortName' for all engine IDs. The tag
    # lengths are derived from the tags rather than hard coded as offsets.
    open_tag = "<ShortName>"
    close_tag = "</ShortName>"
    engine_names = {}
    for eid in engine_ids:
        xml_file_path = os.path.join(path, _SEARCHPLUGINS_PATH, "%s.xml" % eid)
        if not os.path.exists(xml_file_path):
            logger.fatal("XML definition for '%s' in '%s' missing" %
                         (eid, locale))
            return

        short_name = None
        with open(xml_file_path, "r") as fd:
            for line in fd:
                line = line.strip()
                # If several lines match, the last one wins
                if _SHORTNAME_RE.match(line):
                    inner = line[len(open_tag):-len(close_tag)]
                    short_name = inner.strip()

        if not short_name:
            logger.fatal("No ShortName defined for '%s' in '%s'" %
                         (eid, locale))
            return
        engine_names[eid] = short_name

    logger.info("Remaining engine IDs: %s" % ", ".join(engine_ids))

    # Create search engine order with real engine names
    engine_order = []
    for eid in whitelist:
        sn = _get_shortname_from_id(eid, engine_ids, engine_names)
        if sn:
            engine_order.append(sn)

    logger.info("Resulting ordered list: %s" % (", ".join(engine_order)))

    # Read region.properties and remove browser.search.* lines
    props = []
    with open(region_file_path, "r") as fd:
        for line in fd:
            line = line.rstrip("\r\n")
            if not _SEARCH_PROPS_RE.match(line.strip()):
                props.append(line)

    # Append default search engine name. Every remaining engine ID starts
    # with a whitelisted prefix, so engine_order has at least one entry.
    props.append("browser.search.defaultenginename=%s" % engine_order[0])

    # Append search engine order, limited to the first three engines
    for position, name in enumerate(engine_order[:3], 1):
        props.append("browser.search.order.%d=%s" % (position, name))

    # Write back list.txt
    _write_lines(list_file_path, engine_ids)

    # Write back region.properties
    _write_lines(region_file_path, props)
| + |
| + |
class MinimalLogger(object):
    """Fallback logger that prints prefixed messages to stdout.

    Provides the three methods this module calls on a logger: info(),
    error() and fatal(). The parenthesised print form with a single
    argument produces the same output on Python 2 and Python 3.
    """

    def info(self, s):
        """Print s prefixed with 'INFO: '"""
        print("INFO: %s" % s)

    def error(self, s):
        """Print s prefixed with 'ERROR: '"""
        print("ERROR: %s" % s)

    def fatal(self, s):
        """Print s prefixed with 'FATAL: ' and exit with status 1"""
        print("FATAL: %s" % s)
        # Raised directly: the exit() builtin is injected by the site
        # module and is not available in every interpreter setup
        raise SystemExit(1)
| + |
| + |
def transform_locales(build_object, obj_dir):
    """Transform the search engine setup of every locale in a build.

    Looks for locale-named directories (e.g. "de", "en-US") below
    <obj_dir>/dist/bin/chrome and runs _transform_locale() on each
    <locale>/locale/<locale> directory found, in sorted order.

    build_object -- logger providing info(), error() and fatal(); a
                    MinimalLogger is used when this is None (or falsy)
    obj_dir -- the build's object directory
    """
    logger = build_object or MinimalLogger()

    chrome_path = os.path.join(obj_dir, "dist", "bin", "chrome")
    if not os.path.isdir(chrome_path):
        # Report the path that was actually checked, and stop here even if
        # the logger's fatal() does not abort
        logger.fatal("'%s' does not exist" % chrome_path)
        return

    # Only immediate subdirectories with a locale-like name qualify
    locales = sorted(
        name for name in os.listdir(chrome_path)
        if _LOCALE_RE.match(name) and
        os.path.isdir(os.path.join(chrome_path, name)))

    logger.info("Found %d locales" % len(locales))

    for locale in locales:
        locale_path = os.path.join(chrome_path, locale, "locale", locale)
        if os.path.exists(locale_path):
            _transform_locale(locale, locale_path, logger)
        else:
            logger.error("Missing 'locale' folder for '%s'" % locale)
| + |