Rietveld Code Review Tool
Help | Bug tracker | Discussion group | Source code

Side by Side Diff: cms/bin/translate.py

Issue 29317015: Issue 2625 - [cms] Crowdin synchronisation script (Closed)
Patch Set: Created June 15, 2015, 2:12 p.m.
Left:
Right:
Use n/p to move between diff chunks; N/P to move between comments.
Jump to:
View unified diff | Download patch
« no previous file with comments | « README.md ('k') | cms/converters.py » ('j') | cms/converters.py » ('J')
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
OLDNEW
(Empty)
1 # coding: utf-8
2
3 # This file is part of the Adblock Plus web scripts,
4 # Copyright (C) 2006-2015 Eyeo GmbH
5 #
6 # Adblock Plus is free software: you can redistribute it and/or modify
7 # it under the terms of the GNU General Public License version 3 as
8 # published by the Free Software Foundation.
9 #
10 # Adblock Plus is distributed in the hope that it will be useful,
11 # but WITHOUT ANY WARRANTY; without even the implied warranty of
12 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
13 # GNU General Public License for more details.
14 #
15 # You should have received a copy of the GNU General Public License
16 # along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>.
17
18 from io import BytesIO
19 from itertools import islice
Wladimir Palant 2015/06/29 19:05:36 Nit: I'm not a big fan of importing individual fun
kzar 2015/07/02 12:33:11 Done.
20 import json
21 import logging
22 import os
23 import sys
24 import zipfile
25
26 import requests
27
28 import cms.utils
29 from cms.sources import FileSource
30
# Batch size handed to grouper() when files are uploaded to Crowdin
FILES_PER_REQUEST = 20

logger = logging.getLogger("cms.bin.translate")
# Module-wide Crowdin settings. crowdin_api_key and crowdin_project_name are
# read when building API URLs; all three start out unset.
crowdin_api_key = None
crowdin_project_name = None
defaultlocale = None
Wladimir Palant 2015/06/29 19:05:37 The three variables above shouldn't be globals - t
kzar 2015/07/02 12:33:11 Done.
37
def grouper(iterable, n):
    """Yield successive tuples holding at most n items of iterable.

    The last tuple may be shorter than n; nothing is yielded for an empty
    iterable.
    """
    source = iter(iterable)
    # iter() with a sentinel keeps calling the lambda until it returns the
    # empty tuple, i.e. until the underlying iterator is exhausted.
    for batch in iter(lambda: tuple(islice(source, n)), ()):
        yield batch
Wladimir Palant 2015/06/29 19:05:36 Please link to https://stackoverflow.com/questions
kzar 2015/07/02 12:33:10 I originally did take this function from Stackover
46
def crowdin_request(request_method, api_endpoint, **kwargs):
    """Call an endpoint of the Crowdin project API and return the parsed JSON.

    request_method and any extra keyword arguments are passed through to
    requests.request(). The project name and API key are taken from the
    module-level crowdin_project_name and crowdin_api_key.

    Every failure is logged and then re-raised unchanged: a request that
    could not be completed, an HTTP error status, or a response body that
    is not valid JSON.
    """
    url = "https://api.crowdin.com/api/project/%s/%s?key=%s&json=1" % (
        crowdin_project_name, api_endpoint, crowdin_api_key
    )
    try:
        response = requests.request(request_method, url, **kwargs)
    except requests.exceptions.RequestException:
        # Connection problems, timeouts etc. never produce a response object
        logger.error("API call to %s failed: request could not be completed"
                     % url)
        raise

    try:
        response.raise_for_status()
    except requests.exceptions.HTTPError:
        logger.error("API call to %s failed:\n%s" % (url, response.text))
        raise

    try:
        return response.json()
    except ValueError:
        # The server answered successfully but the body isn't valid JSON
        logger.error("API call to %s returned invalid JSON:\n%s" % (
            url, response.text
        ))
        raise
Wladimir Palant 2015/06/29 19:05:37 This call might also raise an exception - if JSON
kzar 2015/07/02 12:33:12 Done.
58
def extract_strings(source, defaultlocale):
    """Gather the strings of every page listed by source, keyed by page.

    Each page's "localedata" mapping is rewritten in place so that every
    string becomes {"message": text}, plus a "description" entry when the
    page's "localecomments" has one for that string. Returns a dict mapping
    page name to that rewritten mapping.
    """
    logger.info("Extracting page strings (please be patient)...")
    page_strings = {}
    for page, _ in source.list_pages():
        params = cms.utils.get_page_params(source, defaultlocale, page)
        messages = params["localedata"]
        descriptions = params["localecomments"]
        # Only existing keys are reassigned, so iterating while updating
        # the mapping is safe.
        for name in messages:
            entry = {"message": messages[name]}
            messages[name] = entry
            if name in descriptions:
                entry["description"] = descriptions[name]
        page_strings[page] = messages
    return page_strings
72
def ensure_required_locales(required_locales, enabled_locales, defaultlocale):
    """Reconcile the locales the site needs with what Crowdin offers.

    Queries Crowdin for its supported languages, drops required locales it
    does not support (with a warning) and, if any remaining required locale
    is not yet enabled for the project, enables it via "edit-project".

    Returns a tuple (required_locales, skipped_locales): the set of required
    locales Crowdin supports, and a list of the unsupported locales followed
    by defaultlocale.
    """
    logger.info("Checking which locales are supported by Crowdin...")
    languages = crowdin_request("GET", "supported-languages")
    supported_locales = set(entry["crowdin_code"] for entry in languages)

    skipped_locales = list(required_locales - supported_locales)
    if skipped_locales:
        logger.warning("Ignoring locales that Crowdin doesn't support: %s" % (
            ", ".join(skipped_locales)
        ))
        required_locales = required_locales & supported_locales

    # It's useful to have a list of all locales to skip
    skipped_locales.append(defaultlocale)

    # Anything required but not yet enabled must be switched on remotely
    if required_locales - enabled_locales:
        logger.info("Enabling the required locales for the Crowdin project...")
        all_locales = list(enabled_locales | required_locales)
        crowdin_request("POST", "edit-project",
                        data={"languages[]": all_locales})

    return required_locales, skipped_locales
97
def list_remote_files(project_info):
    """Flatten the file tree of a Crowdin project-info response.

    project_info["files"] is a list of nodes; each node has a "node_type"
    of "file" or "directory", a "name" and, for directories, an optional
    "files" list of child nodes. Nodes of any other type are ignored.

    Returns a tuple (remote_files, remote_directories) of sets containing
    the "/"-separated paths of all files and all directories.
    """
    remote_files = set()
    remote_directories = set()

    def parse_file_node(node, path=""):
        if node["node_type"] == "file":
            remote_files.add(path + node["name"])
        elif node["node_type"] == "directory":
            dir_name = path + node["name"]
            remote_directories.add(dir_name)
            for child in node.get("files", []):
                parse_file_node(child, dir_name + "/")

    # A plain loop rather than map(): the callback is run purely for its
    # side effects, and a lazy map() would never invoke it at all.
    for node in project_info["files"]:
        parse_file_node(node)
    return remote_files, remote_directories
112
def list_local_files(page_strings):
    """Derive the Crowdin file and directory paths for the local pages.

    Pages without any strings are ignored. Every other page contributes
    "<page>.json" to the file set and each of its ancestor directories to
    the directory set. Returns the tuple (local_files, local_directories).
    """
    local_files = set()
    local_directories = set()
    for page, strings in page_strings.items():
        if not strings:
            continue
        local_files.add(page + ".json")
        # Strip one trailing path component at a time to visit each ancestor
        ancestor = page
        while "/" in ancestor:
            ancestor = ancestor.rsplit("/", 1)[0]
            local_directories.add(ancestor)
    return local_files, local_directories
127
def create_directories(directories):
    """Issue one "add-directory" API call per entry, in iteration order."""
    for name in directories:
        logger.info("Creating directory %s" % name)
        payload = {"name": name}
        crowdin_request("POST", "add-directory", data=payload)
132
def add_update_files(api_endpoint, message, files, page_strings):
    """Upload the JSON for the given files, FILES_PER_REQUEST at a time.

    api_endpoint is the Crowdin endpoint to POST to. message is a log
    format string taking the number of files in the current batch. files
    holds file names of the form "<page>.json"; page_strings maps each
    page to its strings.

    Each page's entry is removed from page_strings once it has been
    serialised, so the caller's dict shrinks as uploads proceed.
    """
    for group in grouper(files, FILES_PER_REQUEST):
        # Separate name for the request payload so the files parameter
        # isn't rebound while it is still being consumed by grouper().
        payload = {}
        for file_name in group:
            page = os.path.splitext(file_name)[0]
            payload["files[%s]" % file_name] = (
                file_name, json.dumps(page_strings[page])
            )
            # Serialised copy is all we need from here on; presumably this
            # frees memory for large sites - TODO confirm with the author.
            del page_strings[page]
        logger.info(message % len(payload))
        crowdin_request("POST", api_endpoint, files=payload)
142
def upload_new_files(new_files, page_strings):
    """Upload the given files through the "add-file" endpoint."""
    add_update_files(
        api_endpoint="add-file",
        message="Uploading %d new pages...",
        files=new_files,
        page_strings=page_strings
    )
146
def update_existing_files(existing_files, page_strings):
    """Upload the given files through the "update-file" endpoint."""
    add_update_files(
        api_endpoint="update-file",
        message="Updating %d existing pages...",
        files=existing_files,
        page_strings=page_strings
    )
150
def upload_translations(source_dir, new_files, required_locales):
    """Upload existing local translations of newly added files.

    For every locale in required_locales, each entry of new_files that
    exists under <source_dir>/locales/<locale>/ is sent to the
    "upload-translation" endpoint, at most FILES_PER_REQUEST files per
    request. Requests are made per locale because the locale is passed as
    the request's "language" field.

    Opened files are closed even if a request raises.
    """
    def open_locale_files(locale, files):
        for file_name in files:
            path = os.path.join(source_dir, "locales", locale, file_name)
            if os.path.isfile(path):
                # Binary mode so the bytes are uploaded exactly as stored
                yield ("files[%s]" % file_name, open(path, "rb"))

    if not new_files:
        return

    for locale in required_locales:
        for files in grouper(open_locale_files(locale, new_files),
                             FILES_PER_REQUEST):
            try:
                logger.info("Uploading %d existing translation "
                            "files for locale %s..." % (len(files), locale))
                crowdin_request("POST", "upload-translation",
                                files=dict(files), data={"language": locale})
            finally:
                # Release the handles whether or not the upload succeeded
                for _, handle in files:
                    handle.close()
Wladimir Palant 2015/06/29 19:05:37 These files should be closed regardless of whether
kzar 2015/07/02 12:33:10 Done.
168
def remove_old_files(old_files):
    """Issue one "delete-file" API call per entry of old_files."""
    for stale in old_files:
        logger.info("Removing old file %s" % stale)
        payload = {"file": stale}
        crowdin_request("POST", "delete-file", data=payload)
173
def remove_old_directories(old_directories):
    """Issue one "delete-directory" API call per entry, longest path first.

    A nested directory's path is always longer than its parent's, so
    children are removed before the directories containing them.
    """
    by_length = sorted(old_directories, key=len)
    for name in by_length[::-1]:
        logger.info("Removing old directory %s" % name)
        crowdin_request("POST", "delete-directory", data={"name": name})
178
def download_translations(source_dir, skipped_locales):
    """Replace the local translation files with a fresh Crowdin export.

    Asks Crowdin to build a new translations archive, downloads it, deletes
    the existing .json files below <source_dir>/locales and unpacks the
    archive's .json files there. Top-level locale directories named in
    skipped_locales are neither cleared nor written to.

    Raises requests.exceptions.HTTPError if the archive download fails.
    """
    logger.info("Requesting generation of fresh translations archive...")
    result = crowdin_request("GET", "export")
    if result.get("success", {}).get("status") == "skipped":
        logger.warning("Archive generation skipped, either "
                       "no changes or API usage excessive")

    logger.info("Downloading translations archive...")
    response = requests.get(
        "https://api.crowdin.com/api/project/%s/download/all.zip?key=%s" % (
            crowdin_project_name, crowdin_api_key
        )
    )
    response.raise_for_status()
    logger.info("Extracting translations archive...")
    with zipfile.ZipFile(BytesIO(response.content), "r") as archive:
        locale_path = os.path.join(source_dir, "locales")
        # First clear existing translation files
        for root, dirs, files in os.walk(locale_path, topdown=True):
            if root == locale_path:
                # Don't delete locale files for unsupported locales or the
                # default; pruning dirs in place stops os.walk descending.
                dirs[:] = [d for d in dirs if d not in skipped_locales]
            for f in files:
                if f.endswith(".json"):
                    os.remove(os.path.join(root, f))
        # Then extract the new ones in place. The archive comes from the
        # network, so only unpack what we expect: .json members with a
        # plain relative path that don't land in a preserved locale.
        for member in archive.namelist():
            parts = member.split("/")
            if not member.lower().endswith(".json"):
                continue
            if parts[0] in skipped_locales:
                continue
            if any(part in ("", ".", "..") for part in parts):
                continue
            archive.extract(member, locale_path)
Wladimir Palant 2015/06/29 19:05:37 Running extractall is pretty dangerous IMHO. I'd s
kzar 2015/07/02 12:33:12 Done.
206
def crowdin_sync(source_dir, crowdin_api_key):
    """Synchronise the pages and translations in source_dir with Crowdin.

    Reads "defaultlocale" and "crowdin-project-name" from the "general"
    section of the site configuration, then: enables required locales,
    creates new remote directories, uploads new files together with their
    existing translations, updates files present on both sides, removes
    remote files and directories that no longer exist locally, and finally
    downloads the current translations.

    Exits the process with status 1 if no local page strings are found,
    rather than deleting everything on the remote side.
    """
    global crowdin_project_name, defaultlocale

    # A parameter cannot be declared global, so publish the key explicitly.
    # Without this the API helpers only saw the key when the module was run
    # as a script, where the __main__ block assigns the module-level name.
    globals()["crowdin_api_key"] = crowdin_api_key

    with FileSource(source_dir) as source:
        config = source.read_config()
        defaultlocale = config.get("general", "defaultlocale")
        crowdin_project_name = config.get("general", "crowdin-project-name")

        logger.info("Requesting project information...")
        project_info = crowdin_request("GET", "info")
        page_strings = extract_strings(source, defaultlocale)

        required_locales = {l for l in source.list_locales()
                            if l != defaultlocale}
        enabled_locales = {l["code"] for l in project_info["languages"]}

        # skipped_locales is needed later so their local files are kept
        required_locales, skipped_locales = ensure_required_locales(
            required_locales, enabled_locales, defaultlocale
        )
        remote_files, remote_directories = list_remote_files(project_info)
        local_files, local_directories = list_local_files(page_strings)

        # Avoid deleting all remote content if there was a problem listing
        # local files
        if not local_files:
            logger.error("No page strings found. (Wrong project directory?) "
                         "Aborting!")
            sys.exit(1)

        # Directories must exist remotely before files are added to them
        new_files = list(local_files.difference(remote_files))
        new_directories = list(
            local_directories.difference(remote_directories)
        )
        create_directories(new_directories)
        upload_new_files(new_files, page_strings)
        upload_translations(source_dir, new_files, required_locales)

        existing_files = list(local_files.intersection(remote_files))
        update_existing_files(existing_files, page_strings)

        # Files go first so directories are empty when they are removed
        old_files = remote_files.difference(local_files)
        old_directories = remote_directories.difference(local_directories)
        remove_old_files(old_files)
        remove_old_directories(old_directories)

        download_translations(source_dir, skipped_locales)
        logger.info("Crowdin sync completed.")
249
# Command-line entry point:
#   python -m cms.bin.translate www_directory crowdin_project_api_key [level]
if __name__ == "__main__":
    if len(sys.argv) < 3:
        # Written via sys.stderr.write so the line parses identically
        # with or without the print statement being available.
        sys.stderr.write(
            "Usage: python -m cms.bin.translate www_directory "
            "crowdin_project_api_key [logging_level]\n"
        )
        sys.exit(1)

    logging.basicConfig()
    # Optional third argument is passed to setLevel() as given
    logger.setLevel(sys.argv[3] if len(sys.argv) > 3 else logging.INFO)

    source_dir, crowdin_api_key = sys.argv[1:3]
    crowdin_sync(source_dir, crowdin_api_key)
OLDNEW
« no previous file with comments | « README.md ('k') | cms/converters.py » ('j') | cms/converters.py » ('J')

Powered by Google App Engine
This is Rietveld