Left: | ||
Right: |
OLD | NEW |
---|---|
(Empty) | |
1 # coding: utf-8 | |
2 | |
3 # This file is part of the Adblock Plus web scripts, | |
4 # Copyright (C) 2006-2015 Eyeo GmbH | |
5 # | |
6 # Adblock Plus is free software: you can redistribute it and/or modify | |
7 # it under the terms of the GNU General Public License version 3 as | |
8 # published by the Free Software Foundation. | |
9 # | |
10 # Adblock Plus is distributed in the hope that it will be useful, | |
11 # but WITHOUT ANY WARRANTY; without even the implied warranty of | |
12 # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
13 # GNU General Public License for more details. | |
14 # | |
15 # You should have received a copy of the GNU General Public License | |
16 # along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>. | |
17 | |
18 from io import BytesIO | |
19 from itertools import islice | |
Wladimir Palant
2015/06/29 19:05:36
Nit: I'm not a big fan of importing individual fun
kzar
2015/07/02 12:33:11
Done.
| |
20 import json | |
21 import logging | |
22 import os | |
23 import sys | |
24 import zipfile | |
25 | |
26 import requests | |
27 | |
28 import cms.utils | |
29 from cms.sources import FileSource | |
30 | |
# Chunk size handed to grouper() whenever files are uploaded to Crowdin, i.e.
# the maximum number of files sent in a single API request.
FILES_PER_REQUEST = 20

logger = logging.getLogger("cms.bin.translate")
# Module-level state read by crowdin_request() and download_translations().
# crowdin_project_name and defaultlocale are filled in by crowdin_sync();
# crowdin_api_key is assigned by the __main__ block below.
crowdin_api_key = None
crowdin_project_name = None
defaultlocale = None
Wladimir Palant
2015/06/29 19:05:37
The three variables above shouldn't be globals - t
kzar
2015/07/02 12:33:11
Done.
| |
37 | |
def grouper(iterable, n):
    """Yield successive tuples of at most n items taken from iterable.

    The final tuple may be shorter than n; nothing is yielded for an empty
    iterable.
    """
    iterator = iter(iterable)
    # iter(callable, sentinel) keeps calling the lambda until it returns the
    # empty tuple, which islice() produces once the iterator is exhausted.
    for chunk in iter(lambda: tuple(islice(iterator, n)), ()):
        yield chunk
Wladimir Palant
2015/06/29 19:05:36
Please link to https://stackoverflow.com/questions
kzar
2015/07/02 12:33:10
I originally did take this function from Stackover
| |
46 | |
def crowdin_request(request_method, api_endpoint, **kwargs):
    """Call a Crowdin project API endpoint and return the decoded JSON reply.

    request_method is the HTTP verb and api_endpoint the path below the
    project URL; all further keyword arguments are passed on to
    requests.request(). The project name and API key are read from the
    module-level crowdin_project_name and crowdin_api_key variables.

    Raises requests.exceptions.RequestException if the request cannot be
    completed or the server replies with an error status, and ValueError if
    the reply is not valid JSON. Each failure is logged before re-raising.
    """
    url = "https://api.crowdin.com/api/project/%s/%s" % (
        crowdin_project_name, api_endpoint
    )
    # Pass the key as a query parameter instead of baking it into the URL so
    # that the secret does not end up in the messages logged below.
    params = dict(kwargs.pop("params", None) or {})
    params.update({"key": crowdin_api_key, "json": 1})

    try:
        response = requests.request(request_method, url, params=params,
                                    **kwargs)
    except requests.exceptions.RequestException as e:
        # Only the exception type is logged: its message may contain the
        # full request URL, including the API key.
        logger.error("API call to %s failed: %s", url, type(e).__name__)
        raise

    try:
        response.raise_for_status()
    except requests.exceptions.HTTPError:
        logger.error("API call to %s failed:\n%s", url, response.text)
        raise

    try:
        return response.json()
    except ValueError:
        logger.error("API call to %s returned invalid JSON", url)
        raise
Wladimir Palant
2015/06/29 19:05:37
This call might also raise an exception - if JSON
kzar
2015/07/02 12:33:12
Done.
| |
58 | |
def extract_strings(source, defaultlocale):
    """Collect the translatable strings of every page in source.

    Returns a dict mapping each page name to a dict of
    {string_name: {"message": text, "description": comment}}, where
    "description" is only present for strings that have a locale comment.
    The "localedata" dict returned by cms.utils.get_page_params() is
    rewritten in place and reused as the per-page result.
    """
    logger.info("Extracting page strings (please be patient)...")
    result = {}
    for page, _ in source.list_pages():
        page_params = cms.utils.get_page_params(source, defaultlocale, page)
        messages = page_params["localedata"]
        descriptions = page_params["localecomments"]
        # Snapshot the keys first; the values are replaced while looping.
        for name in list(messages):
            entry = {"message": messages[name]}
            if name in descriptions:
                entry["description"] = descriptions[name]
            messages[name] = entry
        result[page] = messages
    return result
72 | |
def ensure_required_locales(required_locales, enabled_locales, defaultlocale):
    """Restrict the required locales to those Crowdin supports and enable them.

    required_locales and enabled_locales are sets of locale codes. Locales
    missing from Crowdin's "supported-languages" list are dropped with a
    warning. If any remaining required locale is not enabled yet, the project
    is edited so that both the enabled and the required locales are enabled.

    Returns (required_locales, skipped_locales): the supported subset as a
    set, and a list holding the unsupported locales plus defaultlocale.
    """
    logger.info("Checking which locales are supported by Crowdin...")
    languages = crowdin_request("GET", "supported-languages")
    supported = set(language["crowdin_code"] for language in languages)

    skipped_locales = list(required_locales - supported)
    if skipped_locales:
        unsupported = ", ".join(skipped_locales)
        logger.warning(
            "Ignoring locales that Crowdin doesn't support: %s" % unsupported
        )
        required_locales = required_locales & supported

    # The default locale is never translated, so it is skipped as well.
    skipped_locales.append(defaultlocale)

    not_enabled = required_locales.difference(enabled_locales)
    if not_enabled:
        logger.info("Enabling the required locales for the Crowdin project...")
        all_locales = list(enabled_locales | required_locales)
        crowdin_request("POST", "edit-project",
                        data={"languages[]": all_locales})

    return required_locales, skipped_locales
97 | |
def list_remote_files(project_info):
    """Flatten the file tree of a Crowdin project info reply.

    project_info["files"] is a list of nodes. Each node has a "name" and a
    "node_type" of either "file" or "directory"; directory nodes may carry
    their children under "files". Nodes of any other type are ignored.

    Returns (remote_files, remote_directories), two sets of "/"-separated
    paths relative to the project root.
    """
    remote_files = set()
    remote_directories = set()

    def parse_file_node(node, path=""):
        if node["node_type"] == "file":
            remote_files.add(path + node["name"])
        elif node["node_type"] == "directory":
            dir_name = path + node["name"]
            remote_directories.add(dir_name)
            for child in node.get("files", []):
                parse_file_node(child, dir_name + "/")

    # A plain loop rather than map(): the callback is only called for its
    # side effects, and a lazy map() would never call it at all.
    for node in project_info["files"]:
        parse_file_node(node)
    return remote_files, remote_directories
112 | |
def list_local_files(page_strings):
    """Work out which files and directories the local pages correspond to.

    page_strings maps page names (with "/" as separator) to their strings.
    Pages without any strings are ignored entirely.

    Returns (local_files, local_directories): the set of "<page>.json" file
    names, and the set of every parent directory of those pages.
    """
    local_files = set()
    local_directories = set()
    for page, strings in page_strings.items():
        if not strings:
            continue
        local_files.add(page + ".json")
        # Strip one path component at a time to collect all ancestors.
        directory = page
        while "/" in directory:
            directory = directory.rsplit("/", 1)[0]
            local_directories.add(directory)
    return local_files, local_directories
127 | |
def create_directories(directories):
    """Create each of the given directory paths in the Crowdin project.

    Paths are processed shortest first so that a parent directory is always
    requested before the directories nested inside it. This mirrors
    remove_old_directories(), which works longest first.
    """
    for directory in sorted(directories, key=len):
        logger.info("Creating directory %s" % directory)
        crowdin_request("POST", "add-directory", data={"name": directory})
132 | |
def add_update_files(api_endpoint, message, files, page_strings):
    """Send page string files to Crowdin in batches of FILES_PER_REQUEST.

    api_endpoint is the Crowdin endpoint to POST to. message is a log format
    string taking the number of files in the batch. files is an iterable of
    "<page>.json" names and page_strings maps page names to their strings.

    Each uploaded page is removed from page_strings (presumably to release
    the memory early), so the caller's dict shrinks as the upload proceeds.
    """
    for group in grouper(files, FILES_PER_REQUEST):
        payload = {}
        for file_name in group:
            page = os.path.splitext(file_name)[0]
            payload["files[%s]" % file_name] = (
                file_name, json.dumps(page_strings.pop(page))
            )
        logger.info(message % len(payload))
        crowdin_request("POST", api_endpoint, files=payload)
142 | |
def upload_new_files(new_files, page_strings):
    """Upload the given files through Crowdin's "add-file" endpoint."""
    add_update_files(
        api_endpoint="add-file",
        message="Uploading %d new pages...",
        files=new_files,
        page_strings=page_strings
    )
146 | |
def update_existing_files(existing_files, page_strings):
    """Upload the given files through Crowdin's "update-file" endpoint."""
    add_update_files(
        api_endpoint="update-file",
        message="Updating %d existing pages...",
        files=existing_files,
        page_strings=page_strings
    )
150 | |
def upload_translations(source_dir, new_files, required_locales):
    """Upload existing local translations for newly added files.

    For every locale in required_locales, each file of new_files that exists
    under <source_dir>/locales/<locale>/ is sent to the "upload-translation"
    endpoint, at most FILES_PER_REQUEST files per request. Requests are made
    per locale because the language is given once for the whole request.
    """
    def existing_locale_files(locale):
        for file_name in new_files:
            path = os.path.join(source_dir, "locales", locale, file_name)
            if os.path.isfile(path):
                yield file_name, path

    if not new_files:
        return

    for locale in required_locales:
        for group in grouper(existing_locale_files(locale),
                             FILES_PER_REQUEST):
            logger.info("Uploading %d existing translation "
                        "files for locale %s..." % (len(group), locale))
            handles = {}
            try:
                for file_name, path in group:
                    # Binary mode: the bytes are uploaded unchanged.
                    handles["files[%s]" % file_name] = open(path, "rb")
                crowdin_request("POST", "upload-translation", files=handles,
                                data={"language": locale})
            finally:
                # Close the files whether or not the request succeeded.
                for handle in handles.values():
                    handle.close()
Wladimir Palant
2015/06/29 19:05:37
These files should be closed regardless of whether
kzar
2015/07/02 12:33:10
Done.
| |
168 | |
def remove_old_files(old_files):
    """Delete each of the given files from the Crowdin project."""
    for stale_file in old_files:
        logger.info("Removing old file %s" % stale_file)
        request_data = {"file": stale_file}
        crowdin_request("POST", "delete-file", data=request_data)
173 | |
def remove_old_directories(old_directories):
    """Delete the given directories from the Crowdin project.

    The longest paths go first, so a nested directory is always handled
    before the directory that contains it.
    """
    ordered = list(old_directories)
    ordered.sort(key=len)
    ordered.reverse()
    for stale_directory in ordered:
        logger.info("Removing old directory %s" % stale_directory)
        request_data = {"name": stale_directory}
        crowdin_request("POST", "delete-directory", data=request_data)
178 | |
def _is_translation_member(member, skipped_locales):
    """Tell whether a ZIP member is a translation file that may be extracted.

    Accepts only "<locale>/.../<name>.json" paths whose locale is not in
    skipped_locales and which contain no empty, ".", ".." or drive/backslash
    components, so nothing can be written outside the locales directory.
    """
    if "\\" in member or ":" in member:
        return False
    parts = member.split("/")
    if len(parts) < 2 or not parts[-1].endswith(".json"):
        return False
    if any(part in ("", ".", "..") for part in parts):
        return False
    return parts[0] not in skipped_locales


def download_translations(source_dir, skipped_locales):
    """Replace the local translation files with a fresh export from Crowdin.

    Requests a new export, downloads the resulting ZIP archive, deletes the
    existing *.json files below <source_dir>/locales and then extracts the
    translation files from the archive into that directory. Locale
    directories listed in skipped_locales are neither cleared nor
    overwritten.

    Raises requests.exceptions.HTTPError if the download fails.
    """
    logger.info("Requesting generation of fresh translations archive...")
    result = crowdin_request("GET", "export")
    if result.get("success", {}).get("status") == "skipped":
        logger.warning("Archive generation skipped, either "
                       "no changes or API usage excessive")

    logger.info("Downloading translations archive...")
    response = requests.get(
        "https://api.crowdin.com/api/project/%s/download/all.zip?key=%s" % (
            crowdin_project_name, crowdin_api_key
        )
    )
    response.raise_for_status()

    logger.info("Extracting translations archive...")
    with zipfile.ZipFile(BytesIO(response.content), "r") as archive:
        locale_path = os.path.join(source_dir, "locales")
        # First clear existing translation files
        for root, dirs, files in os.walk(locale_path, topdown=True):
            if root == locale_path:
                # Pruning dirs in place keeps os.walk() out of the locale
                # directories for unsupported locales and the default one.
                dirs[:] = [d for d in dirs if d not in skipped_locales]
            for f in files:
                if f.endswith(".json"):
                    os.remove(os.path.join(root, f))
        # Then extract the new ones in place. Members are vetted one by one
        # instead of trusting the downloaded archive with extractall().
        for member in archive.namelist():
            if _is_translation_member(member, skipped_locales):
                archive.extract(member, locale_path)
Wladimir Palant
2015/06/29 19:05:37
Running extractall is pretty dangerous IMHO. I'd s
kzar
2015/07/02 12:33:12
Done.
| |
206 | |
def crowdin_sync(source_dir, crowdin_api_key):
    """Synchronise the pages of a CMS project with its Crowdin project.

    Reads "defaultlocale" and "crowdin-project-name" from the "general"
    section of the project configuration in source_dir, then:

    1. enables the required locales on Crowdin,
    2. creates missing directories and uploads new pages together with any
       translations that already exist locally,
    3. updates pages that exist on both sides,
    4. removes remote files and directories that no longer exist locally,
    5. downloads the translations and replaces the local locale files.

    Exits the process with status 1 if no page strings are found locally,
    so that an extraction problem cannot wipe the remote project.
    """
    global crowdin_project_name, defaultlocale
    # The crowdin_api_key parameter shadows the module-level variable that
    # crowdin_request() and download_translations() read. A parameter cannot
    # be declared global, so the value is published through globals().
    globals()["crowdin_api_key"] = crowdin_api_key

    with FileSource(source_dir) as source:
        config = source.read_config()
        defaultlocale = config.get("general", "defaultlocale")
        crowdin_project_name = config.get("general", "crowdin-project-name")

        logger.info("Requesting project information...")
        project_info = crowdin_request("GET", "info")
        page_strings = extract_strings(source, defaultlocale)

        required_locales = {l for l in source.list_locales()
                            if l != defaultlocale}
        enabled_locales = {l["code"] for l in project_info["languages"]}

        required_locales, skipped_locales = ensure_required_locales(
            required_locales, enabled_locales, defaultlocale
        )
        remote_files, remote_directories = list_remote_files(project_info)
        local_files, local_directories = list_local_files(page_strings)

        # Avoid deleting all remote content if there was a problem listing
        # local files
        if not local_files:
            logger.error("No page strings found. (Wrong project directory?) "
                         "Aborting!")
            sys.exit(1)

        new_files = local_files - remote_files
        new_directories = local_directories - remote_directories
        create_directories(new_directories)
        upload_new_files(new_files, page_strings)
        upload_translations(source_dir, new_files, required_locales)

        # Whatever is local but not new already exists on the remote side.
        existing_files = local_files - new_files
        update_existing_files(existing_files, page_strings)

        old_files = remote_files - local_files
        old_directories = remote_directories - local_directories
        remove_old_files(old_files)
        remove_old_directories(old_directories)

        download_translations(source_dir, skipped_locales)
        logger.info("Crowdin sync completed.")
249 | |
# Command line entry point:
#   python -m cms.bin.translate www_directory crowdin_project_api_key [level]
if __name__ == "__main__":
    if len(sys.argv) < 3:
        sys.stderr.write(
            "Usage: python -m cms.bin.translate www_directory "
            "crowdin_project_api_key [logging_level]\n"
        )
        sys.exit(1)

    logging.basicConfig()
    # The optional third argument is passed to setLevel() as given.
    logger.setLevel(sys.argv[3] if len(sys.argv) > 3 else logging.INFO)

    # Assigning crowdin_api_key here, at module level, also sets the global
    # that crowdin_request() reads.
    source_dir, crowdin_api_key = sys.argv[1:3]
    crowdin_sync(source_dir, crowdin_api_key)
OLD | NEW |