#!/usr/bin/python2
# -*- coding: utf-8 -*-
# cm_crowdin_sync.py
#
# Updates Crowdin source translations and pulls translations
# directly to CyanogenMod's Git.
#
# Copyright (C) 2014 The CyanogenMod Project
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

Marco Brohetf1742722014-03-04 22:41:18 +010022import codecs
Marco Brohet4683bee2014-02-28 01:06:03 +010023import git
24import mmap
Marco Brohetcf4069b2014-02-28 18:48:17 +010025import os
Marco Brohet4683bee2014-02-28 01:06:03 +010026import os.path
27import re
28import shutil
29import subprocess
30import sys
31from urllib import urlretrieve
32from xml.dom import minidom
33
def get_caf_additions(strings_base, strings_cm):
    """Return the resources that exist in the CM file but not in the base file.

    Both files are parsed with ``minidom.parse``. ``<string>``,
    ``<string-array>`` and ``<plurals>`` elements are compared by their
    ``name`` attribute, separately per tag. Elements that carry a
    ``translatable`` or ``translate`` attribute (regardless of its value)
    are ignored on both sides.

    Args:
        strings_base: path (or file object) of the base (AOSP) resource file.
        strings_cm: path (or file object) of the CM resource file.

    Returns:
        A list of strings, one per added element: a single leading space
        followed by the element's XML. Strings come first, then
        string-arrays, then plurals, each group in CM document order.
        Every qualifying element is emitted exactly once, even when the CM
        file contains the same name more than once.

    Raises:
        KeyError: if a considered element has no ``name`` attribute.
    """
    xml_base = minidom.parse(strings_base)
    xml_cm = minidom.parse(strings_cm)

    def is_considered(element):
        # Anything explicitly marked with either attribute is skipped.
        return not (element.hasAttribute('translatable') or
                    element.hasAttribute('translate'))

    # Store all differences in this list
    caf_additions = []

    for tag in ('string', 'string-array', 'plurals'):
        # A set gives constant-time lookups for the base names of this tag.
        base_names = set(
            element.attributes['name'].value
            for element in xml_base.getElementsByTagName(tag)
            if is_considered(element)
        )
        for element in xml_cm.getElementsByTagName(tag):
            if not is_considered(element):
                continue
            if element.attributes['name'].value not in base_names:
                caf_additions.append(' ' + element.toxml())

    # Done :-)
    return caf_additions
98
def sync_js_translations(sync_type, path, lang=''):
    """Convert between the ``en.js`` strings file and Crowdin-style XML.

    In upload mode every ``id: 'text'`` / ``id: "text"`` line of
    ``<path>en.js`` becomes a ``<string name="id">text</string>`` element in
    ``<path>en.xml``.

    In any other mode ``<path><lang>.xml`` is read and ``<path><lang>.js`` is
    (re)created. Only when ``sync_type`` is ``'download'`` are lines written:
    ``en.js`` is copied line by line, English text is replaced by the
    translation whose ``name`` matches the string id, lines containing
    ``//`` are dropped, and the ``en`` language identifiers are rewritten to
    ``lang``. Strings without a usable translation keep their English text.

    Args:
        sync_type: ``'upload'`` or ``'download'``.
        path: directory prefix; it is concatenated directly with the file
            names, so it must end with a path separator.
        lang: language code, required in download mode.

    Raises:
        SystemExit: in download mode when ``lang`` is empty.
    """
    # lang is necessary in download mode
    if sync_type == 'download' and lang == '':
        sys.exit('Invalid syntax. Language code is required in download mode.')

    upload = sync_type == 'upload'

    # Read source en.js file. This is necessary for both upload and download modes
    with codecs.open(path + 'en.js', 'r', 'utf-8') as f:
        content = f.readlines()

    translations = {}
    if upload:
        # Prepare XML file structure
        doc = minidom.Document()
        header = doc.createElement('resources')
        target = path + 'en.xml'
    else:
        # Parse the translation before the output file is truncated, so a
        # missing or broken XML file does not leave an empty .js behind.
        xml_base = minidom.parse(path + lang + '.xml')
        for tag in xml_base.getElementsByTagName('string'):
            # The first element wins when a name occurs more than once.
            if tag.hasAttribute('name'):
                translations.setdefault(tag.getAttribute('name'), tag)
        target = path + lang + '.js'

    # Regex to determine string id / string contents
    id_pattern = re.compile(' (.*): [\'|\"]')
    content_pattern = re.compile('\'(.*)\'|"(.*)"')

    with codecs.open(target, 'w', 'utf-8') as file_write:
        # Read each line of en.js
        for a_line in content:
            m = id_pattern.search(a_line)
            # A line with an opening quote but no closing one has an id but
            # no content match; treat it like any other non-string line.
            m2 = content_pattern.search(a_line) if m is not None else None
            if m2 is not None:
                string_id = m.group(1).replace(' ', '')
                # Exactly one alternative of the pattern took part in the match.
                string_content = m2.group(1)
                if string_content is None:
                    string_content = m2.group(2)

                if upload:
                    # In upload mode, create the appropriate string element.
                    element = doc.createElement('string')
                    element.setAttribute('name', string_id)
                    element.appendChild(doc.createTextNode(string_content))
                    header.appendChild(element)
                else:
                    # In download mode, check if string_id matches a name attribute
                    # in the translation XML file. If it does, replace English text
                    # with the translation. If it does not, English text remains
                    # to retain the file structure.
                    node = translations.get(string_id)
                    english = string_content.rstrip()
                    translated = None
                    if node is not None and node.firstChild is not None:
                        translated = node.firstChild.nodeValue
                    # An empty search string would make str.replace insert the
                    # translation between every character of the line.
                    if translated is not None and english:
                        a_line = a_line.replace(english, translated)

            # In download mode do not write comments
            if sync_type == 'download' and '//' not in a_line:
                # Add language identifier (1)
                if 'cmaccount.l10n.en' in a_line:
                    a_line = a_line.replace('l10n.en', 'l10n.' + lang)
                # Add language identifier (2)
                if 'l10n.add(\'en\'' in a_line:
                    a_line = a_line.replace('l10n.add(\'en\'', 'l10n.add(\'' + lang + '\'')
                # Now write the line
                file_write.write(a_line)

        # Create XML file structure
        if upload:
            body = header.toxml().replace('<string', '\n <string').replace('</resources>', '\n</resources>')
            file_write.write('<?xml version="1.0" encoding="utf-8"?>\n')
            file_write.write('<!-- .JS CONVERTED TO .XML - DO NOT MERGE THIS FILE -->\n')
            file_write.write(body)
170
def push_as_commit(path, name):
    """Stage everything under a project directory and commit it.

    Args:
        path: project directory, relative to the current working directory.
        name: repository name. It is only used in the status messages here;
            the Gerrit push that would use it is currently disabled.

    A failing ``git commit`` is reported and otherwise ignored, so the
    caller can continue with the next project.
    """
    # Get path
    path = os.path.join(os.getcwd(), path)

    # Create git commit
    repo = git.Repo(path)
    repo.git.add(path)
    try:
        repo.git.commit(m='DO NOT MERGE: Automatic translation import test commit')
    except git.GitCommandError:
        # If git commit fails, it's probably because of no changes.
        # Just continue.
        print('No commit pushed (probably empty?) for ' + name)
        print('WARNING: If the repository name was not obtained from default.xml, the name might be wrong!')
    else:
        # NOTE: the actual push is disabled; only a local commit is created.
        # repo.git.push('ssh://cobjeM@review.cyanogenmod.org:29418/' + name, 'HEAD:refs/for/cm-11.0')
        print('Succesfully pushed commit for ' + name)
187
print('Welcome to the CM Crowdin sync script!')

print('\nSTEP 0: Checking dependencies')
# Check for Ruby version of crowdin-cli.
# 'gem list <name> -i' reports 'true' when the gem is installed. A missing
# gem is expected to show up as 'false' and/or a non-zero exit status
# (NOTE(review): confirm the exit status when run through 'rvm all do').
try:
    gem_check = subprocess.check_output(['rvm', 'all', 'do', 'gem', 'list', 'crowdin-cli', '-i'])
except (OSError, subprocess.CalledProcessError):
    sys.exit('You have not installed crowdin-cli. Terminating.')
if 'true' not in gem_check.decode('utf-8'):
    sys.exit('You have not installed crowdin-cli. Terminating.')
print('Found: crowdin-cli')
# Check for caf.xml
if not os.path.isfile('caf.xml'):
    sys.exit('You have no caf.xml. Terminating.')
print('Found: caf.xml')
# Check for default.xml
if not os.path.isfile('default.xml'):
    sys.exit('You have no default.xml. Terminating.')
print('Found: default.xml')
# Check for repo
try:
    subprocess.check_output(['which', 'repo'])
except (OSError, subprocess.CalledProcessError):
    sys.exit('You have not installed repo. Terminating.')

print('\nSTEP 1: Create cm_caf.xml')
# Load caf.xml
print('Loading caf.xml')
# Named caf_doc rather than 'xml' so the stdlib package name is not shadowed.
caf_doc = minidom.parse('caf.xml')
items = caf_doc.getElementsByTagName('item')

# Store all created cm_caf.xml files in here.
# Easier to remove them afterwards, as they cannot be committed
cm_caf = []

for item in items:
    # Create tmp dir for download of AOSP base file
    path_to_values = item.attributes["path"].value
    tmp_dir = 'tmp/' + path_to_values
    if not os.path.isdir(tmp_dir):
        os.makedirs(tmp_dir)
    # Collect the contents first, so a failed download does not leave a
    # half-written cm_caf.xml behind.
    # This means we also support multiple base files (e.g. checking if strings.xml and arrays.xml are changed)
    contents = []
    for aosp_item in item.getElementsByTagName('aosp'):
        url = aosp_item.firstChild.nodeValue
        xml_file = aosp_item.attributes["file"].value
        path_to_base = 'tmp/' + path_to_values + '/' + xml_file
        path_to_cm = path_to_values + '/' + xml_file
        urlretrieve(url, path_to_base)
        contents.extend(get_caf_additions(path_to_base, path_to_cm))
    # Create cm_caf.xml - header, contents, the end
    cm_caf_path = path_to_values + '/cm_caf.xml'
    with codecs.open(cm_caf_path, 'w', 'utf-8') as f:
        f.write('<?xml version="1.0" encoding="utf-8"?>\n')
        f.write('<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2">\n')
        for addition in contents:
            f.write(addition + '\n')
        f.write('</resources>')
    cm_caf.append(cm_caf_path)
    print('Created ' + cm_caf_path)

print('\nSTEP 2: Upload Crowdin source translations')
# Execute 'crowdin-cli upload sources' and show output
print(subprocess.check_output(['crowdin-cli', 'upload', 'sources']))

print('STEP 3: Download Crowdin translations')
# Execute 'crowdin-cli download' and show output
print(subprocess.check_output(['crowdin-cli', "download"]))

print('STEP 4A: Clean up of source cm_caf.xmls')
# Remove all cm_caf.xml files, which you can find in the list 'cm_caf'
for cm_caf_file in cm_caf:
    print('Removing ' + cm_caf_file)
    os.remove(cm_caf_file)

print('\nSTEP 4B: Clean up of temp dir')
# We are done with cm_caf.xml files, so remove tmp/
shutil.rmtree(os.getcwd() + '/tmp')

print('\nSTEP 4C: Clean up of empty translations')
# We hate empty, useless files. Crowdin exports them with <resources/> (sometimes with xliff).
# That means: easy to find
empty_markers = (
    '<resources/>',
    '<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2"/>',
)
# Every .xml file below the current working directory
result = [os.path.join(dp, file_name)
          for dp, _dirs, filenames in os.walk(os.getcwd())
          for file_name in filenames
          if os.path.splitext(file_name)[1] == '.xml']
for xml_file in result:
    # Read each file once and close it before it may be removed.
    with open(xml_file) as xml_handle:
        xml_text = xml_handle.read()
    if any(marker in xml_text for marker in empty_markers):
        print('Removing ' + xml_file)
        os.remove(xml_file)

print('\nSTEP 5: Push translations to Git')
# Get all files that Crowdin pushed
proc = subprocess.Popen(['crowdin-cli', 'list', 'sources'], stdout=subprocess.PIPE)
manifest = minidom.parse('default.xml')
items = manifest.getElementsByTagName('project')
all_projects = []

for path in iter(proc.stdout.readline, ''):
    # Remove the \n at the end of each line
    path = path.rstrip()
    # Get project root dir from Crowdin's output
    m = re.search('/(.*Superuser)/Superuser.*|/(.*LatinIME).*|/(frameworks/base).*|/(.*CMFileManager).*|/(device/.*/.*)/.*/res/values.*|/(hardware/.*/.*)/.*/res/values.*|/(.*)/res/values.*', path)
    if m is None:
        # Not a path any of the known layouts recognises; nothing to commit.
        continue
    for good_path in m.groups():
        # When a project has multiple translatable files, Crowdin will give duplicates.
        # We don't want that (useless empty commits), so we save each project in all_projects
        # and check if it's already in there.
        if good_path is not None and good_path not in all_projects:
            all_projects.append(good_path)
            working = False
            for project_item in items:
                # We need to have the Github repository for the git push url. Obtain them from
                # default.xml based on the project root dir.
                # getAttribute returns '' for a project without a path attribute.
                if project_item.getAttribute('path') == good_path:
                    working = True
                    project_name = project_item.attributes['name'].value
                    push_as_commit(good_path, project_name)
                    print('Committing ' + project_name + ' (based on default.xml)')
            # We also translate repositories that are not downloaded by default (e.g. device parts).
            # This is just a fallback.
            # WARNING: If the name is wrong, this will not stop the script.
            if not working:
                fallback_name = 'CyanogenMod/android_' + good_path.replace('/', '_')
                push_as_commit(good_path, fallback_name)
                # Report the name that was actually used, not a leftover manifest entry.
                print('Committing ' + fallback_name + ' (workaround)')

# Reap the crowdin-cli child once its output has been consumed.
proc.stdout.close()
proc.wait()

print('STEP 6: Done!')