Blame - cm_crowdin_sync.py - crowdin

2014-02-28 01:06:03 +0100

[diff] [blame]

#!/usr/bin/python2

#

# cm_crowdin_sync.py

#

# Updates Crowdin source translations and pulls translations

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

6

# directly to CyanogenMod's Git.

#

#

# Licensed under the Apache License, Version 2.0 (the "License");

11

# you may not use this file except in compliance with the License.

12

# You may obtain a copy of the License at

13

#

14

# http://www.apache.org/licenses/LICENSE-2.0

15

#

16

# Unless required by applicable law or agreed to in writing, software

17

# distributed under the License is distributed on an "AS IS" BASIS,

18

# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

19

# See the License for the specific language governing permissions and

20

# limitations under the License.

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

21

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

22

import git

23

import mmap

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

24

import os

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

import os.path

import re

import shutil

import subprocess

import sys

from urllib import urlretrieve

31

from xml.dom import minidom

32

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

33

def get_caf_additions(strings_base, strings_cm):
    """Return the CM resources that do not exist in the AOSP base file.

    Both files are parsed as XML and their <string>, <string-array> and
    <plurals> elements are compared by their 'name' attribute. Elements that
    carry a 'translatable' or 'translate' attribute (whatever its value) are
    ignored on both sides.

    Args:
        strings_base: Path of the AOSP (base) resource file.
        strings_cm: Path of the CM resource file.

    Returns:
        A list of strings, one per CM-only element: the element serialized
        with toxml() and prefixed with ' '. All strings come first, then
        string-arrays, then plurals, each in document order.

    Raises:
        KeyError: If a compared element has no 'name' attribute.
    """
    # Compared element types, in the order they appear in the result.
    resource_tags = ('string', 'string-array', 'plurals')

    def translatable_nodes(document, tag):
        # Keep the nodes themselves (not just their names), so a name can
        # never be paired with the wrong element when some are filtered out.
        return [node for node in document.getElementsByTagName(tag)
                if not node.hasAttribute('translatable')
                and not node.hasAttribute('translate')]

    # Load AOSP file and CM file
    xml_base = minidom.parse(strings_base)
    xml_cm = minidom.parse(strings_cm)

    # Store all differences in this list
    caf_additions = []
    for tag in resource_tags:
        # A set gives O(1) membership tests for the names known to AOSP.
        names_base = set(node.attributes['name'].value
                         for node in translatable_nodes(xml_base, tag))
        for node in translatable_nodes(xml_cm, tag):
            if node.attributes['name'].value not in names_base:
                caf_additions.append(' ' + node.toxml())

    return caf_additions

Marco Brohet

2014-03-02 17:31:17 +0100

[diff] [blame]

92

def sync_js_translations(sync_type, path, lang=''):
    """Convert between the en.js string table and Crowdin XML files.

    The source file path + 'en.js' is always read. A line is treated as a
    string entry when it matches both the key pattern (text followed by
    ': ' and a quote) and a quoted value.

    * 'upload' mode writes path + 'en.xml', containing one
      <string name="KEY">VALUE</string> element per entry.
    * Any other mode reads path + lang + '.xml' and writes
      path + lang + '.js'. In 'download' mode every line of en.js that does
      not contain '//' is copied, with the quoted value replaced by the
      translation of the same name (English is kept when there is none) and
      the 'en' language identifiers replaced by lang.

    Args:
        sync_type: 'upload' or 'download'.
        path: Directory prefix of the .js/.xml files; it is concatenated
            as-is, so it needs its trailing separator.
        lang: Language code; required in download mode.

    Raises:
        SystemExit: In download mode when lang is empty.
    """
    # Function-scope import: the module does not import io at file level.
    import io

    # lang is necessary in download mode
    if sync_type == 'download' and lang == '':
        sys.exit('Invalid syntax. Language code is required in download mode.')

    uploading = sync_type == 'upload'

    # Read source en.js file. This is necessary for both upload and download modes
    with io.open(path + 'en.js', encoding='utf-8') as f:
        content = f.readlines()

    translations = {}
    if uploading:
        # Prepare XML file structure
        doc = minidom.Document()
        header = doc.createElement('resources')
    else:
        # Index the translations by name; the first occurrence of a name wins.
        xml_base = minidom.parse(path + lang + '.xml')
        for node in xml_base.getElementsByTagName('string'):
            name = node.attributes['name'].value
            if name not in translations:
                first = node.firstChild
                # An empty <string/> has no child: treat it as untranslated.
                translations[name] = first.nodeValue if first is not None else None

    out_lines = []
    # Read each line of en.js
    for a_line in content:
        # Regex to determine string id
        m = re.search(' (.*): [\'|\"]', a_line)
        # Regex to find the string contents (single- or double-quoted)
        m2 = re.search('\'(.*)\'|"(.*)"', a_line) if m is not None else None
        # A key without a properly closed quoted value is not a string entry.
        if m2 is not None:
            string_id = m.group(1).replace(' ', '')
            # Exactly one of the two alternatives matched.
            group = 1 if m2.group(1) is not None else 2
            string_content = m2.group(group)
            if uploading:
                # In upload mode, create the appropriate string element.
                element = doc.createElement('string')
                element.setAttribute('name', string_id)
                element.appendChild(doc.createTextNode(string_content))
                header.appendChild(element)
            else:
                # In download mode, swap the English text for the translation.
                # Only the matched value span is replaced, so a key that
                # happens to contain the same text is left untouched.
                translation = translations.get(string_id)
                if translation is not None:
                    english = string_content.rstrip()
                    start = m2.start(group)
                    a_line = (a_line[:start] + translation
                              + a_line[start + len(english):])

        # In download mode do not write comments.
        # NOTE(review): this also drops entries whose text contains '//'
        # (e.g. a URL) - kept as in the original, confirm this is intended.
        if sync_type == 'download' and '//' not in a_line:
            # Add language identifier (1)
            if 'cmaccount.l10n.en' in a_line:
                a_line = a_line.replace('l10n.en', 'l10n.' + lang)
            # Add language identifier (2)
            if 'l10n.add(\'en\'' in a_line:
                a_line = a_line.replace('l10n.add(\'en\'', 'l10n.add(\'' + lang + '\'')
            out_lines.append(a_line)

    if uploading:
        # Create XML file structure. Serializing to UTF-8 bytes and decoding
        # yields text on both Python 2 and Python 3.
        xml_text = header.toxml('utf-8').decode('utf-8')
        xml_text = xml_text.replace('<string', '\n <string').replace('</resources>', '\n</resources>')
        output = u'<?xml version="1.0" encoding="utf-8"?>\n' + u'\n' + xml_text
        target = path + 'en.xml'
    else:
        output = u''.join(out_lines)
        target = path + lang + '.js'

    # Write in one go; the context manager closes the file even on errors.
    with io.open(target, 'w', encoding='utf-8') as file_write:
        file_write.write(output)

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

164

def push_as_commit(path, name):
    """Stage and commit everything below *path* in its Git repository.

    Args:
        path: Repository directory, relative to the current working
            directory.
        name: Repository name; only used in the printed messages (and in
            the currently disabled push URL).

    A failing 'git commit' is reported and otherwise ignored, because the
    usual cause is that there is nothing to commit. Errors raised while
    opening the repository or staging files are not caught.
    """
    # Get path
    path = os.getcwd() + '/' + path

    # Create git commit
    repo = git.Repo(path)
    repo.git.add(path)
    try:
        repo.git.commit(m='DO NOT MERGE: Automatic translation import test commit')
    except git.GitCommandError:
        # If git commit fails, it's probably because of no changes.
        # Just continue.
        print('No commit pushed (probably empty?) for ' + name)
        print('WARNING: If the repository name was not obtained from default.xml, the name might be wrong!')
    else:
        # The push itself is currently disabled:
        # repo.git.push('ssh://cobjeM@review.cyanogenmod.org:29418/' + name, 'HEAD:refs/for/cm-11.0')
        print('Succesfully pushed commit for ' + name)

180

181

print('Welcome to the CM Crowdin sync script!')

print('\nSTEP 0: Checking dependencies')
# Check for Ruby version of crowdin-cli.
# 'gem list NAME -i' reports whether the gem is installed: it prints
# true/false (followed by a newline) and fails when the gem is missing.
# Treat a failing command, a missing rvm binary and an output without
# 'true' all as "not installed".
try:
    gem_check = subprocess.check_output(['rvm', 'all', 'do', 'gem', 'list', 'crowdin-cli', '-i'])
except (OSError, subprocess.CalledProcessError):
    gem_check = b''
if b'true' not in gem_check:
    sys.exit('You have not installed crowdin-cli. Terminating.')
else:
    print('Found: crowdin-cli')

# Check for caf.xml and default.xml
for required_file in ('caf.xml', 'default.xml'):
    if not os.path.isfile(required_file):
        sys.exit('You have no ' + required_file + '. Terminating.')
    else:
        print('Found: ' + required_file)

# Check for repo
try:
    subprocess.check_output(['which', 'repo'])
except (OSError, subprocess.CalledProcessError):
    # 'which' exits non-zero when repo is not on the PATH.
    sys.exit('You have not installed repo. Terminating.')

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

204

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

205

print('\nSTEP 1: Create cm_caf.xml')
# Local to this step: the file-level imports do not include io.
import io

# Load caf.xml
print('Loading caf.xml')
xml = minidom.parse('caf.xml')
items = xml.getElementsByTagName('item')

# Store all created cm_caf.xml files in here.
# Easier to remove them afterwards, as they cannot be committed
cm_caf = []

for item in items:
    # Create tmp dir for download of AOSP base file
    path_to_values = item.attributes["path"].value
    tmp_dir = 'tmp/' + path_to_values
    if not os.path.isdir(tmp_dir):
        os.makedirs(tmp_dir)

    # Collect the contents first, so that no half-written cm_caf.xml is left
    # behind when a download or a parse fails.
    # This means we also support multiple base files (e.g. checking if strings.xml and arrays.xml are changed)
    contents = []
    for aosp_item in item.getElementsByTagName('aosp'):
        url = aosp_item.firstChild.nodeValue
        xml_file = aosp_item.attributes["file"].value
        path_to_base = tmp_dir + '/' + xml_file
        path_to_cm = path_to_values + '/' + xml_file
        urlretrieve(url, path_to_base)
        contents = contents + get_caf_additions(path_to_base, path_to_cm)

    # Create cm_caf.xml: header, contents, the end.
    # Written as UTF-8 text so non-ASCII resource strings do not break the
    # write; u'%s' turns plain ASCII byte strings into text on Python 2.
    path_to_cm_caf = path_to_values + '/cm_caf.xml'
    with io.open(path_to_cm_caf, 'w', encoding='utf-8') as f:
        f.write(u'<?xml version="1.0" encoding="utf-8"?>\n')
        f.write(u'<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2">\n')
        for addition in contents:
            f.write(u'%s\n' % addition)
        f.write(u'</resources>')
    cm_caf.append(path_to_cm_caf)
    print('Created ' + path_to_cm_caf)

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

241

242

print('\nSTEP 2: Upload Crowdin source translations')
# Execute 'crowdin-cli upload sources' and show output
print(subprocess.check_output(['crowdin-cli', 'upload', 'sources']))

print('STEP 3: Download Crowdin translations')
# Execute 'crowdin-cli download' and show output
print(subprocess.check_output(['crowdin-cli', "download"]))

print('STEP 4A: Clean up of source cm_caf.xmls')
# Remove all cm_caf.xml files, which you can find in the list 'cm_caf'
for cm_caf_file in cm_caf:
    print('Removing ' + cm_caf_file)
    os.remove(cm_caf_file)

print('\nSTEP 4B: Clean up of temp dir')
# We are done with cm_caf.xml files, so remove tmp/
# (it does not exist when caf.xml listed no items).
tmp_root = os.getcwd() + '/tmp'
if os.path.isdir(tmp_root):
    shutil.rmtree(tmp_root)

print('\nSTEP 4C: Clean up of empty translations')
# We hate empty, useless files. Crowdin exports them with <resources/> (sometimes with xliff).
# That means: easy to find
empty_markers = (
    '<resources/>',
    '<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2"/>',
)
# Every .xml file below the current working directory
result = [os.path.join(dp, f) for dp, dn, filenames in os.walk(os.getcwd()) for f in filenames if os.path.splitext(f)[1] == '.xml']
for xml_file in result:
    # Read each file once and close it before it is possibly removed.
    with open(xml_file) as candidate:
        xml_text = candidate.read()
    if any(marker in xml_text for marker in empty_markers):
        print('Removing ' + xml_file)
        os.remove(xml_file)

272

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

273

print('\nSTEP 5: Push translations to Git')

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

274

# Get all files that Crowdin pushed

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

275

proc = subprocess.Popen(['crowdin-cli', 'list', 'sources'],stdout=subprocess.PIPE)

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

276

xml = minidom.parse('default.xml')

277

items = xml.getElementsByTagName('project')

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

278

all_projects = []

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

279

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

280

for path in iter(proc.stdout.readline,''):

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

281

# Remove the \n at the end of each line

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

282

path = path.rstrip()

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

283

# Get project root dir from Crowdin's output

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

284

285

for good_path in m.groups():

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

286

# When a project has multiple translatable files, Crowdin will give duplicates.

287

# We don't want that (useless empty commits), so we save each project in all_projects

288

# and check if it's already in there.

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

289

if good_path is not None and not good_path in all_projects:

290

all_projects.append(good_path)

291

working = 'false'

292

for project_item in items:

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

293

# We need to have the Github repository for the git push url. Obtain them from

294

# default.xml based on the project root dir.

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

295

if project_item.attributes["path"].value == good_path:

296

working = 'true'

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

297

push_as_commit(good_path, project_item.attributes['name'].value)

298

print 'Committing ' + project_item.attributes['name'].value + ' (based on default.xml)'

299

# We also translate repositories that are not downloaded by default (e.g. device parts).

300

# This is just a fallback.

301

# WARNING: If the name is wrong, this will not stop the script.

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

302

if working == 'false':

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

303

push_as_commit(good_path, 'CyanogenMod/android_' + good_path.replace('/', '_'))

304

print 'Committing ' + project_item.attributes['name'].value + ' (workaround)'

Marco Brohet