Blame - cm_crowdin_sync.py - crowdin

2014-02-28 01:06:03 +0100

[diff] [blame]

1

#!/usr/bin/python2

Marco Brohet

f174272

2014-03-04 22:41:18 +0100

[diff] [blame]

2

# -*- coding: utf-8 -*-

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

3

# cm_crowdin_sync.py

4

#

5

# Updates Crowdin source translations and pulls translations

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

6

# directly to CyanogenMod's Git.

#

#

# Licensed under the Apache License, Version 2.0 (the "License");

11

# you may not use this file except in compliance with the License.

12

# You may obtain a copy of the License at

13

#

14

# http://www.apache.org/licenses/LICENSE-2.0

15

#

16

# Unless required by applicable law or agreed to in writing, software

17

# distributed under the License is distributed on an "AS IS" BASIS,

18

# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

19

# See the License for the specific language governing permissions and

20

# limitations under the License.

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

21

Marco Brohet

f174272

2014-03-04 22:41:18 +0100

[diff] [blame]

22

import codecs

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

23

import git

24

import mmap

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

25

import os

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

import os.path

import re

import shutil

import subprocess

import sys

from urllib import urlretrieve

32

from xml.dom import minidom

33

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

34

def get_caf_additions(strings_base, strings_cm):
    """Return the resources that the CM file defines and the base file lacks.

    strings_base -- file name (or file object) of the base resource XML
    strings_cm   -- file name (or file object) of the CM resource XML

    Only <string>, <string-array> and <plurals> elements are considered, in
    that order, and elements carrying a 'translatable' or 'translate'
    attribute (whatever its value) are ignored on both sides.

    Returns a list with one entry per addition: the element serialised with
    toxml(), prefixed with ' '. Each qualifying CM element is emitted exactly
    once, in document order.
    """
    def is_candidate(element):
        # The mere presence of either attribute excludes the element.
        return not (element.hasAttribute('translatable') or
                    element.hasAttribute('translate'))

    xml_base = minidom.parse(strings_base)
    xml_cm = minidom.parse(strings_cm)

    # Store all differences in this list
    caf_additions = []
    for tag in ('string', 'string-array', 'plurals'):
        # Names are compared per tag, so a <string> never hides a <plurals>.
        base_names = set(
            element.attributes['name'].value
            for element in xml_base.getElementsByTagName(tag)
            if is_candidate(element))
        for element in xml_cm.getElementsByTagName(tag):
            if not is_candidate(element):
                continue
            if element.attributes['name'].value not in base_names:
                caf_additions.append(' ' + element.toxml())

    return caf_additions

Marco Brohet

2014-03-02 17:31:17 +0100

[diff] [blame]

99

def sync_js_translations(sync_type, path, lang=''):
    """Convert between the en.js source strings and per-language XML files.

    sync_type -- 'upload' builds <path>en.xml from <path>en.js. Any other
                 value reads <path><lang>.xml and (re)creates
                 <path><lang>.js, but lines are only written to it when
                 sync_type is 'download'.
    path      -- prefix of all file names; it is concatenated as-is, so a
                 directory needs its trailing separator
    lang      -- language code, required in download mode

    Calls sys.exit() when download mode is requested without a language.
    """
    # lang is necessary in download mode
    if sync_type == 'download' and lang == '':
        sys.exit('Invalid syntax. Language code is required in download mode.')

    # Read source en.js file. This is necessary for both upload and download modes
    with codecs.open(path + 'en.js', 'r', 'utf-8') as f:
        content = f.readlines()

    uploading = sync_type == 'upload'
    translations = {}
    if uploading:
        # Prepare XML file structure
        doc = minidom.Document()
        header = doc.createElement('resources')
        target = path + 'en.xml'
    else:
        # Load the translations before touching the output file, so that a
        # missing or malformed XML file does not leave a truncated .js behind.
        target = path + lang + '.js'
        xml_base = minidom.parse(path + lang + '.xml')
        for tag in xml_base.getElementsByTagName('string'):
            if not tag.hasAttribute('name'):
                continue
            name = tag.attributes['name'].value
            if name not in translations:
                # The first definition of a name wins. An empty element has
                # no child node; None means "keep the English text".
                node = tag.firstChild
                translations[name] = None if node is None else node.nodeValue

    output = []
    # Read each line of en.js
    for a_line in content:
        # Regex to determine string id
        m = re.search(' (.*): [\'|\"]', a_line)
        # Regex to determine string contents (single or double quoted)
        m2 = re.search('\'(.*)\'|"(.*)"', a_line) if m is not None else None
        if m2 is not None:
            string_id = m.group(1).replace(' ', '')
            group = 1 if m2.group(1) is not None else 2
            string_content = m2.group(group)
            if uploading:
                # In upload mode, create the appropriate string element.
                contents = doc.createElement('string')
                contents.attributes['name'] = string_id
                contents.appendChild(doc.createTextNode(string_content))
                header.appendChild(contents)
            else:
                # In download mode, replace the English text with the
                # translation when there is one; otherwise the English text
                # remains, which retains the file structure.
                translation = translations.get(string_id)
                if translation is not None:
                    # Splice by position so that only the quoted text is
                    # replaced, never an identical key or an empty match.
                    # Trailing whitespace of the original text is kept.
                    start = m2.start(group)
                    end = start + len(string_content.rstrip())
                    a_line = a_line[:start] + translation + a_line[end:]

        # In download mode do not write comments.
        # NOTE: this is a substring test, so any line containing '//'
        # (for example a URL inside a string) is dropped as well.
        if sync_type == 'download' and '//' not in a_line:
            # Add language identifier (1)
            if 'cmaccount.l10n.en' in a_line:
                a_line = a_line.replace('l10n.en', 'l10n.' + lang)
            # Add language identifier (2)
            if 'l10n.add(\'en\'' in a_line:
                a_line = a_line.replace('l10n.add(\'en\'', 'l10n.add(\'' + lang + '\'')
            output.append(a_line)

    # Create XML file structure
    if uploading:
        xml_text = header.toxml().replace('<string', '\n <string').replace('</resources>', '\n</resources>')
        output = ['<?xml version="1.0" encoding="utf-8"?>\n', '\n', xml_text]

    # Write everything in one go; the file is closed even if writing fails.
    with codecs.open(target, 'w', 'utf-8') as file_write:
        file_write.write(''.join(output))

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

171

def push_as_commit(path, name):
    """Stage and commit everything in the git repository at *path*.

    path -- repository directory, relative to the current working directory
    name -- repository name; in this function it only appears in the
            status messages

    The push itself is commented out below, so only a local commit is
    created. A failing 'git commit' is reported and otherwise ignored.
    """
    # Get path
    path = os.getcwd() + '/' + path

    # Create git commit
    repo = git.Repo(path)
    repo.git.add(path)
    try:
        repo.git.commit(m='DO NOT MERGE: Automatic translation import test commit')
        # repo.git.push('ssh://cobjeM@review.cyanogenmod.org:29418/' + name, 'HEAD:refs/for/cm-11.0')
    except git.GitCommandError:
        # If git commit fails, it's probably because of no changes.
        # Just continue. Only git failures are caught here, so Ctrl-C and
        # sys.exit() are no longer swallowed.
        print('No commit pushed (probably empty?) for ' + name)
        print('WARNING: If the repository name was not obtained from default.xml, the name might be wrong!')
    else:
        print('Succesfully pushed commit for ' + name)

187

188

print('Welcome to the CM Crowdin sync script!')

print('\nSTEP 0: Checking dependencies')
# Check for Ruby version of crowdin-cli.
# The check passes when the command output contains 'true'. The output is
# matched as a substring because it ends with a newline (and 'rvm all do'
# presumably prints one line per installed Ruby - TODO confirm).
try:
    gem_check = subprocess.check_output(['rvm', 'all', 'do', 'gem', 'list', 'crowdin-cli', '-i'])
except subprocess.CalledProcessError as error:
    # Non-zero exit status; still look at whatever was printed.
    gem_check = error.output or b''
except OSError:
    # rvm itself could not be started.
    gem_check = b''
if b'true' not in gem_check:
    sys.exit('You have not installed crowdin-cli. Terminating.')
else:
    print('Found: crowdin-cli')

# Check for caf.xml
if not os.path.isfile('caf.xml'):
    sys.exit('You have no caf.xml. Terminating.')
else:
    print('Found: caf.xml')

# Check for default.xml
if not os.path.isfile('default.xml'):
    sys.exit('You have no default.xml. Terminating.')
else:
    print('Found: default.xml')

# Check for repo
try:
    subprocess.check_output(['which', 'repo'])
except (OSError, subprocess.CalledProcessError):
    # 'which' is unavailable or reported a non-zero exit status.
    sys.exit('You have not installed repo. Terminating.')

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

211

Marco Brohet

2014-03-08 19:13:07 +0100

[diff] [blame]

212

print('\nSTEP 1: Create cm_caf.xml')
# Load caf.xml
print('Loading caf.xml')
xml = minidom.parse('caf.xml')
items = xml.getElementsByTagName('item')

# Store all created cm_caf.xml files in here.
# Easier to remove them afterwards, as they cannot be committed
cm_caf = []

for item in items:
    # Create tmp dir for download of AOSP base file
    path_to_values = item.attributes["path"].value
    tmp_dir = 'tmp/' + path_to_values
    if not os.path.isdir(tmp_dir):
        os.makedirs(tmp_dir)

    # Collect the contents first, so that a failed download or parse does
    # not leave a half-written cm_caf.xml behind.
    # This means we also support multiple base files (e.g. checking if strings.xml and arrays.xml are changed)
    contents = []
    item_aosp = item.getElementsByTagName('aosp')
    for aosp_item in item_aosp:
        url = aosp_item.firstChild.nodeValue
        xml_file = aosp_item.attributes["file"].value
        path_to_base = 'tmp/' + path_to_values + '/' + xml_file
        path_to_cm = path_to_values + '/' + xml_file
        urlretrieve(url, path_to_base)
        contents.extend(get_caf_additions(path_to_base, path_to_cm))

    # Create cm_caf.xml: header, one line per addition, closing tag.
    # The with-block closes the file even when a write fails.
    cm_caf_path = path_to_values + '/cm_caf.xml'
    with codecs.open(cm_caf_path, 'w', 'utf-8') as f:
        f.write('<?xml version="1.0" encoding="utf-8"?>\n')
        f.write('<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2">\n')
        for addition in contents:
            f.write(addition + '\n')
        f.write('</resources>')
    cm_caf.append(cm_caf_path)
    print('Created ' + cm_caf_path)

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

248

249

# Steps 2 and 3 follow the same pattern: announce the step, run crowdin-cli
# and show whatever it printed.
for step_title, crowdin_command in (
        ('\nSTEP 2: Upload Crowdin source translations', ['crowdin-cli', 'upload', 'sources']),
        ('STEP 3: Download Crowdin translations', ['crowdin-cli', "download"])):
    print(step_title)
    print(subprocess.check_output(crowdin_command))

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

256

Marco Brohet

2014-03-08 19:13:07 +0100

[diff] [blame]

257

print('STEP 4A: Clean up of source cm_caf.xmls')
# Every generated cm_caf.xml was recorded in the list 'cm_caf'; delete them all
for generated_file in cm_caf:
    removal_notice = 'Removing ' + generated_file
    print (removal_notice)
    os.remove(generated_file)

print('\nSTEP 4B: Clean up of temp dir')
# The cm_caf.xml files are no longer needed, so the tmp/ tree can go too
tmp_root = os.getcwd() + '/tmp'
shutil.rmtree(tmp_root)

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

266

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

267

print('\nSTEP 4C: Clean up of empty translations')
# Collect every *.xml file below the current working directory
result = [os.path.join(dp, f) for dp, dn, filenames in os.walk(os.getcwd()) for f in filenames if os.path.splitext(f)[1] == '.xml']
# We hate empty, useless files. Crowdin exports them with <resources/> (sometimes with xliff).
# That means: easy to find
empty_markers = (
    '<resources/>',
    '<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2"/>',
)
for xml_file in result:
    # Read each file once and close it right away instead of leaking up to
    # two open handles per file.
    with open(xml_file) as xml_handle:
        xml_text = xml_handle.read()
    if any(marker in xml_text for marker in empty_markers):
        print ('Removing ' + xml_file)
        os.remove(xml_file)

279

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

280

print('\nSTEP 5: Push translations to Git')

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

281

# Get all files that Crowdin pushed

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

282

proc = subprocess.Popen(['crowdin-cli', 'list', 'sources'],stdout=subprocess.PIPE)

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

283

xml = minidom.parse('default.xml')

284

items = xml.getElementsByTagName('project')

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

285

all_projects = []

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

286

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

287

for path in iter(proc.stdout.readline,''):

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

288

# Remove the \n at the end of each line

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

289

path = path.rstrip()

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

290

# Get project root dir from Crowdin's output

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

291

292

for good_path in m.groups():

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

293

# When a project has multiple translatable files, Crowdin will give duplicates.

294

# We don't want that (useless empty commits), so we save each project in all_projects

295

# and check if it's already in there.

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

296

if good_path is not None and not good_path in all_projects:

297

all_projects.append(good_path)

298

working = 'false'

299

for project_item in items:

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

300

# We need to have the Github repository for the git push url. Obtain them from

301

# default.xml based on the project root dir.

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

302

if project_item.attributes["path"].value == good_path:

303

working = 'true'

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

304

push_as_commit(good_path, project_item.attributes['name'].value)

305

print 'Committing ' + project_item.attributes['name'].value + ' (based on default.xml)'

306

# We also translate repositories that are not downloaded by default (e.g. device parts).

307

# This is just a fallback.

308

# WARNING: If the name is wrong, this will not stop the script.

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

309

if working == 'false':

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

310

push_as_commit(good_path, 'CyanogenMod/android_' + good_path.replace('/', '_'))

311

print 'Committing ' + project_item.attributes['name'].value + ' (workaround)'

Marco Brohet