Blame - cm_crowdin_sync.py - crowdin

2014-02-28 01:06:03 +0100

[diff] [blame]

1

#!/usr/bin/python2

Marco Brohet

f174272

2014-03-04 22:41:18 +0100

[diff] [blame]

2

# -*- coding: utf-8 -*-

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

3

# cm_crowdin_sync.py

4

#

5

# Updates Crowdin source translations and pulls translations

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

6

# directly to CyanogenMod's Git.

#

#

# Licensed under the Apache License, Version 2.0 (the "License");

11

# you may not use this file except in compliance with the License.

12

# You may obtain a copy of the License at

13

#

14

# http://www.apache.org/licenses/LICENSE-2.0

15

#

16

# Unless required by applicable law or agreed to in writing, software

17

# distributed under the License is distributed on an "AS IS" BASIS,

18

# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.

19

# See the License for the specific language governing permissions and

20

# limitations under the License.

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

21

Marco Brohet

f174272

2014-03-04 22:41:18 +0100

[diff] [blame]

22

import codecs

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

23

import git

24

import mmap

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

25

import os

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

import os.path

import re

import shutil

import subprocess

import sys

from urllib import urlretrieve

32

from xml.dom import minidom

33

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

34

def get_caf_additions(strings_base, strings_cm):
    """Return the CM resources that do not exist in the base (AOSP) file.

    Both arguments are handed straight to ``minidom.parse``.  For each of
    the tags ``string``, ``string-array`` and ``plurals`` an element of the
    CM file counts as an addition when no element of the same tag in the
    base file has the same ``name``.  Elements carrying a ``translatable``
    or ``translate`` attribute are ignored on both sides.

    Returns a list of strings, one per addition: the element's XML prefixed
    with a single space.  Additions are grouped by tag (strings first, then
    string-arrays, then plurals) and keep document order within a group.
    """
    xml_base = minidom.parse(strings_base)
    xml_cm = minidom.parse(strings_cm)

    caf_additions = []
    for tag in ('string', 'string-array', 'plurals'):
        # A set gives O(1) membership tests for the comparison below.
        names_base = set(
            node.attributes['name'].value
            for node in xml_base.getElementsByTagName(tag)
            if _is_considered(node))
        # Emit the CM element itself.  Looking it up again by its position
        # in a filtered name list picks the wrong element as soon as one
        # element before it was filtered out.
        for node in xml_cm.getElementsByTagName(tag):
            if not _is_considered(node):
                continue
            if node.attributes['name'].value not in names_base:
                caf_additions.append(' ' + node.toxml())

    # Done :-)
    return caf_additions


def _is_considered(node):
    """Tell whether *node* has neither a 'translatable' nor a 'translate' attribute."""
    return not (node.hasAttribute('translatable') or node.hasAttribute('translate'))

Marco Brohet

2014-03-02 17:31:17 +0100

[diff] [blame]

93

def sync_js_translations(sync_type, path, lang=''):
    """Convert between the en.js string file and Crowdin-style XML.

    ``path`` is used as a plain string prefix (``path + 'en.js'``), so it
    must end with a path separator.

    * ``sync_type == 'upload'``: read ``en.js`` and write ``en.xml`` with
      one ``<string name="id">text</string>`` element per recognised line.
    * ``sync_type == 'download'``: read ``en.js`` and ``<lang>.xml`` and
      write ``<lang>.js``.  Lines containing ``//`` are dropped, English
      text is replaced by the translation whose ``name`` matches the string
      id, and the ``en`` language identifiers are rewritten to ``lang``.
      Strings without a usable translation keep their English text so the
      file structure is retained.

    Exits through ``sys.exit`` when download mode is requested without a
    language code.
    """
    # lang is necessary in download mode
    if sync_type == 'download' and lang == '':
        sys.exit('Invalid syntax. Language code is required in download mode.')

    uploading = sync_type == 'upload'

    # Read source en.js file. This is necessary for both upload and download modes
    with codecs.open(path + 'en.js', 'r', 'utf-8') as f:
        content = f.readlines()

    if uploading:
        # Prepare XML file structure.  Use the imported `minidom` name:
        # `xml` is not imported by this file and is rebound at module level.
        doc = minidom.Document()
        header = doc.createElement('resources')
        out_name = path + 'en.xml'
    else:
        # Parse the translations before opening the output file, so that a
        # missing or broken XML file does not truncate an existing .js file.
        translations = {}
        for node in minidom.parse(path + lang + '.xml').getElementsByTagName('string'):
            # setdefault keeps the first element for a duplicated name.
            translations.setdefault(node.getAttribute('name'), node)
        out_name = path + lang + '.js'

    # The with-block closes the output file even when a line fails to process.
    with codecs.open(out_name, 'w', 'utf-8') as file_write:
        # Read each line of en.js
        for a_line in content:
            # Regex to determine string id
            m = re.search(' (.*): [\'|\"]', a_line)
            # Regex to determine string contents (single or double quoted)
            m2 = re.search('\'(.*)\'|"(.*)"', a_line) if m is not None else None
            if m2 is not None:
                string_id = m.group(1).replace(' ', '')
                # Exactly one of the two alternatives has matched.
                string_content = m2.group(1)
                if string_content is None:
                    string_content = m2.group(2)

                if uploading:
                    # In upload mode, create the appropriate string element.
                    element = doc.createElement('string')
                    element.setAttribute('name', string_id)
                    element.appendChild(doc.createTextNode(string_content))
                    header.appendChild(element)
                else:
                    # In download mode, swap the English text for the
                    # translation when there is one.
                    node = translations.get(string_id)
                    english = string_content.rstrip()
                    translated = None
                    if node is not None and node.firstChild is not None:
                        translated = node.firstChild.nodeValue
                    # An empty search string would make str.replace insert
                    # the translation between every character of the line.
                    if translated is not None and english:
                        a_line = a_line.replace(english, translated)

            # In download mode do not write comments
            if sync_type == 'download' and '//' not in a_line:
                # Add language identifier (1)
                if 'cmaccount.l10n.en' in a_line:
                    a_line = a_line.replace('l10n.en', 'l10n.' + lang)
                # Add language identifier (2)
                if 'l10n.add(\'en\'' in a_line:
                    a_line = a_line.replace('l10n.add(\'en\'', 'l10n.add(\'' + lang + '\'')
                # Now write the line
                file_write.write(a_line)

        # Create XML file structure
        if uploading:
            contents = header.toxml().replace('<string', '\n <string').replace('</resources>', '\n</resources>')
            file_write.write('<?xml version="1.0" encoding="utf-8"?>\n')
            file_write.write('\n')
            file_write.write(contents)

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

165

def push_as_commit(path, name):
    """Stage and commit everything below *path* in its git repository.

    ``path`` is taken relative to the current working directory and must
    be a git repository.  ``name`` is only used in the printed messages
    here; the push that would use it is currently disabled.

    A failing commit is reported and otherwise ignored, because the usual
    cause is that there was nothing to commit.
    """
    # Get path
    path = os.getcwd() + '/' + path

    # Create git commit
    repo = git.Repo(path)
    repo.git.add(path)
    try:
        repo.git.commit(m='DO NOT MERGE: Automatic translation import test commit')
        # repo.git.push('ssh://cobjeM@review.cyanogenmod.org:29418/' + name, 'HEAD:refs/for/cm-11.0')
    except Exception:
        # If git commit fails, it's probably because of no changes.
        # Just continue.  Catching Exception rather than using a bare
        # except lets Ctrl-C and sys.exit() still stop the script.
        print('No commit pushed (probably empty?) for ' + name)
        print('WARNING: If the repository name was not obtained from default.xml, the name might be wrong!')
    else:
        print('Succesfully pushed commit for ' + name)

181

182

print('Welcome to the CM Crowdin sync script!')

print('\nSTEP 0: Checking dependencies')
# Check for Ruby version of crowdin-cli.
# 'gem list <name> -i' prints 'true' followed by a newline when the gem is
# installed and exits non-zero otherwise, which makes check_output raise.
# Hence the substring test instead of an equality test, and the except
# clause covering a missing gem as well as a missing rvm.
# NOTE(review): with 'rvm all do' the output may hold one line per Ruby;
# this accepts the gem being present in any of them - confirm that is intended.
try:
    gem_check = subprocess.check_output(['rvm', 'all', 'do', 'gem', 'list', 'crowdin-cli', '-i'])
except (OSError, subprocess.CalledProcessError):
    gem_check = ''
if 'true' not in gem_check:
    sys.exit('You have not installed crowdin-cli. Terminating.')
print('Found: crowdin-cli')

# Check for caf.xml
if not os.path.isfile('caf.xml'):
    sys.exit('You have no caf.xml. Terminating.')
print('Found: caf.xml')

# Check for default.xml
if not os.path.isfile('default.xml'):
    sys.exit('You have no default.xml. Terminating.')
print('Found: default.xml')

# Check for repo.
# OSError: 'which' itself could not be started.
# CalledProcessError: 'which' did not find repo.
try:
    subprocess.check_output(['which', 'repo'])
except (OSError, subprocess.CalledProcessError):
    sys.exit('You have not installed repo. Terminating.')

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

205

Marco Brohet

2014-02-28 21:01:26 +0100

[diff] [blame]

206

print('\nSTEP 1: Create cm_caf.xml')
# Load caf.xml
print('Loading caf.xml')
xml = minidom.parse('caf.xml')
items = xml.getElementsByTagName('item')

# Store all created cm_caf.xml files in here.
# Easier to remove them afterwards, as they cannot be committed
cm_caf = []

for item in items:
    # Create tmp dir for download of AOSP base file
    path_to_values = item.attributes["path"].value
    tmp_values_dir = 'tmp/' + path_to_values
    if not os.path.isdir(tmp_values_dir):
        os.makedirs(tmp_values_dir)

    # Collect the additions before touching cm_caf.xml, so that a failed
    # download or parse does not leave a half-written, untracked file behind.
    # This means we also support multiple base files (e.g. checking if strings.xml and arrays.xml are changed)
    contents = []
    for aosp_item in item.getElementsByTagName('aosp'):
        url = aosp_item.firstChild.nodeValue
        xml_file = aosp_item.attributes["file"].value
        path_to_base = tmp_values_dir + '/' + xml_file
        path_to_cm = path_to_values + '/' + xml_file
        urlretrieve(url, path_to_base)
        contents.extend(get_caf_additions(path_to_base, path_to_cm))

    # Create cm_caf.xml: header, contents, footer
    cm_caf_path = path_to_values + '/cm_caf.xml'
    with codecs.open(cm_caf_path, 'w', 'utf-8') as f:
        f.write('<?xml version="1.0" encoding="utf-8"?>\n')
        f.write('<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2">\n')
        for addition in contents:
            f.write(addition + '\n')
        f.write('</resources>')
    cm_caf.append(cm_caf_path)
    print('Created ' + cm_caf_path)

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

242

243

print('\nSTEP 2: Upload Crowdin source translations')
# Run 'crowdin-cli upload sources' and echo what it printed
upload_output = subprocess.check_output(['crowdin-cli', 'upload', 'sources'])
print(upload_output)

print('STEP 3: Download Crowdin translations')
# Run 'crowdin-cli download' and echo what it printed
download_output = subprocess.check_output(['crowdin-cli', "download"])
print(download_output)

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

250

Marco Brohet

2014-02-28 18:48:17 +0100

[diff] [blame]

251

print('STEP 4A: Clean up of source cm_caf.xmls')
# Remove all cm_caf.xml files, which you can find in the list 'cm_caf'
for cm_caf_file in cm_caf:
    print('Removing ' + cm_caf_file)
    os.remove(cm_caf_file)

print('\nSTEP 4B: Clean up of temp dir')
# We are done with cm_caf.xml files, so remove tmp/
# tmp/ only exists when caf.xml listed at least one item.
tmp_root = os.getcwd() + '/tmp'
if os.path.isdir(tmp_root):
    shutil.rmtree(tmp_root)

print('\nSTEP 4C: Clean up of empty translations')
# We hate empty, useless files. Crowdin exports them with <resources/> (sometimes with xliff).
# That means: easy to find
empty_markers = (
    '<resources/>',
    '<resources xmlns:xliff="urn:oasis:names:tc:xliff:document:1.2"/>',
)
# Every .xml file below the current working directory
result = [os.path.join(dp, f) for dp, dn, filenames in os.walk(os.getcwd()) for f in filenames if os.path.splitext(f)[1] == '.xml']
for xml_file in result:
    # Read each file once and close it before it may be removed.
    with open(xml_file) as xml_handle:
        xml_text = xml_handle.read()
    if any(marker in xml_text for marker in empty_markers):
        print('Removing ' + xml_file)
        os.remove(xml_file)

273

Marco Brohet

2014-02-28 01:06:03 +0100

[diff] [blame]

274

print('\nSTEP 5: Push translations to Git')
# Get all files that Crowdin pushed
proc = subprocess.Popen(['crowdin-cli', 'list', 'sources'], stdout=subprocess.PIPE)
xml = minidom.parse('default.xml')
items = xml.getElementsByTagName('project')
all_projects = []

for path in iter(proc.stdout.readline, ''):
    # Remove the \n at the end of each line
    path = path.rstrip()
    # Get project root dir from Crowdin's output
    # NOTE(review): the statement that bound `m` is missing from the visible
    # source, so `m` was undefined at this point.  The pattern below is a
    # minimal stand-in that assumes lines look like
    # '/<project root>/res/values...'.  Restore the original expression from
    # the file's history (it may special-case some projects) before relying
    # on this.
    m = re.search('/(.*)/res/values.*', path)
    if m is None:
        # Not a line that names a translatable resource file.
        continue
    for good_path in m.groups():
        # When a project has multiple translatable files, Crowdin will give duplicates.
        # We don't want that (useless empty commits), so we save each project in all_projects
        # and check if it's already in there.
        if good_path is None or good_path in all_projects:
            continue
        all_projects.append(good_path)
        working = False
        for project_item in items:
            # We need to have the Github repository for the git push url. Obtain them from
            # default.xml based on the project root dir.
            if project_item.attributes["path"].value == good_path:
                working = True
                project_name = project_item.attributes['name'].value
                push_as_commit(good_path, project_name)
                print('Committing ' + project_name + ' (based on default.xml)')
        # We also translate repositories that are not downloaded by default (e.g. device parts).
        # This is just a fallback.
        # WARNING: If the name is wrong, this will not stop the script.
        if not working:
            fallback_name = 'CyanogenMod/android_' + good_path.replace('/', '_')
            push_as_commit(good_path, fallback_name)
            # Report the name that was actually used, not the name of
            # whichever project the loop above happened to end on.
            print('Committing ' + fallback_name + ' (workaround)')

# Release the pipe and reap the child process.
proc.stdout.close()
proc.wait()

Marco Brohet