blob: ded34b9795db512ce8ac903cdd9bb35c8bd76306 [file] [log] [blame]
Doug Zongker424296a2014-09-02 08:53:09 -07001# Copyright (C) 2014 The Android Open Source Project
2#
3# Licensed under the Apache License, Version 2.0 (the "License");
4# you may not use this file except in compliance with the License.
5# You may obtain a copy of the License at
6#
7# http://www.apache.org/licenses/LICENSE-2.0
8#
9# Unless required by applicable law or agreed to in writing, software
10# distributed under the License is distributed on an "AS IS" BASIS,
11# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12# See the License for the specific language governing permissions and
13# limitations under the License.
14
Doug Zongkerfc44a512014-08-26 13:10:25 -070015from __future__ import print_function
16
17from collections import deque, OrderedDict
18from hashlib import sha1
Doug Zongker6ab2a502016-02-09 08:28:09 -080019import array
Tao Bao8dcf7382015-05-21 14:09:49 -070020import common
Doug Zongker6ab2a502016-02-09 08:28:09 -080021import functools
Doug Zongker62338182014-09-08 08:29:55 -070022import heapq
Doug Zongkerfc44a512014-08-26 13:10:25 -070023import itertools
24import multiprocessing
25import os
Doug Zongkerfc44a512014-08-26 13:10:25 -070026import re
27import subprocess
Doug Zongkerfc44a512014-08-26 13:10:25 -070028import threading
Doug Zongker6ab2a502016-02-09 08:28:09 -080029import time
Doug Zongkerfc44a512014-08-26 13:10:25 -070030import tempfile
31
Dan Albert8b72aef2015-03-23 19:13:21 -070032from rangelib import RangeSet
33
Doug Zongkerfc44a512014-08-26 13:10:25 -070034
Doug Zongkerab7ca1d2014-08-26 10:40:28 -070035__all__ = ["EmptyImage", "DataImage", "BlockImageDiff"]
36
Dan Albert8b72aef2015-03-23 19:13:21 -070037
Doug Zongkerfc44a512014-08-26 13:10:25 -070038def compute_patch(src, tgt, imgdiff=False):
39 srcfd, srcfile = tempfile.mkstemp(prefix="src-")
40 tgtfd, tgtfile = tempfile.mkstemp(prefix="tgt-")
41 patchfd, patchfile = tempfile.mkstemp(prefix="patch-")
42 os.close(patchfd)
43
44 try:
45 with os.fdopen(srcfd, "wb") as f_src:
46 for p in src:
47 f_src.write(p)
48
49 with os.fdopen(tgtfd, "wb") as f_tgt:
50 for p in tgt:
51 f_tgt.write(p)
52 try:
53 os.unlink(patchfile)
54 except OSError:
55 pass
56 if imgdiff:
57 p = subprocess.call(["imgdiff", "-z", srcfile, tgtfile, patchfile],
58 stdout=open("/dev/null", "a"),
59 stderr=subprocess.STDOUT)
60 else:
61 p = subprocess.call(["bsdiff", srcfile, tgtfile, patchfile])
62
63 if p:
64 raise ValueError("diff failed: " + str(p))
65
66 with open(patchfile, "rb") as f:
67 return f.read()
68 finally:
69 try:
70 os.unlink(srcfile)
71 os.unlink(tgtfile)
72 os.unlink(patchfile)
73 except OSError:
74 pass
75
Dan Albert8b72aef2015-03-23 19:13:21 -070076
class Image(object):
  """Abstract interface for partition images used by BlockImageDiff."""

  def ReadRangeSet(self, ranges):
    """Return the data for the given block ranges; subclasses override."""
    raise NotImplementedError

  def TotalSha1(self, include_clobbered_blocks=False):
    """Return the hex SHA-1 over the image's data; subclasses override."""
    raise NotImplementedError
84
class EmptyImage(Image):
  """A zero-length image: no blocks, no data, empty file map."""
  blocksize = 4096
  care_map = RangeSet()
  clobbered_blocks = RangeSet()
  extended = RangeSet()
  total_blocks = 0
  file_map = {}

  def ReadRangeSet(self, ranges):
    """There is no data; every range reads back empty."""
    return ()

  def TotalSha1(self, include_clobbered_blocks=False):
    """Return the SHA-1 of zero bytes.

    EmptyImage always carries empty clobbered_blocks, so the
    include_clobbered_blocks flag makes no difference and is ignored.
    """
    assert self.clobbered_blocks.size() == 0
    return sha1().hexdigest()
100
101
Dan Albert8b72aef2015-03-23 19:13:21 -0700102class DataImage(Image):
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700103 """An image wrapped around a single string of data."""
104
105 def __init__(self, data, trim=False, pad=False):
106 self.data = data
107 self.blocksize = 4096
108
109 assert not (trim and pad)
110
111 partial = len(self.data) % self.blocksize
Tao Bao7589e962015-09-05 20:35:32 -0700112 padded = False
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700113 if partial > 0:
114 if trim:
115 self.data = self.data[:-partial]
116 elif pad:
117 self.data += '\0' * (self.blocksize - partial)
Tao Bao7589e962015-09-05 20:35:32 -0700118 padded = True
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700119 else:
120 raise ValueError(("data for DataImage must be multiple of %d bytes "
121 "unless trim or pad is specified") %
122 (self.blocksize,))
123
124 assert len(self.data) % self.blocksize == 0
125
126 self.total_blocks = len(self.data) / self.blocksize
127 self.care_map = RangeSet(data=(0, self.total_blocks))
Tao Bao7589e962015-09-05 20:35:32 -0700128 # When the last block is padded, we always write the whole block even for
129 # incremental OTAs. Because otherwise the last block may get skipped if
130 # unchanged for an incremental, but would fail the post-install
131 # verification if it has non-zero contents in the padding bytes.
132 # Bug: 23828506
133 if padded:
Tao Bao42206c32015-09-08 13:39:40 -0700134 clobbered_blocks = [self.total_blocks-1, self.total_blocks]
Tao Bao7589e962015-09-05 20:35:32 -0700135 else:
Tao Bao42206c32015-09-08 13:39:40 -0700136 clobbered_blocks = []
137 self.clobbered_blocks = clobbered_blocks
Tao Baoe9b61912015-07-09 17:37:49 -0700138 self.extended = RangeSet()
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700139
140 zero_blocks = []
141 nonzero_blocks = []
142 reference = '\0' * self.blocksize
143
Tao Bao7589e962015-09-05 20:35:32 -0700144 for i in range(self.total_blocks-1 if padded else self.total_blocks):
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700145 d = self.data[i*self.blocksize : (i+1)*self.blocksize]
146 if d == reference:
147 zero_blocks.append(i)
148 zero_blocks.append(i+1)
149 else:
150 nonzero_blocks.append(i)
151 nonzero_blocks.append(i+1)
152
Tao Bao42206c32015-09-08 13:39:40 -0700153 assert zero_blocks or nonzero_blocks or clobbered_blocks
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700154
Tao Bao42206c32015-09-08 13:39:40 -0700155 self.file_map = dict()
156 if zero_blocks:
157 self.file_map["__ZERO"] = RangeSet(data=zero_blocks)
158 if nonzero_blocks:
159 self.file_map["__NONZERO"] = RangeSet(data=nonzero_blocks)
160 if clobbered_blocks:
161 self.file_map["__COPY"] = RangeSet(data=clobbered_blocks)
Tao Bao7589e962015-09-05 20:35:32 -0700162
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700163 def ReadRangeSet(self, ranges):
164 return [self.data[s*self.blocksize:e*self.blocksize] for (s, e) in ranges]
165
Tao Bao68658c02015-06-01 13:40:49 -0700166 def TotalSha1(self, include_clobbered_blocks=False):
Tao Bao7589e962015-09-05 20:35:32 -0700167 if not include_clobbered_blocks:
168 ranges = self.care_map.subtract(self.clobbered_blocks)
169 return sha1(self.ReadRangeSet(ranges)).hexdigest()
170 else:
171 return sha1(self.data).hexdigest()
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700172
Doug Zongkerfc44a512014-08-26 13:10:25 -0700173
class Transfer(object):
  """One command in the transfer list: produce tgt_ranges from src_ranges."""

  def __init__(self, tgt_name, src_name, tgt_ranges, src_ranges, style, by_id):
    self.tgt_name = tgt_name
    self.src_name = src_name
    self.tgt_ranges = tgt_ranges
    self.src_ranges = src_ranges
    self.style = style
    # "Intact" means both range sets are monotonic (in-order on disk).
    self.intact = (getattr(tgt_ranges, "monotonic", False) and
                   getattr(src_ranges, "monotonic", False))

    # We use OrderedDict rather than dict so that the output is repeatable;
    # otherwise it would depend on the hash values of the Transfer objects.
    self.goes_before = OrderedDict()
    self.goes_after = OrderedDict()

    self.stash_before = []
    self.use_stash = []

    self.id = len(by_id)
    by_id.append(self)

  def NetStashChange(self):
    """Return blocks this command stashes minus blocks it unstashes."""
    stored = sum(sr.size() for (_, sr) in self.stash_before)
    freed = sum(sr.size() for (_, sr) in self.use_stash)
    return stored - freed

  def ConvertToNew(self):
    """Rewrite this command as a "new" command that reads no source data."""
    assert self.style != "new"
    self.use_stash = []
    self.style = "new"
    self.src_ranges = RangeSet()

  def __str__(self):
    return "%d: <%s %s to %s>" % (
        self.id, self.src_ranges, self.style, self.tgt_ranges)
208
209
Doug Zongker6ab2a502016-02-09 08:28:09 -0800210@functools.total_ordering
211class HeapItem(object):
212 def __init__(self, item):
213 self.item = item
214 # Negate the score since python's heap is a min-heap and we want
215 # the maximum score.
216 self.score = -item.score
217 def clear(self):
218 self.item = None
219 def __bool__(self):
220 return self.item is None
221 def __eq__(self, other):
222 return self.score == other.score
223 def __le__(self, other):
224 return self.score <= other.score
225
226
Doug Zongkerfc44a512014-08-26 13:10:25 -0700227# BlockImageDiff works on two image objects. An image object is
228# anything that provides the following attributes:
229#
230# blocksize: the size in bytes of a block, currently must be 4096.
231#
232# total_blocks: the total size of the partition/image, in blocks.
233#
234# care_map: a RangeSet containing which blocks (in the range [0,
235# total_blocks) we actually care about; i.e. which blocks contain
236# data.
237#
238# file_map: a dict that partitions the blocks contained in care_map
239# into smaller domains that are useful for doing diffs on.
240# (Typically a domain is a file, and the key in file_map is the
241# pathname.)
242#
Tao Baoff777812015-05-12 11:42:31 -0700243# clobbered_blocks: a RangeSet containing which blocks contain data
244# but may be altered by the FS. They need to be excluded when
245# verifying the partition integrity.
246#
Doug Zongkerfc44a512014-08-26 13:10:25 -0700247# ReadRangeSet(): a function that takes a RangeSet and returns the
248# data contained in the image blocks of that RangeSet. The data
249# is returned as a list or tuple of strings; concatenating the
250# elements together should produce the requested data.
251# Implementations are free to break up the data into list/tuple
252# elements in any way that is convenient.
253#
# TotalSha1(): a function that returns (as a hex string) the SHA-1
# hash of all the data in the image (i.e., all the blocks in the
# care_map minus clobbered_blocks, or including the clobbered
# blocks if include_clobbered_blocks is True).
Doug Zongkerab7ca1d2014-08-26 10:40:28 -0700258#
Doug Zongkerfc44a512014-08-26 13:10:25 -0700259# When creating a BlockImageDiff, the src image may be None, in which
260# case the list of transfers produced will never read from the
261# original image.
262
263class BlockImageDiff(object):
Tao Bao293fd132016-06-11 12:19:23 -0700264 def __init__(self, tgt, src=None, threads=None, version=4,
265 disable_imgdiff=False):
Doug Zongkerfc44a512014-08-26 13:10:25 -0700266 if threads is None:
267 threads = multiprocessing.cpu_count() // 2
Dan Albert8b72aef2015-03-23 19:13:21 -0700268 if threads == 0:
269 threads = 1
Doug Zongkerfc44a512014-08-26 13:10:25 -0700270 self.threads = threads
Doug Zongker62338182014-09-08 08:29:55 -0700271 self.version = version
Dan Albert8b72aef2015-03-23 19:13:21 -0700272 self.transfers = []
273 self.src_basenames = {}
274 self.src_numpatterns = {}
Tao Baob4cfca52016-02-04 14:26:02 -0800275 self._max_stashed_size = 0
Tao Baod522bdc2016-04-12 15:53:16 -0700276 self.touched_src_ranges = RangeSet()
277 self.touched_src_sha1 = None
Tao Bao293fd132016-06-11 12:19:23 -0700278 self.disable_imgdiff = disable_imgdiff
Doug Zongker62338182014-09-08 08:29:55 -0700279
Tao Baoeba409c2015-10-21 13:30:43 -0700280 assert version in (1, 2, 3, 4)
Doug Zongkerfc44a512014-08-26 13:10:25 -0700281
282 self.tgt = tgt
283 if src is None:
284 src = EmptyImage()
285 self.src = src
286
287 # The updater code that installs the patch always uses 4k blocks.
288 assert tgt.blocksize == 4096
289 assert src.blocksize == 4096
290
291 # The range sets in each filemap should comprise a partition of
292 # the care map.
293 self.AssertPartition(src.care_map, src.file_map.values())
294 self.AssertPartition(tgt.care_map, tgt.file_map.values())
295
Tao Baob4cfca52016-02-04 14:26:02 -0800296 @property
297 def max_stashed_size(self):
298 return self._max_stashed_size
299
Doug Zongkerfc44a512014-08-26 13:10:25 -0700300 def Compute(self, prefix):
301 # When looking for a source file to use as the diff input for a
302 # target file, we try:
303 # 1) an exact path match if available, otherwise
304 # 2) a exact basename match if available, otherwise
305 # 3) a basename match after all runs of digits are replaced by
306 # "#" if available, otherwise
307 # 4) we have no source for this target.
308 self.AbbreviateSourceNames()
309 self.FindTransfers()
310
311 # Find the ordering dependencies among transfers (this is O(n^2)
312 # in the number of transfers).
313 self.GenerateDigraph()
314 # Find a sequence of transfers that satisfies as many ordering
315 # dependencies as possible (heuristically).
316 self.FindVertexSequence()
317 # Fix up the ordering dependencies that the sequence didn't
318 # satisfy.
Doug Zongker62338182014-09-08 08:29:55 -0700319 if self.version == 1:
320 self.RemoveBackwardEdges()
321 else:
322 self.ReverseBackwardEdges()
323 self.ImproveVertexSequence()
324
Tao Bao82c47982015-08-17 09:45:13 -0700325 # Ensure the runtime stash size is under the limit.
326 if self.version >= 2 and common.OPTIONS.cache_size is not None:
327 self.ReviseStashSize()
328
Doug Zongkerfc44a512014-08-26 13:10:25 -0700329 # Double-check our work.
330 self.AssertSequenceGood()
331
332 self.ComputePatches(prefix)
333 self.WriteTransfers(prefix)
334
Dan Albert8b72aef2015-03-23 19:13:21 -0700335 def HashBlocks(self, source, ranges): # pylint: disable=no-self-use
Sami Tolvanendd67a292014-12-09 16:40:34 +0000336 data = source.ReadRangeSet(ranges)
337 ctx = sha1()
338
339 for p in data:
340 ctx.update(p)
341
342 return ctx.hexdigest()
343
Doug Zongkerfc44a512014-08-26 13:10:25 -0700344 def WriteTransfers(self, prefix):
Tianjie Xu37e29302016-06-23 16:10:35 -0700345 def WriteSplitTransfers(out, style, target_blocks):
346 """Limit the size of operand in command 'new' and 'zero' to 1024 blocks.
Tianjie Xubb848c52016-06-21 15:54:09 -0700347
348 This prevents the target size of one command from being too large; and
349 might help to avoid fsync errors on some devices."""
350
Tianjie Xu37e29302016-06-23 16:10:35 -0700351 assert (style == "new" or style == "zero")
352 blocks_limit = 1024
Tianjie Xubb848c52016-06-21 15:54:09 -0700353 total = 0
Tianjie Xu37e29302016-06-23 16:10:35 -0700354 while target_blocks:
355 blocks_to_write = target_blocks.first(blocks_limit)
356 out.append("%s %s\n" % (style, blocks_to_write.to_string_raw()))
357 total += blocks_to_write.size()
358 target_blocks = target_blocks.subtract(blocks_to_write)
Tianjie Xubb848c52016-06-21 15:54:09 -0700359 return total
360
Doug Zongkerfc44a512014-08-26 13:10:25 -0700361 out = []
362
Doug Zongkerfc44a512014-08-26 13:10:25 -0700363 total = 0
Doug Zongkerfc44a512014-08-26 13:10:25 -0700364
Doug Zongker62338182014-09-08 08:29:55 -0700365 stashes = {}
366 stashed_blocks = 0
367 max_stashed_blocks = 0
368
369 free_stash_ids = []
370 next_stash_id = 0
371
Doug Zongkerfc44a512014-08-26 13:10:25 -0700372 for xf in self.transfers:
373
Doug Zongker62338182014-09-08 08:29:55 -0700374 if self.version < 2:
375 assert not xf.stash_before
376 assert not xf.use_stash
377
378 for s, sr in xf.stash_before:
379 assert s not in stashes
380 if free_stash_ids:
381 sid = heapq.heappop(free_stash_ids)
382 else:
383 sid = next_stash_id
384 next_stash_id += 1
385 stashes[s] = sid
Sami Tolvanendd67a292014-12-09 16:40:34 +0000386 if self.version == 2:
caozhiyuan21b37d82015-10-21 15:14:03 +0800387 stashed_blocks += sr.size()
Sami Tolvanendd67a292014-12-09 16:40:34 +0000388 out.append("stash %d %s\n" % (sid, sr.to_string_raw()))
389 else:
390 sh = self.HashBlocks(self.src, sr)
391 if sh in stashes:
392 stashes[sh] += 1
393 else:
394 stashes[sh] = 1
caozhiyuan21b37d82015-10-21 15:14:03 +0800395 stashed_blocks += sr.size()
Tao Baod522bdc2016-04-12 15:53:16 -0700396 self.touched_src_ranges = self.touched_src_ranges.union(sr)
Sami Tolvanendd67a292014-12-09 16:40:34 +0000397 out.append("stash %s %s\n" % (sh, sr.to_string_raw()))
Doug Zongker62338182014-09-08 08:29:55 -0700398
399 if stashed_blocks > max_stashed_blocks:
400 max_stashed_blocks = stashed_blocks
401
Jesse Zhao7b985f62015-03-02 16:53:08 -0800402 free_string = []
caozhiyuan21b37d82015-10-21 15:14:03 +0800403 free_size = 0
Jesse Zhao7b985f62015-03-02 16:53:08 -0800404
Doug Zongker62338182014-09-08 08:29:55 -0700405 if self.version == 1:
Tao Bao4fcb77e2015-10-21 13:36:01 -0700406 src_str = xf.src_ranges.to_string_raw() if xf.src_ranges else ""
Sami Tolvanendd67a292014-12-09 16:40:34 +0000407 elif self.version >= 2:
Doug Zongker62338182014-09-08 08:29:55 -0700408
409 # <# blocks> <src ranges>
410 # OR
411 # <# blocks> <src ranges> <src locs> <stash refs...>
412 # OR
413 # <# blocks> - <stash refs...>
414
415 size = xf.src_ranges.size()
Dan Albert8b72aef2015-03-23 19:13:21 -0700416 src_str = [str(size)]
Doug Zongker62338182014-09-08 08:29:55 -0700417
418 unstashed_src_ranges = xf.src_ranges
419 mapped_stashes = []
420 for s, sr in xf.use_stash:
Tao Baoe27acfd2016-12-16 11:13:55 -0800421 # TODO: We don't need 'sid' (nor free_stash_ids) in BBOTA v3+.
Doug Zongker62338182014-09-08 08:29:55 -0700422 sid = stashes.pop(s)
Doug Zongker62338182014-09-08 08:29:55 -0700423 unstashed_src_ranges = unstashed_src_ranges.subtract(sr)
Sami Tolvanendd67a292014-12-09 16:40:34 +0000424 sh = self.HashBlocks(self.src, sr)
Doug Zongker62338182014-09-08 08:29:55 -0700425 sr = xf.src_ranges.map_within(sr)
426 mapped_stashes.append(sr)
Sami Tolvanendd67a292014-12-09 16:40:34 +0000427 if self.version == 2:
Dan Albert8b72aef2015-03-23 19:13:21 -0700428 src_str.append("%d:%s" % (sid, sr.to_string_raw()))
Tao Baobb625d22015-08-13 14:44:15 -0700429 # A stash will be used only once. We need to free the stash
430 # immediately after the use, instead of waiting for the automatic
431 # clean-up at the end. Because otherwise it may take up extra space
432 # and lead to OTA failures.
433 # Bug: 23119955
434 free_string.append("free %d\n" % (sid,))
caozhiyuan21b37d82015-10-21 15:14:03 +0800435 free_size += sr.size()
Sami Tolvanendd67a292014-12-09 16:40:34 +0000436 else:
437 assert sh in stashes
Dan Albert8b72aef2015-03-23 19:13:21 -0700438 src_str.append("%s:%s" % (sh, sr.to_string_raw()))
Sami Tolvanendd67a292014-12-09 16:40:34 +0000439 stashes[sh] -= 1
440 if stashes[sh] == 0:
caozhiyuan21b37d82015-10-21 15:14:03 +0800441 free_size += sr.size()
Tao Baoe27acfd2016-12-16 11:13:55 -0800442 free_string.append("free %s\n" % (sh,))
Sami Tolvanendd67a292014-12-09 16:40:34 +0000443 stashes.pop(sh)
Doug Zongker62338182014-09-08 08:29:55 -0700444 heapq.heappush(free_stash_ids, sid)
445
446 if unstashed_src_ranges:
Dan Albert8b72aef2015-03-23 19:13:21 -0700447 src_str.insert(1, unstashed_src_ranges.to_string_raw())
Doug Zongker62338182014-09-08 08:29:55 -0700448 if xf.use_stash:
449 mapped_unstashed = xf.src_ranges.map_within(unstashed_src_ranges)
Dan Albert8b72aef2015-03-23 19:13:21 -0700450 src_str.insert(2, mapped_unstashed.to_string_raw())
Doug Zongker62338182014-09-08 08:29:55 -0700451 mapped_stashes.append(mapped_unstashed)
452 self.AssertPartition(RangeSet(data=(0, size)), mapped_stashes)
453 else:
Dan Albert8b72aef2015-03-23 19:13:21 -0700454 src_str.insert(1, "-")
Doug Zongker62338182014-09-08 08:29:55 -0700455 self.AssertPartition(RangeSet(data=(0, size)), mapped_stashes)
456
Dan Albert8b72aef2015-03-23 19:13:21 -0700457 src_str = " ".join(src_str)
Doug Zongker62338182014-09-08 08:29:55 -0700458
Sami Tolvanendd67a292014-12-09 16:40:34 +0000459 # all versions:
Doug Zongker62338182014-09-08 08:29:55 -0700460 # zero <rangeset>
461 # new <rangeset>
462 # erase <rangeset>
463 #
464 # version 1:
465 # bsdiff patchstart patchlen <src rangeset> <tgt rangeset>
466 # imgdiff patchstart patchlen <src rangeset> <tgt rangeset>
467 # move <src rangeset> <tgt rangeset>
468 #
469 # version 2:
Dan Albert8b72aef2015-03-23 19:13:21 -0700470 # bsdiff patchstart patchlen <tgt rangeset> <src_str>
471 # imgdiff patchstart patchlen <tgt rangeset> <src_str>
472 # move <tgt rangeset> <src_str>
Sami Tolvanendd67a292014-12-09 16:40:34 +0000473 #
474 # version 3:
Dan Albert8b72aef2015-03-23 19:13:21 -0700475 # bsdiff patchstart patchlen srchash tgthash <tgt rangeset> <src_str>
476 # imgdiff patchstart patchlen srchash tgthash <tgt rangeset> <src_str>
477 # move hash <tgt rangeset> <src_str>
Doug Zongkerfc44a512014-08-26 13:10:25 -0700478
479 tgt_size = xf.tgt_ranges.size()
480
481 if xf.style == "new":
482 assert xf.tgt_ranges
Tianjie Xu37e29302016-06-23 16:10:35 -0700483 assert tgt_size == WriteSplitTransfers(out, xf.style, xf.tgt_ranges)
Doug Zongkerfc44a512014-08-26 13:10:25 -0700484 total += tgt_size
485 elif xf.style == "move":
Doug Zongkerfc44a512014-08-26 13:10:25 -0700486 assert xf.tgt_ranges
487 assert xf.src_ranges.size() == tgt_size
488 if xf.src_ranges != xf.tgt_ranges:
Doug Zongker62338182014-09-08 08:29:55 -0700489 if self.version == 1:
490 out.append("%s %s %s\n" % (
491 xf.style,
492 xf.src_ranges.to_string_raw(), xf.tgt_ranges.to_string_raw()))
493 elif self.version == 2:
494 out.append("%s %s %s\n" % (
495 xf.style,
Dan Albert8b72aef2015-03-23 19:13:21 -0700496 xf.tgt_ranges.to_string_raw(), src_str))
Sami Tolvanendd67a292014-12-09 16:40:34 +0000497 elif self.version >= 3:
Sami Tolvanen29f529f2015-04-17 16:28:08 +0100498 # take into account automatic stashing of overlapping blocks
499 if xf.src_ranges.overlaps(xf.tgt_ranges):
Tao Baoe9b61912015-07-09 17:37:49 -0700500 temp_stash_usage = stashed_blocks + xf.src_ranges.size()
Sami Tolvanen29f529f2015-04-17 16:28:08 +0100501 if temp_stash_usage > max_stashed_blocks:
502 max_stashed_blocks = temp_stash_usage
503
Tao Baod522bdc2016-04-12 15:53:16 -0700504 self.touched_src_ranges = self.touched_src_ranges.union(
505 xf.src_ranges)
506
Sami Tolvanendd67a292014-12-09 16:40:34 +0000507 out.append("%s %s %s %s\n" % (
508 xf.style,
509 self.HashBlocks(self.tgt, xf.tgt_ranges),
Dan Albert8b72aef2015-03-23 19:13:21 -0700510 xf.tgt_ranges.to_string_raw(), src_str))
Doug Zongkerfc44a512014-08-26 13:10:25 -0700511 total += tgt_size
512 elif xf.style in ("bsdiff", "imgdiff"):
Doug Zongkerfc44a512014-08-26 13:10:25 -0700513 assert xf.tgt_ranges
514 assert xf.src_ranges
Doug Zongker62338182014-09-08 08:29:55 -0700515 if self.version == 1:
516 out.append("%s %d %d %s %s\n" % (
517 xf.style, xf.patch_start, xf.patch_len,
518 xf.src_ranges.to_string_raw(), xf.tgt_ranges.to_string_raw()))
519 elif self.version == 2:
520 out.append("%s %d %d %s %s\n" % (
521 xf.style, xf.patch_start, xf.patch_len,
Dan Albert8b72aef2015-03-23 19:13:21 -0700522 xf.tgt_ranges.to_string_raw(), src_str))
Sami Tolvanendd67a292014-12-09 16:40:34 +0000523 elif self.version >= 3:
Sami Tolvanen29f529f2015-04-17 16:28:08 +0100524 # take into account automatic stashing of overlapping blocks
525 if xf.src_ranges.overlaps(xf.tgt_ranges):
Tao Baoe9b61912015-07-09 17:37:49 -0700526 temp_stash_usage = stashed_blocks + xf.src_ranges.size()
Sami Tolvanen29f529f2015-04-17 16:28:08 +0100527 if temp_stash_usage > max_stashed_blocks:
528 max_stashed_blocks = temp_stash_usage
529
Tao Baod522bdc2016-04-12 15:53:16 -0700530 self.touched_src_ranges = self.touched_src_ranges.union(
531 xf.src_ranges)
532
Sami Tolvanendd67a292014-12-09 16:40:34 +0000533 out.append("%s %d %d %s %s %s %s\n" % (
534 xf.style,
535 xf.patch_start, xf.patch_len,
536 self.HashBlocks(self.src, xf.src_ranges),
537 self.HashBlocks(self.tgt, xf.tgt_ranges),
Dan Albert8b72aef2015-03-23 19:13:21 -0700538 xf.tgt_ranges.to_string_raw(), src_str))
Doug Zongkerfc44a512014-08-26 13:10:25 -0700539 total += tgt_size
540 elif xf.style == "zero":
541 assert xf.tgt_ranges
542 to_zero = xf.tgt_ranges.subtract(xf.src_ranges)
Tianjie Xu37e29302016-06-23 16:10:35 -0700543 assert WriteSplitTransfers(out, xf.style, to_zero) == to_zero.size()
Tianjie Xubb848c52016-06-21 15:54:09 -0700544 total += to_zero.size()
Doug Zongkerfc44a512014-08-26 13:10:25 -0700545 else:
Dan Albert8b72aef2015-03-23 19:13:21 -0700546 raise ValueError("unknown transfer style '%s'\n" % xf.style)
Doug Zongkerfc44a512014-08-26 13:10:25 -0700547
Sami Tolvanendd67a292014-12-09 16:40:34 +0000548 if free_string:
549 out.append("".join(free_string))
caozhiyuan21b37d82015-10-21 15:14:03 +0800550 stashed_blocks -= free_size
Sami Tolvanendd67a292014-12-09 16:40:34 +0000551
Tao Bao575d68a2015-08-07 19:49:45 -0700552 if self.version >= 2 and common.OPTIONS.cache_size is not None:
Tao Bao8dcf7382015-05-21 14:09:49 -0700553 # Sanity check: abort if we're going to need more stash space than
554 # the allowed size (cache_size * threshold). There are two purposes
555 # of having a threshold here. a) Part of the cache may have been
556 # occupied by some recovery logs. b) It will buy us some time to deal
557 # with the oversize issue.
558 cache_size = common.OPTIONS.cache_size
559 stash_threshold = common.OPTIONS.stash_threshold
560 max_allowed = cache_size * stash_threshold
561 assert max_stashed_blocks * self.tgt.blocksize < max_allowed, \
562 'Stash size %d (%d * %d) exceeds the limit %d (%d * %.2f)' % (
563 max_stashed_blocks * self.tgt.blocksize, max_stashed_blocks,
564 self.tgt.blocksize, max_allowed, cache_size,
565 stash_threshold)
Doug Zongkerfc44a512014-08-26 13:10:25 -0700566
Tao Baod522bdc2016-04-12 15:53:16 -0700567 if self.version >= 3:
568 self.touched_src_sha1 = self.HashBlocks(
569 self.src, self.touched_src_ranges)
570
Tao Baoe9b61912015-07-09 17:37:49 -0700571 # Zero out extended blocks as a workaround for bug 20881595.
572 if self.tgt.extended:
Tianjie Xu37e29302016-06-23 16:10:35 -0700573 assert (WriteSplitTransfers(out, "zero", self.tgt.extended) ==
Tianjie Xubb848c52016-06-21 15:54:09 -0700574 self.tgt.extended.size())
Tao Baob32d56e2015-09-09 11:55:01 -0700575 total += self.tgt.extended.size()
Tao Baoe9b61912015-07-09 17:37:49 -0700576
577 # We erase all the blocks on the partition that a) don't contain useful
Tao Bao66f1fa62016-05-03 10:02:01 -0700578 # data in the new image; b) will not be touched by dm-verity. Out of those
579 # blocks, we erase the ones that won't be used in this update at the
580 # beginning of an update. The rest would be erased at the end. This is to
581 # work around the eMMC issue observed on some devices, which may otherwise
582 # get starving for clean blocks and thus fail the update. (b/28347095)
Doug Zongkerfc44a512014-08-26 13:10:25 -0700583 all_tgt = RangeSet(data=(0, self.tgt.total_blocks))
Tao Baoe9b61912015-07-09 17:37:49 -0700584 all_tgt_minus_extended = all_tgt.subtract(self.tgt.extended)
585 new_dontcare = all_tgt_minus_extended.subtract(self.tgt.care_map)
Tao Bao66f1fa62016-05-03 10:02:01 -0700586
587 erase_first = new_dontcare.subtract(self.touched_src_ranges)
588 if erase_first:
589 out.insert(0, "erase %s\n" % (erase_first.to_string_raw(),))
590
591 erase_last = new_dontcare.subtract(erase_first)
592 if erase_last:
593 out.append("erase %s\n" % (erase_last.to_string_raw(),))
Doug Zongkere985f6f2014-09-09 12:38:47 -0700594
595 out.insert(0, "%d\n" % (self.version,)) # format version number
Tao Baob32d56e2015-09-09 11:55:01 -0700596 out.insert(1, "%d\n" % (total,))
Doug Zongkere985f6f2014-09-09 12:38:47 -0700597 if self.version >= 2:
598 # version 2 only: after the total block count, we give the number
599 # of stash slots needed, and the maximum size needed (in blocks)
600 out.insert(2, str(next_stash_id) + "\n")
601 out.insert(3, str(max_stashed_blocks) + "\n")
Doug Zongkerfc44a512014-08-26 13:10:25 -0700602
603 with open(prefix + ".transfer.list", "wb") as f:
604 for i in out:
605 f.write(i)
606
Doug Zongker62338182014-09-08 08:29:55 -0700607 if self.version >= 2:
Tao Baob4cfca52016-02-04 14:26:02 -0800608 self._max_stashed_size = max_stashed_blocks * self.tgt.blocksize
Tao Bao575d68a2015-08-07 19:49:45 -0700609 OPTIONS = common.OPTIONS
610 if OPTIONS.cache_size is not None:
611 max_allowed = OPTIONS.cache_size * OPTIONS.stash_threshold
612 print("max stashed blocks: %d (%d bytes), "
613 "limit: %d bytes (%.2f%%)\n" % (
Tao Baob4cfca52016-02-04 14:26:02 -0800614 max_stashed_blocks, self._max_stashed_size, max_allowed,
615 self._max_stashed_size * 100.0 / max_allowed))
Tao Bao575d68a2015-08-07 19:49:45 -0700616 else:
617 print("max stashed blocks: %d (%d bytes), limit: <unknown>\n" % (
Tao Baob4cfca52016-02-04 14:26:02 -0800618 max_stashed_blocks, self._max_stashed_size))
Doug Zongker62338182014-09-08 08:29:55 -0700619
Tao Bao82c47982015-08-17 09:45:13 -0700620 def ReviseStashSize(self):
621 print("Revising stash size...")
Tao Baoe27acfd2016-12-16 11:13:55 -0800622 stash_map = {}
Tao Bao82c47982015-08-17 09:45:13 -0700623
624 # Create the map between a stash and its def/use points. For example, for a
625 # given stash of (idx, sr), stashes[idx] = (sr, def_cmd, use_cmd).
626 for xf in self.transfers:
627 # Command xf defines (stores) all the stashes in stash_before.
628 for idx, sr in xf.stash_before:
Tao Baoe27acfd2016-12-16 11:13:55 -0800629 stash_map[idx] = (sr, xf)
Tao Bao82c47982015-08-17 09:45:13 -0700630
631 # Record all the stashes command xf uses.
632 for idx, _ in xf.use_stash:
Tao Baoe27acfd2016-12-16 11:13:55 -0800633 stash_map[idx] += (xf,)
Tao Bao82c47982015-08-17 09:45:13 -0700634
635 # Compute the maximum blocks available for stash based on /cache size and
636 # the threshold.
637 cache_size = common.OPTIONS.cache_size
638 stash_threshold = common.OPTIONS.stash_threshold
639 max_allowed = cache_size * stash_threshold / self.tgt.blocksize
640
Tao Baoe27acfd2016-12-16 11:13:55 -0800641 stashes = {}
Tao Bao82c47982015-08-17 09:45:13 -0700642 stashed_blocks = 0
Tao Bao9a5caf22015-08-25 15:10:10 -0700643 new_blocks = 0
Tao Bao82c47982015-08-17 09:45:13 -0700644
Tao Baoe27acfd2016-12-16 11:13:55 -0800645 free_stash_ids = []
646 next_stash_id = 0
647
Tao Bao82c47982015-08-17 09:45:13 -0700648 # Now go through all the commands. Compute the required stash size on the
649 # fly. If a command requires excess stash than available, it deletes the
650 # stash by replacing the command that uses the stash with a "new" command
651 # instead.
652 for xf in self.transfers:
653 replaced_cmds = []
654
655 # xf.stash_before generates explicit stash commands.
656 for idx, sr in xf.stash_before:
Tao Baoe27acfd2016-12-16 11:13:55 -0800657 assert idx not in stashes
658 if free_stash_ids:
659 sid = heapq.heappop(free_stash_ids)
660 else:
661 sid = next_stash_id
662 next_stash_id += 1
663 stashes[idx] = sid
664
665 # Check the post-command stashed_blocks.
666 stashed_blocks_after = stashed_blocks
667 if self.version == 2:
668 stashed_blocks_after += sr.size()
669 else:
670 sh = self.HashBlocks(self.src, sr)
671 if sh in stashes:
672 stashes[sh] += 1
673 else:
674 stashes[sh] = 1
675 stashed_blocks_after += sr.size()
676
677 if stashed_blocks_after > max_allowed:
Tao Bao82c47982015-08-17 09:45:13 -0700678 # We cannot stash this one for a later command. Find out the command
679 # that will use this stash and replace the command with "new".
Tao Baoe27acfd2016-12-16 11:13:55 -0800680 use_cmd = stash_map[idx][2]
Tao Bao82c47982015-08-17 09:45:13 -0700681 replaced_cmds.append(use_cmd)
Tao Bao9a5caf22015-08-25 15:10:10 -0700682 print("%10d %9s %s" % (sr.size(), "explicit", use_cmd))
Tao Bao82c47982015-08-17 09:45:13 -0700683 else:
Tao Baoe27acfd2016-12-16 11:13:55 -0800684 stashed_blocks = stashed_blocks_after
Tao Bao82c47982015-08-17 09:45:13 -0700685
686 # "move" and "diff" may introduce implicit stashes in BBOTA v3. Prior to
687 # ComputePatches(), they both have the style of "diff".
688 if xf.style == "diff" and self.version >= 3:
689 assert xf.tgt_ranges and xf.src_ranges
690 if xf.src_ranges.overlaps(xf.tgt_ranges):
691 if stashed_blocks + xf.src_ranges.size() > max_allowed:
692 replaced_cmds.append(xf)
Tao Bao9a5caf22015-08-25 15:10:10 -0700693 print("%10d %9s %s" % (xf.src_ranges.size(), "implicit", xf))
Tao Bao82c47982015-08-17 09:45:13 -0700694
695 # Replace the commands in replaced_cmds with "new"s.
696 for cmd in replaced_cmds:
697 # It no longer uses any commands in "use_stash". Remove the def points
698 # for all those stashes.
699 for idx, sr in cmd.use_stash:
Tao Baoe27acfd2016-12-16 11:13:55 -0800700 def_cmd = stash_map[idx][1]
Tao Bao82c47982015-08-17 09:45:13 -0700701 assert (idx, sr) in def_cmd.stash_before
702 def_cmd.stash_before.remove((idx, sr))
703
Tianjie Xuebe39a02016-01-14 14:12:26 -0800704 # Add up blocks that violates space limit and print total number to
705 # screen later.
706 new_blocks += cmd.tgt_ranges.size()
Tao Bao82c47982015-08-17 09:45:13 -0700707 cmd.ConvertToNew()
708
Tao Baoe27acfd2016-12-16 11:13:55 -0800709 # xf.use_stash generates free commands.
710 for idx, sr in xf.use_stash:
711 sid = stashes.pop(idx)
712 if self.version == 2:
713 stashed_blocks -= sr.size()
714 else:
715 sh = self.HashBlocks(self.src, sr)
716 assert sh in stashes
717 stashes[sh] -= 1
718 if stashes[sh] == 0:
719 stashed_blocks -= sr.size()
720 stashes.pop(sh)
721 heapq.heappush(free_stash_ids, sid)
722
Tianjie Xuebe39a02016-01-14 14:12:26 -0800723 num_of_bytes = new_blocks * self.tgt.blocksize
724 print(" Total %d blocks (%d bytes) are packed as new blocks due to "
725 "insufficient cache size." % (new_blocks, num_of_bytes))
Tao Bao304ee272016-12-19 11:01:38 -0800726 return new_blocks
Tao Bao9a5caf22015-08-25 15:10:10 -0700727
Doug Zongkerfc44a512014-08-26 13:10:25 -0700728 def ComputePatches(self, prefix):
729 print("Reticulating splines...")
730 diff_q = []
731 patch_num = 0
732 with open(prefix + ".new.dat", "wb") as new_f:
733 for xf in self.transfers:
734 if xf.style == "zero":
Tao Bao08c85832016-09-19 22:26:30 -0700735 tgt_size = xf.tgt_ranges.size() * self.tgt.blocksize
736 print("%10d %10d (%6.2f%%) %7s %s %s" % (
737 tgt_size, tgt_size, 100.0, xf.style, xf.tgt_name,
738 str(xf.tgt_ranges)))
739
Doug Zongkerfc44a512014-08-26 13:10:25 -0700740 elif xf.style == "new":
741 for piece in self.tgt.ReadRangeSet(xf.tgt_ranges):
742 new_f.write(piece)
Tao Bao08c85832016-09-19 22:26:30 -0700743 tgt_size = xf.tgt_ranges.size() * self.tgt.blocksize
744 print("%10d %10d (%6.2f%%) %7s %s %s" % (
745 tgt_size, tgt_size, 100.0, xf.style,
746 xf.tgt_name, str(xf.tgt_ranges)))
747
Doug Zongkerfc44a512014-08-26 13:10:25 -0700748 elif xf.style == "diff":
749 src = self.src.ReadRangeSet(xf.src_ranges)
750 tgt = self.tgt.ReadRangeSet(xf.tgt_ranges)
751
752 # We can't compare src and tgt directly because they may have
753 # the same content but be broken up into blocks differently, eg:
754 #
755 # ["he", "llo"] vs ["h", "ello"]
756 #
757 # We want those to compare equal, ideally without having to
758 # actually concatenate the strings (these may be tens of
759 # megabytes).
760
761 src_sha1 = sha1()
762 for p in src:
763 src_sha1.update(p)
764 tgt_sha1 = sha1()
765 tgt_size = 0
766 for p in tgt:
767 tgt_sha1.update(p)
768 tgt_size += len(p)
769
770 if src_sha1.digest() == tgt_sha1.digest():
771 # These are identical; we don't need to generate a patch,
772 # just issue copy commands on the device.
773 xf.style = "move"
Tao Bao08c85832016-09-19 22:26:30 -0700774 if xf.src_ranges != xf.tgt_ranges:
775 print("%10d %10d (%6.2f%%) %7s %s %s (from %s)" % (
776 tgt_size, tgt_size, 100.0, xf.style,
777 xf.tgt_name if xf.tgt_name == xf.src_name else (
778 xf.tgt_name + " (from " + xf.src_name + ")"),
779 str(xf.tgt_ranges), str(xf.src_ranges)))
Doug Zongkerfc44a512014-08-26 13:10:25 -0700780 else:
781 # For files in zip format (eg, APKs, JARs, etc.) we would
782 # like to use imgdiff -z if possible (because it usually
783 # produces significantly smaller patches than bsdiff).
784 # This is permissible if:
785 #
Tao Bao293fd132016-06-11 12:19:23 -0700786 # - imgdiff is not disabled, and
Doug Zongkerfc44a512014-08-26 13:10:25 -0700787 # - the source and target files are monotonic (ie, the
788 # data is stored with blocks in increasing order), and
789 # - we haven't removed any blocks from the source set.
790 #
791 # If these conditions are satisfied then appending all the
792 # blocks in the set together in order will produce a valid
793 # zip file (plus possibly extra zeros in the last block),
794 # which is what imgdiff needs to operate. (imgdiff is
795 # fine with extra zeros at the end of the file.)
Tao Bao293fd132016-06-11 12:19:23 -0700796 imgdiff = (not self.disable_imgdiff and xf.intact and
Doug Zongkerfc44a512014-08-26 13:10:25 -0700797 xf.tgt_name.split(".")[-1].lower()
798 in ("apk", "jar", "zip"))
799 xf.style = "imgdiff" if imgdiff else "bsdiff"
800 diff_q.append((tgt_size, src, tgt, xf, patch_num))
801 patch_num += 1
802
803 else:
804 assert False, "unknown style " + xf.style
805
806 if diff_q:
807 if self.threads > 1:
808 print("Computing patches (using %d threads)..." % (self.threads,))
809 else:
810 print("Computing patches...")
811 diff_q.sort()
812
813 patches = [None] * patch_num
814
Dan Albert8b72aef2015-03-23 19:13:21 -0700815 # TODO: Rewrite with multiprocessing.ThreadPool?
Doug Zongkerfc44a512014-08-26 13:10:25 -0700816 lock = threading.Lock()
817 def diff_worker():
818 while True:
819 with lock:
Dan Albert8b72aef2015-03-23 19:13:21 -0700820 if not diff_q:
821 return
Doug Zongkerfc44a512014-08-26 13:10:25 -0700822 tgt_size, src, tgt, xf, patchnum = diff_q.pop()
823 patch = compute_patch(src, tgt, imgdiff=(xf.style == "imgdiff"))
824 size = len(patch)
825 with lock:
826 patches[patchnum] = (patch, xf)
Tao Bao08c85832016-09-19 22:26:30 -0700827 print("%10d %10d (%6.2f%%) %7s %s %s %s" % (
Doug Zongkerfc44a512014-08-26 13:10:25 -0700828 size, tgt_size, size * 100.0 / tgt_size, xf.style,
829 xf.tgt_name if xf.tgt_name == xf.src_name else (
Tao Bao08c85832016-09-19 22:26:30 -0700830 xf.tgt_name + " (from " + xf.src_name + ")"),
831 str(xf.tgt_ranges), str(xf.src_ranges)))
Doug Zongkerfc44a512014-08-26 13:10:25 -0700832
833 threads = [threading.Thread(target=diff_worker)
Dan Albert8b72aef2015-03-23 19:13:21 -0700834 for _ in range(self.threads)]
Doug Zongkerfc44a512014-08-26 13:10:25 -0700835 for th in threads:
836 th.start()
837 while threads:
838 threads.pop().join()
839 else:
840 patches = []
841
842 p = 0
843 with open(prefix + ".patch.dat", "wb") as patch_f:
844 for patch, xf in patches:
845 xf.patch_start = p
846 xf.patch_len = len(patch)
847 patch_f.write(patch)
848 p += len(patch)
849
850 def AssertSequenceGood(self):
851 # Simulate the sequences of transfers we will output, and check that:
852 # - we never read a block after writing it, and
853 # - we write every block we care about exactly once.
854
855 # Start with no blocks having been touched yet.
Doug Zongker6ab2a502016-02-09 08:28:09 -0800856 touched = array.array("B", "\0" * self.tgt.total_blocks)
Doug Zongkerfc44a512014-08-26 13:10:25 -0700857
858 # Imagine processing the transfers in order.
859 for xf in self.transfers:
860 # Check that the input blocks for this transfer haven't yet been touched.
Doug Zongker62338182014-09-08 08:29:55 -0700861
862 x = xf.src_ranges
863 if self.version >= 2:
864 for _, sr in xf.use_stash:
865 x = x.subtract(sr)
866
Doug Zongker6ab2a502016-02-09 08:28:09 -0800867 for s, e in x:
Tao Baoff75c232016-03-04 15:23:34 -0800868 # Source image could be larger. Don't check the blocks that are in the
869 # source image only. Since they are not in 'touched', and won't ever
870 # be touched.
871 for i in range(s, min(e, self.tgt.total_blocks)):
Doug Zongker6ab2a502016-02-09 08:28:09 -0800872 assert touched[i] == 0
873
874 # Check that the output blocks for this transfer haven't yet
875 # been touched, and touch all the blocks written by this
876 # transfer.
877 for s, e in xf.tgt_ranges:
878 for i in range(s, e):
879 assert touched[i] == 0
880 touched[i] = 1
Doug Zongkerfc44a512014-08-26 13:10:25 -0700881
882 # Check that we've written every target block.
Doug Zongker6ab2a502016-02-09 08:28:09 -0800883 for s, e in self.tgt.care_map:
884 for i in range(s, e):
885 assert touched[i] == 1
Doug Zongkerfc44a512014-08-26 13:10:25 -0700886
Doug Zongker62338182014-09-08 08:29:55 -0700887 def ImproveVertexSequence(self):
888 print("Improving vertex order...")
889
890 # At this point our digraph is acyclic; we reversed any edges that
891 # were backwards in the heuristically-generated sequence. The
892 # previously-generated order is still acceptable, but we hope to
893 # find a better order that needs less memory for stashed data.
894 # Now we do a topological sort to generate a new vertex order,
895 # using a greedy algorithm to choose which vertex goes next
896 # whenever we have a choice.
897
898 # Make a copy of the edge set; this copy will get destroyed by the
899 # algorithm.
900 for xf in self.transfers:
901 xf.incoming = xf.goes_after.copy()
902 xf.outgoing = xf.goes_before.copy()
903
904 L = [] # the new vertex order
905
906 # S is the set of sources in the remaining graph; we always choose
907 # the one that leaves the least amount of stashed data after it's
908 # executed.
909 S = [(u.NetStashChange(), u.order, u) for u in self.transfers
910 if not u.incoming]
911 heapq.heapify(S)
912
913 while S:
914 _, _, xf = heapq.heappop(S)
915 L.append(xf)
916 for u in xf.outgoing:
917 del u.incoming[xf]
918 if not u.incoming:
919 heapq.heappush(S, (u.NetStashChange(), u.order, u))
920
921 # if this fails then our graph had a cycle.
922 assert len(L) == len(self.transfers)
923
924 self.transfers = L
925 for i, xf in enumerate(L):
926 xf.order = i
927
Doug Zongkerfc44a512014-08-26 13:10:25 -0700928 def RemoveBackwardEdges(self):
929 print("Removing backward edges...")
930 in_order = 0
931 out_of_order = 0
932 lost_source = 0
933
934 for xf in self.transfers:
Doug Zongkerfc44a512014-08-26 13:10:25 -0700935 lost = 0
936 size = xf.src_ranges.size()
937 for u in xf.goes_before:
938 # xf should go before u
939 if xf.order < u.order:
940 # it does, hurray!
Doug Zongker62338182014-09-08 08:29:55 -0700941 in_order += 1
Doug Zongkerfc44a512014-08-26 13:10:25 -0700942 else:
943 # it doesn't, boo. trim the blocks that u writes from xf's
944 # source, so that xf can go after u.
Doug Zongker62338182014-09-08 08:29:55 -0700945 out_of_order += 1
Doug Zongkerfc44a512014-08-26 13:10:25 -0700946 assert xf.src_ranges.overlaps(u.tgt_ranges)
947 xf.src_ranges = xf.src_ranges.subtract(u.tgt_ranges)
948 xf.intact = False
949
950 if xf.style == "diff" and not xf.src_ranges:
951 # nothing left to diff from; treat as new data
952 xf.style = "new"
953
954 lost = size - xf.src_ranges.size()
955 lost_source += lost
Doug Zongkerfc44a512014-08-26 13:10:25 -0700956
957 print((" %d/%d dependencies (%.2f%%) were violated; "
958 "%d source blocks removed.") %
959 (out_of_order, in_order + out_of_order,
960 (out_of_order * 100.0 / (in_order + out_of_order))
961 if (in_order + out_of_order) else 0.0,
962 lost_source))
963
Doug Zongker62338182014-09-08 08:29:55 -0700964 def ReverseBackwardEdges(self):
965 print("Reversing backward edges...")
966 in_order = 0
967 out_of_order = 0
968 stashes = 0
969 stash_size = 0
970
971 for xf in self.transfers:
Doug Zongker62338182014-09-08 08:29:55 -0700972 for u in xf.goes_before.copy():
973 # xf should go before u
974 if xf.order < u.order:
975 # it does, hurray!
976 in_order += 1
977 else:
978 # it doesn't, boo. modify u to stash the blocks that it
979 # writes that xf wants to read, and then require u to go
980 # before xf.
981 out_of_order += 1
982
983 overlap = xf.src_ranges.intersect(u.tgt_ranges)
984 assert overlap
985
986 u.stash_before.append((stashes, overlap))
987 xf.use_stash.append((stashes, overlap))
988 stashes += 1
989 stash_size += overlap.size()
990
991 # reverse the edge direction; now xf must go after u
992 del xf.goes_before[u]
993 del u.goes_after[xf]
994 xf.goes_after[u] = None # value doesn't matter
995 u.goes_before[xf] = None
996
997 print((" %d/%d dependencies (%.2f%%) were violated; "
998 "%d source blocks stashed.") %
999 (out_of_order, in_order + out_of_order,
1000 (out_of_order * 100.0 / (in_order + out_of_order))
1001 if (in_order + out_of_order) else 0.0,
1002 stash_size))
1003
Doug Zongkerfc44a512014-08-26 13:10:25 -07001004 def FindVertexSequence(self):
1005 print("Finding vertex sequence...")
1006
1007 # This is based on "A Fast & Effective Heuristic for the Feedback
1008 # Arc Set Problem" by P. Eades, X. Lin, and W.F. Smyth. Think of
1009 # it as starting with the digraph G and moving all the vertices to
1010 # be on a horizontal line in some order, trying to minimize the
1011 # number of edges that end up pointing to the left. Left-pointing
1012 # edges will get removed to turn the digraph into a DAG. In this
1013 # case each edge has a weight which is the number of source blocks
1014 # we'll lose if that edge is removed; we try to minimize the total
1015 # weight rather than just the number of edges.
1016
1017 # Make a copy of the edge set; this copy will get destroyed by the
1018 # algorithm.
1019 for xf in self.transfers:
1020 xf.incoming = xf.goes_after.copy()
1021 xf.outgoing = xf.goes_before.copy()
Doug Zongker6ab2a502016-02-09 08:28:09 -08001022 xf.score = sum(xf.outgoing.values()) - sum(xf.incoming.values())
Doug Zongkerfc44a512014-08-26 13:10:25 -07001023
1024 # We use an OrderedDict instead of just a set so that the output
1025 # is repeatable; otherwise it would depend on the hash values of
1026 # the transfer objects.
1027 G = OrderedDict()
1028 for xf in self.transfers:
1029 G[xf] = None
1030 s1 = deque() # the left side of the sequence, built from left to right
1031 s2 = deque() # the right side of the sequence, built from right to left
1032
Doug Zongker6ab2a502016-02-09 08:28:09 -08001033 heap = []
1034 for xf in self.transfers:
1035 xf.heap_item = HeapItem(xf)
1036 heap.append(xf.heap_item)
1037 heapq.heapify(heap)
Doug Zongkerfc44a512014-08-26 13:10:25 -07001038
Tao Bao33482282016-10-24 16:49:08 -07001039 # Use OrderedDict() instead of set() to preserve the insertion order. Need
1040 # to use 'sinks[key] = None' to add key into the set. sinks will look like
1041 # { key1: None, key2: None, ... }.
1042 sinks = OrderedDict.fromkeys(u for u in G if not u.outgoing)
1043 sources = OrderedDict.fromkeys(u for u in G if not u.incoming)
Doug Zongker6ab2a502016-02-09 08:28:09 -08001044
1045 def adjust_score(iu, delta):
1046 iu.score += delta
1047 iu.heap_item.clear()
1048 iu.heap_item = HeapItem(iu)
1049 heapq.heappush(heap, iu.heap_item)
1050
1051 while G:
Doug Zongkerfc44a512014-08-26 13:10:25 -07001052 # Put all sinks at the end of the sequence.
Doug Zongker6ab2a502016-02-09 08:28:09 -08001053 while sinks:
Tao Bao33482282016-10-24 16:49:08 -07001054 new_sinks = OrderedDict()
Doug Zongkerfc44a512014-08-26 13:10:25 -07001055 for u in sinks:
Doug Zongker6ab2a502016-02-09 08:28:09 -08001056 if u not in G: continue
Doug Zongkerfc44a512014-08-26 13:10:25 -07001057 s2.appendleft(u)
1058 del G[u]
1059 for iu in u.incoming:
Doug Zongker6ab2a502016-02-09 08:28:09 -08001060 adjust_score(iu, -iu.outgoing.pop(u))
Tao Bao33482282016-10-24 16:49:08 -07001061 if not iu.outgoing:
1062 new_sinks[iu] = None
Doug Zongker6ab2a502016-02-09 08:28:09 -08001063 sinks = new_sinks
Doug Zongkerfc44a512014-08-26 13:10:25 -07001064
1065 # Put all the sources at the beginning of the sequence.
Doug Zongker6ab2a502016-02-09 08:28:09 -08001066 while sources:
Tao Bao33482282016-10-24 16:49:08 -07001067 new_sources = OrderedDict()
Doug Zongkerfc44a512014-08-26 13:10:25 -07001068 for u in sources:
Doug Zongker6ab2a502016-02-09 08:28:09 -08001069 if u not in G: continue
Doug Zongkerfc44a512014-08-26 13:10:25 -07001070 s1.append(u)
1071 del G[u]
1072 for iu in u.outgoing:
Doug Zongker6ab2a502016-02-09 08:28:09 -08001073 adjust_score(iu, +iu.incoming.pop(u))
Tao Bao33482282016-10-24 16:49:08 -07001074 if not iu.incoming:
1075 new_sources[iu] = None
Doug Zongker6ab2a502016-02-09 08:28:09 -08001076 sources = new_sources
Doug Zongkerfc44a512014-08-26 13:10:25 -07001077
Doug Zongker6ab2a502016-02-09 08:28:09 -08001078 if not G: break
Doug Zongkerfc44a512014-08-26 13:10:25 -07001079
1080 # Find the "best" vertex to put next. "Best" is the one that
1081 # maximizes the net difference in source blocks saved we get by
1082 # pretending it's a source rather than a sink.
1083
Doug Zongker6ab2a502016-02-09 08:28:09 -08001084 while True:
1085 u = heapq.heappop(heap)
1086 if u and u.item in G:
1087 u = u.item
1088 break
Doug Zongkerfc44a512014-08-26 13:10:25 -07001089
Doug Zongkerfc44a512014-08-26 13:10:25 -07001090 s1.append(u)
1091 del G[u]
1092 for iu in u.outgoing:
Doug Zongker6ab2a502016-02-09 08:28:09 -08001093 adjust_score(iu, +iu.incoming.pop(u))
Tao Bao33482282016-10-24 16:49:08 -07001094 if not iu.incoming:
1095 sources[iu] = None
Doug Zongker6ab2a502016-02-09 08:28:09 -08001096
Doug Zongkerfc44a512014-08-26 13:10:25 -07001097 for iu in u.incoming:
Doug Zongker6ab2a502016-02-09 08:28:09 -08001098 adjust_score(iu, -iu.outgoing.pop(u))
Tao Bao33482282016-10-24 16:49:08 -07001099 if not iu.outgoing:
1100 sinks[iu] = None
Doug Zongkerfc44a512014-08-26 13:10:25 -07001101
1102 # Now record the sequence in the 'order' field of each transfer,
1103 # and by rearranging self.transfers to be in the chosen sequence.
1104
1105 new_transfers = []
1106 for x in itertools.chain(s1, s2):
1107 x.order = len(new_transfers)
1108 new_transfers.append(x)
1109 del x.incoming
1110 del x.outgoing
1111
1112 self.transfers = new_transfers
1113
1114 def GenerateDigraph(self):
1115 print("Generating digraph...")
Doug Zongker6ab2a502016-02-09 08:28:09 -08001116
1117 # Each item of source_ranges will be:
1118 # - None, if that block is not used as a source,
Tao Bao33482282016-10-24 16:49:08 -07001119 # - an ordered set of transfers.
Doug Zongker6ab2a502016-02-09 08:28:09 -08001120 source_ranges = []
1121 for b in self.transfers:
1122 for s, e in b.src_ranges:
1123 if e > len(source_ranges):
1124 source_ranges.extend([None] * (e-len(source_ranges)))
1125 for i in range(s, e):
1126 if source_ranges[i] is None:
Tao Bao33482282016-10-24 16:49:08 -07001127 source_ranges[i] = OrderedDict.fromkeys([b])
Doug Zongker6ab2a502016-02-09 08:28:09 -08001128 else:
Tao Bao33482282016-10-24 16:49:08 -07001129 source_ranges[i][b] = None
Doug Zongker6ab2a502016-02-09 08:28:09 -08001130
Doug Zongkerfc44a512014-08-26 13:10:25 -07001131 for a in self.transfers:
Tao Bao33482282016-10-24 16:49:08 -07001132 intersections = OrderedDict()
Doug Zongker6ab2a502016-02-09 08:28:09 -08001133 for s, e in a.tgt_ranges:
1134 for i in range(s, e):
1135 if i >= len(source_ranges): break
Tao Bao33482282016-10-24 16:49:08 -07001136 # Add all the Transfers in source_ranges[i] to the (ordered) set.
1137 if source_ranges[i] is not None:
1138 for j in source_ranges[i]:
1139 intersections[j] = None
Doug Zongker6ab2a502016-02-09 08:28:09 -08001140
1141 for b in intersections:
1142 if a is b: continue
Doug Zongkerfc44a512014-08-26 13:10:25 -07001143
1144 # If the blocks written by A are read by B, then B needs to go before A.
1145 i = a.tgt_ranges.intersect(b.src_ranges)
1146 if i:
Doug Zongkerab7ca1d2014-08-26 10:40:28 -07001147 if b.src_name == "__ZERO":
1148 # the cost of removing source blocks for the __ZERO domain
1149 # is (nearly) zero.
1150 size = 0
1151 else:
1152 size = i.size()
Doug Zongkerfc44a512014-08-26 13:10:25 -07001153 b.goes_before[a] = size
1154 a.goes_after[b] = size
1155
  def FindTransfers(self):
    """Parse the file_map to generate all the transfers.

    For each target file, picks a source to diff against by trying, in
    order: the special __ZERO/__COPY domains, an exact pathname match, an
    exact basename match, and a "number pattern" basename match (digit
    runs replaced by '#', via the indexes built by
    AbbreviateSourceNames()).  Files with no match become "new"
    transfers.  Large files are split into multiple Transfer()s so their
    source blocks fit in the stash.
    """

    def AddSplitTransfers(tgt_name, src_name, tgt_ranges, src_ranges,
                          style, by_id):
      """Add one or multiple Transfer()s by splitting large files.

      For BBOTA v3, we need to stash source blocks for resumable feature.
      However, with the growth of file size and the shrink of the cache
      partition source blocks are too large to be stashed. If a file occupies
      too many blocks, we split it into smaller pieces by getting multiple
      Transfer()s.

      The downside is that after splitting, we may increase the package size
      since the split pieces don't align well. According to our experiments,
      1/8 of the cache size as the per-piece limit appears to be optimal.
      Compared to the fixed 1024-block limit, it reduces the overall package
      size by 30% for volantis, and 20% for angler and bullhead."""

      # Possibly split large files into smaller chunks.
      pieces = 0
      cache_size = common.OPTIONS.cache_size
      split_threshold = 0.125
      # Per-piece limit: 1/8 of the cache, in blocks.
      max_blocks_per_transfer = int(cache_size * split_threshold /
                                    self.tgt.blocksize)

      # Change nothing for small files.
      if (tgt_ranges.size() <= max_blocks_per_transfer and
          src_ranges.size() <= max_blocks_per_transfer):
        Transfer(tgt_name, src_name, tgt_ranges, src_ranges, style, by_id)
        return

      # Peel off max-sized pieces from the front of both range sets until
      # either side fits; split names get a "-<piece index>" suffix.
      while (tgt_ranges.size() > max_blocks_per_transfer and
             src_ranges.size() > max_blocks_per_transfer):
        tgt_split_name = "%s-%d" % (tgt_name, pieces)
        src_split_name = "%s-%d" % (src_name, pieces)
        tgt_first = tgt_ranges.first(max_blocks_per_transfer)
        src_first = src_ranges.first(max_blocks_per_transfer)

        Transfer(tgt_split_name, src_split_name, tgt_first, src_first, style,
                 by_id)

        tgt_ranges = tgt_ranges.subtract(tgt_first)
        src_ranges = src_ranges.subtract(src_first)
        pieces += 1

      # Handle remaining blocks.
      if tgt_ranges.size() or src_ranges.size():
        # Must be both non-empty.
        assert tgt_ranges.size() and src_ranges.size()
        tgt_split_name = "%s-%d" % (tgt_name, pieces)
        src_split_name = "%s-%d" % (src_name, pieces)
        Transfer(tgt_split_name, src_split_name, tgt_ranges, src_ranges, style,
                 by_id)

    def AddTransfer(tgt_name, src_name, tgt_ranges, src_ranges, style, by_id,
                    split=False):
      """Wrapper function for adding a Transfer()."""

      # We specialize diff transfers only (which covers bsdiff/imgdiff/move);
      # otherwise add the Transfer() as is.
      if style != "diff" or not split:
        Transfer(tgt_name, src_name, tgt_ranges, src_ranges, style, by_id)
        return

      # Handle .odex files specially to analyze the block-wise difference. If
      # most of the blocks are identical with only few changes (e.g. header),
      # we will patch the changed blocks only. This avoids stashing unchanged
      # blocks while patching. We limit the analysis to files without size
      # changes only. This is to avoid sacrificing the OTA generation cost too
      # much.
      if (tgt_name.split(".")[-1].lower() == 'odex' and
          tgt_ranges.size() == src_ranges.size()):

        # 0.5 threshold can be further tuned. The tradeoff is: if only very
        # few blocks remain identical, we lose the opportunity to use imgdiff
        # that may have better compression ratio than bsdiff.
        crop_threshold = 0.5

        tgt_skipped = RangeSet()
        src_skipped = RangeSet()
        tgt_size = tgt_ranges.size()
        tgt_changed = 0
        # Compare block by block; next_item() presumably yields individual
        # blocks/ranges in order — confirm against rangelib.
        for src_block, tgt_block in zip(src_ranges.next_item(),
                                        tgt_ranges.next_item()):
          src_rs = RangeSet(str(src_block))
          tgt_rs = RangeSet(str(tgt_block))
          if self.src.ReadRangeSet(src_rs) == self.tgt.ReadRangeSet(tgt_rs):
            tgt_skipped = tgt_skipped.union(tgt_rs)
            src_skipped = src_skipped.union(src_rs)
          else:
            tgt_changed += tgt_rs.size()

          # Terminate early if no clear sign of benefits.
          if tgt_changed > tgt_size * crop_threshold:
            break

        if tgt_changed < tgt_size * crop_threshold:
          assert tgt_changed + tgt_skipped.size() == tgt_size
          print('%10d %10d (%6.2f%%) %s' % (tgt_skipped.size(), tgt_size,
                tgt_skipped.size() * 100.0 / tgt_size, tgt_name))
          # Emit the identical blocks as their own (split) transfers...
          AddSplitTransfers(
              "%s-skipped" % (tgt_name,),
              "%s-skipped" % (src_name,),
              tgt_skipped, src_skipped, style, by_id)

          # Intentionally change the file extension to avoid being imgdiff'd as
          # the files are no longer in their original format.
          tgt_name = "%s-cropped" % (tgt_name,)
          src_name = "%s-cropped" % (src_name,)
          # ...and fall through to diff only the changed remainder.
          tgt_ranges = tgt_ranges.subtract(tgt_skipped)
          src_ranges = src_ranges.subtract(src_skipped)

          # Possibly having no changed blocks.
          if not tgt_ranges:
            return

      # Add the transfer(s).
      AddSplitTransfers(
          tgt_name, src_name, tgt_ranges, src_ranges, style, by_id)

    print("Finding transfers...")

    empty = RangeSet()
    for tgt_fn, tgt_ranges in self.tgt.file_map.items():
      if tgt_fn == "__ZERO":
        # the special "__ZERO" domain is all the blocks not contained
        # in any file and that are filled with zeros.  We have a
        # special transfer style for zero blocks.
        src_ranges = self.src.file_map.get("__ZERO", empty)
        AddTransfer(tgt_fn, "__ZERO", tgt_ranges, src_ranges,
                    "zero", self.transfers)
        continue

      elif tgt_fn == "__COPY":
        # "__COPY" domain includes all the blocks not contained in any
        # file and that need to be copied unconditionally to the target.
        AddTransfer(tgt_fn, None, tgt_ranges, empty, "new", self.transfers)
        continue

      elif tgt_fn in self.src.file_map:
        # Look for an exact pathname match in the source.
        AddTransfer(tgt_fn, tgt_fn, tgt_ranges, self.src.file_map[tgt_fn],
                    "diff", self.transfers, self.version >= 3)
        continue

      b = os.path.basename(tgt_fn)
      if b in self.src_basenames:
        # Look for an exact basename match in the source.
        src_fn = self.src_basenames[b]
        AddTransfer(tgt_fn, src_fn, tgt_ranges, self.src.file_map[src_fn],
                    "diff", self.transfers, self.version >= 3)
        continue

      b = re.sub("[0-9]+", "#", b)
      if b in self.src_numpatterns:
        # Look for a 'number pattern' match (a basename match after
        # all runs of digits are replaced by "#").  (This is useful
        # for .so files that contain version numbers in the filename
        # that get bumped.)
        src_fn = self.src_numpatterns[b]
        AddTransfer(tgt_fn, src_fn, tgt_ranges, self.src.file_map[src_fn],
                    "diff", self.transfers, self.version >= 3)
        continue

      # No plausible source found; ship the file as new data.
      AddTransfer(tgt_fn, None, tgt_ranges, empty, "new", self.transfers)
Doug Zongkerfc44a512014-08-26 13:10:25 -07001322
1323 def AbbreviateSourceNames(self):
Doug Zongkerfc44a512014-08-26 13:10:25 -07001324 for k in self.src.file_map.keys():
1325 b = os.path.basename(k)
1326 self.src_basenames[b] = k
1327 b = re.sub("[0-9]+", "#", b)
1328 self.src_numpatterns[b] = k
1329
1330 @staticmethod
1331 def AssertPartition(total, seq):
1332 """Assert that all the RangeSets in 'seq' form a partition of the
1333 'total' RangeSet (ie, they are nonintersecting and their union
1334 equals 'total')."""
Doug Zongker6ab2a502016-02-09 08:28:09 -08001335
Doug Zongkerfc44a512014-08-26 13:10:25 -07001336 so_far = RangeSet()
1337 for i in seq:
1338 assert not so_far.overlaps(i)
1339 so_far = so_far.union(i)
1340 assert so_far == total