Blame - tools/releasetools/sparse_img.py - SHIFTPHONES/android_build

2014-08-26 13:10:25 -0700

[diff] [blame]

20

import bisect

Tao Bao

32fcdab

2018-10-12 10:30:39 -0700

[diff] [blame]

21

import logging

Doug Zongker

2014-08-26 13:10:25 -0700

[diff] [blame]

22

import os

Doug Zongker

2014-08-26 13:10:25 -0700

[diff] [blame]

23

import struct

Tianjie Xu

2018-01-27 17:35:41 -0800

[diff] [blame]

24

import threading

Doug Zongker

2014-08-26 13:10:25 -0700

[diff] [blame]

25

from hashlib import sha1

26

Dan Albert

2015-03-23 19:13:21 -0700

[diff] [blame]

27

import rangelib

28

Tao Bao

32fcdab

2018-10-12 10:30:39 -0700

[diff] [blame]

29

logger = logging.getLogger(__name__)

30

Doug Zongker

2014-08-26 13:10:25 -0700

[diff] [blame]

31

32

class SparseImage(object):

Tao Bao

2015-05-12 11:42:31 -0700

[diff] [blame]

33

"""Wraps a sparse image file into an image object.

Doug Zongker

2014-08-26 13:10:25 -0700

[diff] [blame]

34

Tao Bao

2015-05-12 11:42:31 -0700

[diff] [blame]

35

Wraps a sparse image file (and optional file map and clobbered_blocks) into

36

an image object suitable for passing to BlockImageDiff. file_map contains

37

the mapping between files and their blocks. clobbered_blocks contains the set

38

of blocks that should be always written to the target regardless of the old

39

contents (i.e. copying instead of patching). clobbered_blocks should be in

40

the form of a string like "0" or "0 1-5 8".

41

"""

42

Sami Tolvanen

2016-02-09 12:28:58 -0800

[diff] [blame]

43

def __init__(self, simg_fn, file_map_fn=None, clobbered_blocks=None,
             mode="rb", build_map=True, allow_shared_blocks=False,
             hashtree_info_generator=None):
  """Opens a sparse image file and, unless disabled, indexes its chunks.

  Args:
    simg_fn: Path of the sparse image file.
    file_map_fn: Optional path of a block map file. When given it is loaded
        through LoadFileBlockMap(); otherwise file_map gets a single
        "__DATA" entry that covers care_map.
    clobbered_blocks: Passed as data to rangelib.RangeSet to build
        self.clobbered_blocks.
    mode: Mode used to open simg_fn.
    build_map: When False, only the file header is read and validated; the
        offset map, care map and file map are not built.
    allow_shared_blocks: Forwarded to LoadFileBlockMap().
    hashtree_info_generator: Optional object; when set, don't-care chunks
        are recorded as zero-filled care data and the result of its
        Generate(self) call is stored in self.hashtree_info.

  Raises:
    ValueError: If the header or a chunk fails validation, or a chunk type
        is unsupported.
    AssertionError: If hashtree_info_generator is given with
        build_map=False.
  """
  self.simg_f = f = open(simg_fn, mode)
  try:
    # File header: magic, major/minor version, file/chunk header sizes,
    # block size, total blocks, total chunks and one trailing 32-bit field
    # that is not used here.
    header_bin = f.read(28)
    header = struct.unpack("<I4H4I", header_bin)

    magic = header[0]
    major_version = header[1]
    minor_version = header[2]
    file_hdr_sz = header[3]
    chunk_hdr_sz = header[4]
    self.blocksize = blk_sz = header[5]
    self.total_blocks = total_blks = header[6]
    self.total_chunks = total_chunks = header[7]

    if magic != 0xED26FF3A:
      raise ValueError("Magic should be 0xED26FF3A but is 0x%08X" % (magic,))
    if major_version != 1 or minor_version != 0:
      raise ValueError("I know about version 1.0, but this is version %u.%u" %
                       (major_version, minor_version))
    if file_hdr_sz != 28:
      raise ValueError("File header size was expected to be 28, but is %u." %
                       (file_hdr_sz,))
    if chunk_hdr_sz != 12:
      raise ValueError("Chunk header size was expected to be 12, but is %u." %
                       (chunk_hdr_sz,))

    logger.info(
        "Total of %u %u-byte output blocks in %u input chunks.", total_blks,
        blk_sz, total_chunks)

    if not build_map:
      assert not hashtree_info_generator, \
          "Cannot generate the hashtree info without building the offset map."
      return

    pos = 0   # in blocks
    care_data = []
    # Each entry is (start block, block count, file offset of raw data or
    # None, 4-byte fill pattern or None).
    self.offset_map = offset_map = []
    self.clobbered_blocks = rangelib.RangeSet(data=clobbered_blocks)

    for _ in range(total_chunks):
      # Chunk header: type, one unused 16-bit field, output size in blocks,
      # and total input size in bytes including this 12-byte header.
      header_bin = f.read(12)
      header = struct.unpack("<2H2I", header_bin)
      chunk_type = header[0]
      chunk_sz = header[2]
      total_sz = header[3]
      data_sz = total_sz - 12

      if chunk_type == 0xCAC1:
        # Raw chunk: remember where its data lives and skip over it.
        if data_sz != (chunk_sz * blk_sz):
          raise ValueError(
              "Raw chunk input size (%u) does not match output size (%u)" %
              (data_sz, chunk_sz * blk_sz))
        care_data.append(pos)
        care_data.append(pos + chunk_sz)
        offset_map.append((pos, chunk_sz, f.tell(), None))
        pos += chunk_sz
        f.seek(data_sz, os.SEEK_CUR)

      elif chunk_type == 0xCAC2:
        # Fill chunk: exactly four payload bytes are consumed below, so any
        # other payload size would desynchronize the chunk parsing.
        if data_sz != 4:
          raise ValueError("Fill chunk input size should be 4, but is %u" %
                           (data_sz,))
        fill_data = f.read(4)
        care_data.append(pos)
        care_data.append(pos + chunk_sz)
        offset_map.append((pos, chunk_sz, None, fill_data))
        pos += chunk_sz

      elif chunk_type == 0xCAC3:
        if data_sz != 0:
          raise ValueError("Don't care chunk input size is non-zero (%u)" %
                           (data_sz,))
        # Fills the don't care data ranges with zeros.
        # TODO(xunchang) pass the care_map to hashtree info generator.
        if hashtree_info_generator:
          # Must be bytes, like the fill patterns read from the file, so
          # that the data produced for these ranges can be hashed and
          # written on Python 3 as well as Python 2.
          fill_data = b'\x00' * 4
          # In order to compute verity hashtree on device, we need to write
          # zeros explicitly to the don't care ranges. Because these ranges
          # may contain non-zero data from the previous build.
          care_data.append(pos)
          care_data.append(pos + chunk_sz)
          offset_map.append((pos, chunk_sz, None, fill_data))

        pos += chunk_sz

      elif chunk_type == 0xCAC4:
        raise ValueError("CRC32 chunks are not supported")

      else:
        raise ValueError("Unknown chunk type 0x%04X not supported" %
                         (chunk_type,))

    self.generator_lock = threading.Lock()

    self.care_map = rangelib.RangeSet(care_data)
    # Start block of every chunk, used for bisect lookups into offset_map.
    self.offset_index = [i[0] for i in offset_map]

    # Bug: 20881595
    # Introduce extended blocks as a workaround for the bug. dm-verity may
    # touch blocks that are not in the care_map due to block device
    # read-ahead. It will fail if such blocks contain non-zeroes. We zero out
    # the extended blocks explicitly to avoid dm-verity failures. 512 blocks
    # are the maximum read-ahead we configure for dm-verity block devices.
    extended = self.care_map.extend(512)
    all_blocks = rangelib.RangeSet(data=(0, self.total_blocks))
    extended = extended.intersect(all_blocks).subtract(self.care_map)
    self.extended = extended

    self.hashtree_info = None
    if hashtree_info_generator:
      self.hashtree_info = hashtree_info_generator.Generate(self)

    if file_map_fn:
      self.LoadFileBlockMap(file_map_fn, self.clobbered_blocks,
                            allow_shared_blocks)
    else:
      self.file_map = {"__DATA": self.care_map}
  except Exception:
    # The half-built object never reaches the caller, so nobody else could
    # close the image file; release it before propagating the error.
    f.close()
    raise

162

Sami Tolvanen

2016-02-09 12:28:58 -0800

[diff] [blame]

163

def AppendFillChunk(self, data, blocks):
  """Appends a fill chunk to the image file and updates the header counts.

  Args:
    data: Integer packed as the chunk's 32-bit fill value.
    blocks: Number of output blocks covered by the new chunk.
  """
  image = self.simg_f

  # The new chunk goes at the very end of the file: a 12-byte chunk header
  # (type 0xCAC2, total size 16) followed by the 4-byte fill value.
  image.seek(0, os.SEEK_END)
  chunk = struct.pack("<2H3I", 0xCAC2, 0, blocks, 16, data)
  image.write(chunk)

  # Account for the new chunk, then rewrite the two 32-bit counters stored
  # at byte offset 16 of the file header.
  self.total_blocks = self.total_blocks + blocks
  self.total_chunks = self.total_chunks + 1

  image.seek(16, os.SEEK_SET)
  counters = struct.pack("<2I", self.total_blocks, self.total_chunks)
  image.write(counters)

176

Tao Bao

183e56e

2017-03-05 17:05:09 -0800

[diff] [blame]

177

def RangeSha1(self, ranges):
  """Returns the hex SHA-1 digest of the image data covered by 'ranges'."""
  digest = sha1()
  pieces = self._GetRangeData(ranges)
  for piece in pieces:
    digest.update(piece)
  return digest.hexdigest()

Doug Zongker

2014-08-26 13:10:25 -0700

[diff] [blame]

183

def ReadRangeSet(self, ranges):
  """Returns a list of the data pieces that make up 'ranges'."""
  return list(self._GetRangeData(ranges))

185

Tao Bao

5fcaaef

2015-06-01 13:40:49 -0700

[diff] [blame]

186

def TotalSha1(self, include_clobbered_blocks=False):
  """Returns the SHA-1 hash of all data in the 'care' regions.

  The clobbered_blocks are left out of the hash unless
  include_clobbered_blocks is True.
  """
  care = self.care_map
  if include_clobbered_blocks:
    return self.RangeSha1(care)
  return self.RangeSha1(care.subtract(self.clobbered_blocks))

195

196

def WriteRangeDataToFd(self, ranges, fd):
  """Writes the image data covered by 'ranges' to fd, piece by piece."""
  for piece in self._GetRangeData(ranges):
    fd.write(piece)

Doug Zongker

2014-08-26 13:10:25 -0700

[diff] [blame]

199

200

def _GetRangeData(self, ranges):
  """Generator that yields the image data covered by 'ranges'.

  The data comes back in an arbitrary number of pieces; in particular the
  number of pieces need not equal the number of ranges in 'ranges'.

  The generator body runs under self.generator_lock so that two instances
  of this generator do not run on the same object simultaneously.
  """
  image = self.simg_f

  def fetch(chunk, skip, count):
    # Returns 'count' blocks of 'chunk', starting 'skip' blocks into it.
    _, _, file_offset, fill = chunk
    if file_offset is None:
      # Fill chunk: repeat the 4-byte pattern to cover the blocks.
      return fill * (count * (self.blocksize >> 2))
    image.seek(file_offset + (skip * self.blocksize), os.SEEK_SET)
    return image.read(count * self.blocksize)

  with self.generator_lock:
    for start, end in ranges:
      pending = end - start

      # Locate the chunk holding the first block; the range may begin
      # partway through that chunk.
      index = bisect.bisect_right(self.offset_index, start) - 1
      chunk = self.offset_map[index]
      skip = start - chunk[0]
      count = min(chunk[1] - skip, pending)
      yield fetch(chunk, skip, count)
      pending -= count

      # Keep going through the following chunks while the range spans them.
      while pending > 0:
        index += 1
        chunk = self.offset_map[index]
        count = min(chunk[1], pending)
        yield fetch(chunk, 0, count)
        pending -= count

238

Tao Bao

2018-02-07 12:40:00 -0800

[diff] [blame]

239

def LoadFileBlockMap(self, fn, clobbered_blocks, allow_shared_blocks):
  """Loads the given block map file.

  Populates self.file_map with one RangeSet per line of the block map file.
  The care_map blocks that belong to no file, to clobbered_blocks, or to the
  hashtree range are then split into "__ZERO" and "__NONZERO-<n>" entries.
  "__COPY" and "__HASHTREE" entries are added when clobbered_blocks and
  self.hashtree_info are set, respectively.

  Args:
    fn: The filename of the block map file.
    clobbered_blocks: A RangeSet instance for the clobbered blocks.
    allow_shared_blocks: Whether having shared blocks is allowed.

  Raises:
    AssertionError: If a file claims blocks outside the remaining care
        blocks, overlaps clobbered_blocks, or nothing ends up in the map.
  """
  remaining = self.care_map
  self.file_map = out = {}

  with open(fn) as map_file:
    for line in map_file:
      file_name, ranges_text = line.split(None, 1)
      ranges = rangelib.RangeSet.parse(ranges_text)

      if allow_shared_blocks:
        # Find the shared blocks that have been claimed by others. If so, tag
        # the entry so that we can skip applying imgdiff on this file.
        shared_blocks = ranges.subtract(remaining)
        if shared_blocks:
          non_shared = ranges.subtract(shared_blocks)
          if not non_shared:
            continue

          # There shouldn't be anything in the extra dict yet.
          assert not ranges.extra, "Non-empty RangeSet.extra"

          # Put the non-shared RangeSet as the value in the block map, which
          # has a copy of the original RangeSet.
          non_shared.extra['uses_shared_blocks'] = ranges
          ranges = non_shared

      out[file_name] = ranges
      assert ranges.size() == ranges.intersect(remaining).size()

      # Currently we assume that blocks in clobbered_blocks are not part of
      # any file.
      assert not clobbered_blocks.overlaps(ranges)
      remaining = remaining.subtract(ranges)

  remaining = remaining.subtract(clobbered_blocks)
  if self.hashtree_info:
    remaining = remaining.subtract(self.hashtree_info.hashtree_range)

  # For all the remaining blocks in the care_map (ie, those that
  # aren't part of the data for any file nor part of the clobbered_blocks),
  # divide them into blocks that are all zero and blocks that aren't.
  # (Zero blocks are handled specially because (1) there are usually
  # a lot of them and (2) bsdiff handles files with long sequences of
  # repeated bytes especially poorly.)

  zero_blocks = []
  nonzero_blocks = []
  # Must be bytes: it is compared against data read from the image file and
  # against the fill patterns read from it. A text string would never
  # compare equal to those on Python 3, so no block would count as zero.
  reference = b'\0' * self.blocksize

  # Workaround for bug 23227672. For squashfs, we don't have a system.map. So
  # the whole system image will be treated as a single file. But for some
  # unknown bug, the updater will be killed due to OOM when writing back the
  # patched image to flash (observed on lenok-userdebug MEA49). Prior to
  # getting a real fix, we evenly divide the non-zero blocks into smaller
  # groups.
  # Bug: 23227672
  # NOTE: nonzero_blocks holds two entries (start, end) per block, so the
  # length check below closes a group after MAX_BLOCKS_PER_GROUP / 2 blocks.
  MAX_BLOCKS_PER_GROUP = 1024
  nonzero_groups = []

  f = self.simg_f
  for s, e in remaining:
    for b in range(s, e):
      idx = bisect.bisect_right(self.offset_index, b) - 1
      chunk_start, _, filepos, fill_data = self.offset_map[idx]
      if filepos is not None:
        filepos += (b - chunk_start) * self.blocksize
        f.seek(filepos, os.SEEK_SET)
        data = f.read(self.blocksize)
      elif fill_data == reference[:4]:   # fill with all zeros
        data = reference
      else:
        data = None

      if data == reference:
        zero_blocks.append(b)
        zero_blocks.append(b + 1)
      else:
        nonzero_blocks.append(b)
        nonzero_blocks.append(b + 1)

        if len(nonzero_blocks) >= MAX_BLOCKS_PER_GROUP:
          nonzero_groups.append(nonzero_blocks)
          # Start a new group.
          nonzero_blocks = []

  if nonzero_blocks:
    nonzero_groups.append(nonzero_blocks)

  assert zero_blocks or nonzero_groups or clobbered_blocks

  if zero_blocks:
    out["__ZERO"] = rangelib.RangeSet(data=zero_blocks)
  for i, blocks in enumerate(nonzero_groups):
    out["__NONZERO-%d" % i] = rangelib.RangeSet(data=blocks)
  if clobbered_blocks:
    out["__COPY"] = clobbered_blocks
  if self.hashtree_info:
    out["__HASHTREE"] = self.hashtree_info.hashtree_range

Doug Zongker