/brz/remove-bazaar : revision 4454.3.63

To get this branch, use:

bzr branch http://gegoxaren.bato24.eu/bzr/brz/remove-bazaar

« back to all changes in this revision

Viewing changes to bzrlib/_annotator_pyx.pyx

Committer: John Arbash Meinel
Date: 2009-07-06 19:16:19 UTC
mto: This revision was merged to the branch mainline in revision 4522.
Revision ID: john@arbash-meinel.com-20090706191619-lycpcdwo73j2g1cg

Copy the implementation over to the Pyrex version.

files modified:
bzrlib/_annotator_py.py

bzrlib/_annotator_pyx.pyx

Show diffs side-by-side

added added

removed removed

bzrlib/_annotator_pyx.pyx

# Running count of stream records processed; starts at 0, is bumped in
# __next__, and is passed to pb.update() as the current progress value.
cdef object counter

# Container indexed by key; _get_ann_text reads text_cache[key] to obtain
# the lines for a key taken from ann_keys.
cdef object text_cache

# Record stream; __next__ pulls one record at a time with stream.next().
cdef object stream

# List copy of the ann_keys argument; walked by position in _get_ann_text
# once the stream has run out.
cdef object ann_keys

# Passed to pb.update() as the total alongside counter.
cdef object stream_len

# Optional progress reporter; only used when it is not None.
cdef object pb

# Flag: 0 initially, set to 1 the first time stream.next() raises
# StopIteration, after which __next__ serves entries from ann_keys only.
cdef int stream_is_consumed

# Index of the next entry of ann_keys to hand out.
cdef int ann_key_pos

def __init__(self, stream, text_cache, stream_len, pb=None):

def __init__(self, stream, text_cache, stream_len, ann_keys, pb=None):

self.counter = 0

self.stream = stream

self.stream_len = stream_len

self.text_cache = text_cache

self.stream_len = stream_len

self.ann_keys = list(ann_keys)

self.pb = pb

self.stream_is_consumed = 0

self.ann_key_pos = 0

def __iter__(self):
    """Return self; this object is its own iterator."""
    return self

cdef _get_ann_text(self):
    """Hand out the next text listed in ann_keys.

    :return: (key, lines, num_lines) where lines is self.text_cache[key]
        and num_lines is len(lines).
    :raises StopIteration: when every entry of ann_keys has already been
        returned.
    """
    if self.ann_key_pos >= len(self.ann_keys):
        raise StopIteration
    key = self.ann_keys[self.ann_key_pos]
    # Advance before touching the cache, so the position has already moved
    # on even if the lookup below raises.
    self.ann_key_pos = self.ann_key_pos + 1
    lines = self.text_cache[key]
    num_lines = len(lines)
    return key, lines, num_lines

def __next__(self):

record = self.stream.next()

if self.stream_is_consumed:

return self._get_ann_text()

try:

record = self.stream.next()

100

except StopIteration:

101

self.stream_is_consumed = 1

102

return self._get_ann_text()

103

if self.pb is not None:

104

self.pb.update('extracting', self.counter, self.stream_len)

105

if record.storage_kind == 'absent':

106

raise errors.RevisionNotPresent(record.key, None)

107

self.counter = self.counter + 1

108

lines = osutils.chunks_to_lines(record.get_bytes_as('chunked'))

109

num_lines = len(lines)

222

245

self._heads_provider = None

223

246

self._ann_tuple_cache = {}

224

247

248

249

def _update_needed_children(self, key, parent_keys):
    """Count one more needed child for every parent in parent_keys.

    :param key: The child key whose parents are being recorded. It is not
        consulted by the counting itself.
    :param parent_keys: Iterable of parent keys. Each occurrence adds one
        to that parent's entry in self._num_needed_children, creating the
        entry at 1 when the parent has not been seen before.
    """
    needed = self._num_needed_children
    for parent_key in parent_keys:
        if parent_key in needed:
            needed[parent_key] += 1
        else:
            # First child recorded for this parent.
            needed[parent_key] = 1

255

225

256

def _get_needed_keys(self, key):

226

graph = _mod_graph.Graph(self._vf)

227

parent_map = {}

257

"""Determine the texts we need to get from the backing vf.

258

259

:return: (vf_keys_needed, ann_keys_needed)

260

vf_keys_needed These are keys that we need to get from the vf

261

ann_keys_needed Texts which we have in self._text_cache but we

262

don't have annotations for. We need to yield these

263

in the proper order so that we can get proper

264

annotations.

265

"""

266

parent_map = self._parent_map

228

267

# We need 1 extra copy of the node we will be looking at when we are

229

268

# done

230

269

self._num_needed_children[key] = 1

231

for key, parent_keys in graph.iter_ancestry([key]):

232

if parent_keys is None:

233

continue

234

parent_map[key] = parent_keys

235

for parent_key in parent_keys:

236

if parent_key in self._num_needed_children:

237

self._num_needed_children[parent_key] += 1

270

vf_keys_needed = set()

271

ann_keys_needed = set()

272

needed_keys = set([key])

273

while needed_keys:

274

parent_lookup = []

275

next_parent_map = {}

276

for key in needed_keys:

277

if key in self._parent_map:

278

# We don't need to lookup this key in the vf

279

if key not in self._text_cache:

280

# Extract this text from the vf

281

vf_keys_needed.add(key)

282

elif key not in self._annotations_cache:

283

# We do need to annotate

284

ann_keys_needed.add(key)

285

next_parent_map[key] = self._parent_map[key]

238

286

else:

239

self._num_needed_children[parent_key] = 1

240

self._parent_map.update(parent_map)

241

# _heads_provider does some graph caching, so it is only valid while

242

# self._parent_map hasn't changed

243

self._heads_provider = None

244

keys = parent_map.keys()

245

return keys

287

parent_lookup.append(key)

288

vf_keys_needed.add(key)

289

needed_keys = set()

290

next_parent_map.update(self._vf.get_parent_map(parent_lookup))

291

for key, parent_keys in next_parent_map.iteritems():

292

self._update_needed_children(key, parent_keys)

293

for key in parent_keys:

294

if key not in parent_map:

295

needed_keys.add(key)

296

parent_map.update(next_parent_map)

297

# _heads_provider does some graph caching, so it is only valid while

298

# self._parent_map hasn't changed

299

self._heads_provider = None

300

return vf_keys_needed, ann_keys_needed

246

301

247

302

def _get_needed_texts(self, key, pb=None):

248

303

"""Get the texts we need to properly annotate key.

253

308

matcher object we are using. Currently it is always 'lines' but

254

309

future improvements may change this to a simple text string.

255

310

"""

256

keys = self._get_needed_keys(key)

311

keys, ann_keys = self._get_needed_keys(key)

257

312

if pb is not None:

258

313

pb.update('getting stream', 0, len(keys))

259

314

stream = self._vf.get_record_stream(keys, 'topological', True)

260

iterator = _NeededTextIterator(stream, self._text_cache, len(keys), pb)

315

iterator = _NeededTextIterator(stream, self._text_cache, len(keys),

316

ann_keys, pb)

261

317

return iterator

262

318

263

319

def _get_parent_annotations_and_matches(self, key, text, parent_key):

364

420

365

421

def add_special_text(self, key, parent_keys, text):
    """Add a specific text to the graph.

    :param key: Key under which the text and its parents are registered.
    :param parent_keys: Stored as-is in self._parent_map[key].
    :param text: Passed to osutils.split_lines(); the result is stored in
        self._text_cache[key].
    """
    self._parent_map[key] = parent_keys
    self._text_cache[key] = osutils.split_lines(text)
    # _parent_map just changed, so any cached heads provider is dropped
    # here to be rebuilt later.
    self._heads_provider = None

367

426

368

427

def annotate(self, key):

369

428

"""Return annotated fulltext for the given key."""

Older »