Merge lp:~jelmer/brz/iter-changes-all-the-way into lp:brz

Proposed by Jelmer Vernooij
Status: Merged
Approved by: Jelmer Vernooij
Approved revision: no longer in the source branch.
Merge reported by: The Breezy Bot
Merged at revision: not available
Proposed branch: lp:~jelmer/brz/iter-changes-all-the-way
Merge into: lp:brz
Prerequisite: lp:~jelmer/brz/delete-will-record-deletes
Diff against target: 356 lines (+14/-247)
4 files modified
breezy/commit.py (+8/-247)
breezy/tests/per_workingtree/test_commit.py (+1/-0)
breezy/tests/test_merge.py (+2/-0)
doc/en/release-notes/brz-3.0.txt (+3/-0)
To merge this branch: bzr merge lp:~jelmer/brz/iter-changes-all-the-way
Reviewer Review Type Date Requested Status
Martin Packman Approve
Review via email: mp+325965@code.launchpad.net

Commit message

Stop calling CommitBuilder.record_entry_contents.

Description of the change

Stop calling CommitBuilder.record_entry_contents.

This was one of the two ways in which commits can be created, the other being CommitBuilder.record_iter_changes. record_entry_contents is O(tree), record_iter_changes is (with newer formats) O(changes).

This doesn't yet remove the implementation of record_entry_contents or its plethora of tests. I'm leaving that for the next branch.

Note that I had two mark as known failing two tree-reference related tests.

To post a comment you must log in.
Revision history for this message
Martin Packman (gz) wrote :

Looks good to me. There's a minor argument for using skipTest over knownFailure but it's not important.

review: Approve
Revision history for this message
The Breezy Bot (the-breezy-bot) wrote :

Preview Diff

[H/L] Next/Prev Comment, [J/K] Next/Prev File, [N/P] Next/Prev Hunk
1=== modified file 'breezy/commit.py'
2--- breezy/commit.py 2017-06-20 22:29:58 +0000
3+++ breezy/commit.py 2017-06-20 22:37:22 +0000
4@@ -344,9 +344,6 @@
5 self.work_tree.lock_write()
6 operation.add_cleanup(self.work_tree.unlock)
7 self.parents = self.work_tree.get_parent_ids()
8- # We can use record_iter_changes IFF no tree references are involved.
9- self.use_record_iter_changes = (
10- not self.branch.repository._format.supports_tree_reference)
11 self.pb = ui.ui_factory.nested_progress_bar()
12 operation.add_cleanup(self.pb.finished)
13 self.basis_revid = self.work_tree.last_revision()
14@@ -371,8 +368,6 @@
15 if self.config_stack is None:
16 self.config_stack = self.work_tree.get_config_stack()
17
18- self._set_specific_file_ids()
19-
20 # Setup the progress bar. As the number of files that need to be
21 # committed in unknown, progress is reported as stages.
22 # We keep track of entries separately though and include that
23@@ -390,7 +385,6 @@
24 self.pb.show_count = True
25 self.pb.show_bar = True
26
27- self._gather_parents()
28 # After a merge, a selected file commit is not supported.
29 # See 'bzr help merge' for an explanation as to why.
30 if len(self.parents) > 1 and self.specific_files is not None:
31@@ -654,44 +648,21 @@
32 old_revno, old_revid, new_revno, self.rev_id,
33 tree_delta, future_tree)
34
35- def _gather_parents(self):
36- """Record the parents of a merge for merge detection."""
37- # TODO: Make sure that this list doesn't contain duplicate
38- # entries and the order is preserved when doing this.
39- if self.use_record_iter_changes:
40- return
41- self.basis_inv = self.basis_tree.root_inventory
42- self.parent_invs = [self.basis_inv]
43- for revision in self.parents[1:]:
44- if self.branch.repository.has_revision(revision):
45- mutter('commit parent revision {%s}', revision)
46- inventory = self.branch.repository.get_inventory(revision)
47- self.parent_invs.append(inventory)
48- else:
49- mutter('commit parent ghost revision {%s}', revision)
50-
51 def _update_builder_with_changes(self):
52 """Update the commit builder with the data about what has changed.
53 """
54- exclude = self.exclude
55 specific_files = self.specific_files
56 mutter("Selecting files for commit with filter %r", specific_files)
57
58 self._check_strict()
59- if self.use_record_iter_changes:
60- iter_changes = self.work_tree.iter_changes(self.basis_tree,
61- specific_files=specific_files)
62- if self.exclude:
63- iter_changes = filter_excluded(iter_changes, self.exclude)
64- iter_changes = self._filter_iter_changes(iter_changes)
65- for file_id, path, fs_hash in self.builder.record_iter_changes(
66- self.work_tree, self.basis_revid, iter_changes):
67- self.work_tree._observed_sha1(file_id, path, fs_hash)
68- else:
69- # Build the new inventory
70- self._populate_from_inventory()
71- self._record_unselected()
72- self._report_and_accumulate_deletes()
73+ iter_changes = self.work_tree.iter_changes(self.basis_tree,
74+ specific_files=specific_files)
75+ if self.exclude:
76+ iter_changes = filter_excluded(iter_changes, self.exclude)
77+ iter_changes = self._filter_iter_changes(iter_changes)
78+ for file_id, path, fs_hash in self.builder.record_iter_changes(
79+ self.work_tree, self.basis_revid, iter_changes):
80+ self.work_tree._observed_sha1(file_id, path, fs_hash)
81
82 def _filter_iter_changes(self, iter_changes):
83 """Process iter_changes.
84@@ -745,55 +716,6 @@
85 # Unversion IDs that were found to be deleted
86 self.deleted_ids = deleted_ids
87
88- def _record_unselected(self):
89- # If specific files are selected, then all un-selected files must be
90- # recorded in their previous state. For more details, see
91- # https://lists.ubuntu.com/archives/bazaar/2007q3/028476.html.
92- if self.specific_files or self.exclude:
93- specific_files = self.specific_files or []
94- for path, old_ie in self.basis_inv.iter_entries():
95- if self.builder.new_inventory.has_id(old_ie.file_id):
96- # already added - skip.
97- continue
98- if (is_inside_any(specific_files, path)
99- and not is_inside_any(self.exclude, path)):
100- # was inside the selected path, and not excluded - if not
101- # present it has been deleted so skip.
102- continue
103- # From here down it was either not selected, or was excluded:
104- # We preserve the entry unaltered.
105- ie = old_ie.copy()
106- # Note: specific file commits after a merge are currently
107- # prohibited. This test is for sanity/safety in case it's
108- # required after that changes.
109- if len(self.parents) > 1:
110- ie.revision = None
111- self.builder.record_entry_contents(ie, self.parent_invs, path,
112- self.basis_tree, None)
113-
114- def _report_and_accumulate_deletes(self):
115- if (isinstance(self.basis_inv, Inventory)
116- and isinstance(self.builder.new_inventory, Inventory)):
117- # the older Inventory classes provide a _byid dict, and building a
118- # set from the keys of this dict is substantially faster than even
119- # getting a set of ids from the inventory
120- #
121- # <lifeless> set(dict) is roughly the same speed as
122- # set(iter(dict)) and both are significantly slower than
123- # set(dict.keys())
124- deleted_ids = set(self.basis_inv._byid.keys()) - \
125- set(self.builder.new_inventory._byid.keys())
126- else:
127- deleted_ids = set(self.basis_inv) - set(self.builder.new_inventory)
128- if deleted_ids:
129- self.any_entries_deleted = True
130- deleted = sorted([(self.basis_tree.id2path(file_id), file_id)
131- for file_id in deleted_ids])
132- # XXX: this is not quite directory-order sorting
133- for path, file_id in deleted:
134- self.builder.record_delete(path, file_id)
135- self.reporter.deleted(path)
136-
137 def _check_strict(self):
138 # XXX: when we use iter_changes this would likely be faster if
139 # iter_changes would check for us (even in the presence of
140@@ -803,107 +725,6 @@
141 for unknown in self.work_tree.unknowns():
142 raise StrictCommitFailed()
143
144- def _populate_from_inventory(self):
145- """Populate the CommitBuilder by walking the working tree inventory."""
146- # Build the revision inventory.
147- #
148- # This starts by creating a new empty inventory. Depending on
149- # which files are selected for commit, and what is present in the
150- # current tree, the new inventory is populated. inventory entries
151- # which are candidates for modification have their revision set to
152- # None; inventory entries that are carried over untouched have their
153- # revision set to their prior value.
154- #
155- # ESEPARATIONOFCONCERNS: this function is diffing and using the diff
156- # results to create a new inventory at the same time, which results
157- # in bugs like #46635. Any reason not to use/enhance Tree.changes_from?
158- # ADHB 11-07-2006
159-
160- specific_files = self.specific_files
161- exclude = self.exclude
162- report_changes = self.reporter.is_verbose()
163- deleted_ids = []
164- # A tree of paths that have been deleted. E.g. if foo/bar has been
165- # deleted, then we have {'foo':{'bar':{}}}
166- deleted_paths = {}
167- # XXX: Note that entries may have the wrong kind because the entry does
168- # not reflect the status on disk.
169- # NB: entries will include entries within the excluded ids/paths
170- # because iter_entries_by_dir has no 'exclude' facility today.
171- entries = self.work_tree.iter_entries_by_dir(
172- specific_file_ids=self.specific_file_ids, yield_parents=True)
173- for path, existing_ie in entries:
174- file_id = existing_ie.file_id
175- name = existing_ie.name
176- parent_id = existing_ie.parent_id
177- kind = existing_ie.kind
178- # Skip files that have been deleted from the working tree.
179- # The deleted path ids are also recorded so they can be explicitly
180- # unversioned later.
181- if deleted_paths:
182- path_segments = splitpath(path)
183- deleted_dict = deleted_paths
184- for segment in path_segments:
185- deleted_dict = deleted_dict.get(segment, None)
186- if not deleted_dict:
187- # We either took a path not present in the dict
188- # (deleted_dict was None), or we've reached an empty
189- # child dir in the dict, so are now a sub-path.
190- break
191- else:
192- deleted_dict = None
193- if deleted_dict is not None:
194- # the path has a deleted parent, do not add it.
195- continue
196- if exclude and is_inside_any(exclude, path):
197- # Skip excluded paths. Excluded paths are processed by
198- # _update_builder_with_changes.
199- continue
200- content_summary = self.work_tree.path_content_summary(path)
201- kind = content_summary[0]
202- # Note that when a filter of specific files is given, we must only
203- # skip/record deleted files matching that filter.
204- if not specific_files or is_inside_any(specific_files, path):
205- if kind == 'missing':
206- if not deleted_paths:
207- # path won't have been split yet.
208- path_segments = splitpath(path)
209- deleted_dict = deleted_paths
210- for segment in path_segments:
211- deleted_dict = deleted_dict.setdefault(segment, {})
212- self.reporter.missing(path)
213- self._next_progress_entry()
214- deleted_ids.append(file_id)
215- continue
216- # TODO: have the builder do the nested commit just-in-time IF and
217- # only if needed.
218- if kind == 'tree-reference':
219- # enforce repository nested tree policy.
220- if (not self.work_tree.supports_tree_reference() or
221- # repository does not support it either.
222- not self.branch.repository._format.supports_tree_reference):
223- kind = 'directory'
224- content_summary = (kind, None, None, None)
225- elif self.recursive == 'down':
226- nested_revision_id = self._commit_nested_tree(
227- file_id, path)
228- content_summary = (kind, None, None, nested_revision_id)
229- else:
230- nested_revision_id = self.work_tree.get_reference_revision(file_id)
231- content_summary = (kind, None, None, nested_revision_id)
232-
233- # Record an entry for this item
234- # Note: I don't particularly want to have the existing_ie
235- # parameter but the test suite currently (28-Jun-07) breaks
236- # without it thanks to a unicode normalisation issue. :-(
237- definitely_changed = kind != existing_ie.kind
238- self._record_entry(path, file_id, specific_files, kind, name,
239- parent_id, definitely_changed, existing_ie, report_changes,
240- content_summary)
241-
242- # Unversion IDs that were found to be deleted
243- self.deleted_ids = deleted_ids
244-
245 def _commit_nested_tree(self, file_id, path):
246 "Commit a nested tree."
247 sub_tree = self.work_tree.get_nested_tree(file_id, path)
248@@ -929,49 +750,6 @@
249 except errors.PointlessCommit:
250 return self.work_tree.get_reference_revision(file_id)
251
252- def _record_entry(self, path, file_id, specific_files, kind, name,
253- parent_id, definitely_changed, existing_ie, report_changes,
254- content_summary):
255- "Record the new inventory entry for a path if any."
256- # mutter('check %s {%s}', path, file_id)
257- # mutter('%s selected for commit', path)
258- if definitely_changed or existing_ie is None:
259- ie = make_entry(kind, name, parent_id, file_id)
260- else:
261- ie = existing_ie.copy()
262- ie.revision = None
263- # For carried over entries we don't care about the fs hash - the repo
264- # isn't generating a sha, so we're not saving computation time.
265- _, _, fs_hash = self.builder.record_entry_contents(
266- ie, self.parent_invs, path, self.work_tree, content_summary)
267- if report_changes:
268- self._report_change(ie, path)
269- if fs_hash:
270- self.work_tree._observed_sha1(ie.file_id, path, fs_hash)
271- return ie
272-
273- def _report_change(self, ie, path):
274- """Report a change to the user.
275-
276- The change that has occurred is described relative to the basis
277- inventory.
278- """
279- if (self.basis_inv.has_id(ie.file_id)):
280- basis_ie = self.basis_inv[ie.file_id]
281- else:
282- basis_ie = None
283- change = ie.describe_change(basis_ie, ie)
284- if change in (InventoryEntry.RENAMED,
285- InventoryEntry.MODIFIED_AND_RENAMED):
286- old_path = self.basis_inv.id2path(ie.file_id)
287- self.reporter.renamed(change, old_path, path)
288- self._next_progress_entry()
289- else:
290- if change == gettext('unchanged'):
291- return
292- self.reporter.snapshot_change(change, path)
293- self._next_progress_entry()
294-
295 def _set_progress_stage(self, name, counter=False):
296 """Set the progress stage and emit an update to the progress bar."""
297 self.pb_stage_name = name
298@@ -994,20 +772,3 @@
299 else:
300 text = gettext("%s - Stage") % (self.pb_stage_name, )
301 self.pb.update(text, self.pb_stage_count, self.pb_stage_total)
302-
303- def _set_specific_file_ids(self):
304- """populate self.specific_file_ids if we will use it."""
305- if not self.use_record_iter_changes:
306- # If provided, ensure the specified files are versioned
307- if self.specific_files is not None:
308- # Note: This routine is being called because it raises
309- # PathNotVersionedError as a side effect of finding the IDs. We
310- # later use the ids we found as input to the working tree
311- # inventory iterator, so we only consider those ids rather than
312- # examining the whole tree again.
313- # XXX: Dont we have filter_unversioned to do this more
314- # cheaply?
315- self.specific_file_ids = tree.find_ids_across_trees(
316- self.specific_files, [self.basis_tree, self.work_tree])
317- else:
318- self.specific_file_ids = None
319
320=== modified file 'breezy/tests/per_workingtree/test_commit.py'
321--- breezy/tests/per_workingtree/test_commit.py 2017-06-10 00:17:06 +0000
322+++ breezy/tests/per_workingtree/test_commit.py 2017-06-20 22:37:22 +0000
323@@ -420,6 +420,7 @@
324 if not tree.supports_tree_reference():
325 # inapplicable test.
326 return
327+ self.knownFailure('nested trees don\'t work well with iter_changes')
328 subtree = self.make_branch_and_tree('subtree')
329 tree.add(['subtree'])
330 self.build_tree(['subtree/file'])
331
332=== modified file 'breezy/tests/test_merge.py'
333--- breezy/tests/test_merge.py 2017-06-10 16:40:42 +0000
334+++ breezy/tests/test_merge.py 2017-06-20 22:37:22 +0000
335@@ -226,6 +226,8 @@
336 tree_a.conflicts())
337
338 def test_nested_merge(self):
339+ self.knownFailure(
340+ 'iter_changes doesn\'t work with changes in nested trees')
341 tree = self.make_branch_and_tree('tree',
342 format='development-subtree')
343 sub_tree = self.make_branch_and_tree('tree/sub-tree',
344
345=== modified file 'doc/en/release-notes/brz-3.0.txt'
346--- doc/en/release-notes/brz-3.0.txt 2017-06-19 14:35:58 +0000
347+++ doc/en/release-notes/brz-3.0.txt 2017-06-20 22:37:22 +0000
348@@ -121,6 +121,9 @@
349 * All previously deprecated functionality has been removed.
350 (Jelmer Vernooij)
351
352+ * ``CommitBuilder.record_entry_contents`` has been removed.
353+ (Jelmer Vernooij, #731433, #604953)
354+
355 * Renamed ``breezy.delta.report_delta`` parameter ``filter=`` to
356 ``predicate=``. (Martin Packman)
357

Subscribers

People subscribed via source and target branches