Rev 4782: Revert the ugly stuff, and do it properly, one step at a time. in http://bazaar.launchpad.net/~jameinel/bzr/2.1-static-tuple-chk-map

John Arbash Meinel john at arbash-meinel.com
Fri Oct 23 16:37:07 BST 2009


At http://bazaar.launchpad.net/~jameinel/bzr/2.1-static-tuple-chk-map

------------------------------------------------------------
revno: 4782
revision-id: john at arbash-meinel.com-20091023153654-n8in6fpsc8p4665h
parent: john at arbash-meinel.com-20091023152444-pomqe6xmbyaowpom
committer: John Arbash Meinel <john at arbash-meinel.com>
branch nick: 2.1-static-tuple-chk-map
timestamp: Fri 2009-10-23 10:36:54 -0500
message:
  Revert the ugly stuff, and do it properly, one step at a time.
  
  In _filter_text_keys, we were extracting (file_id, revision_id) from the
  CHKMap value section. However, we were leaving them as regular strings in a
  regular tuple. Using StaticTuple(intern(file_id), intern(revision_id)).intern()
  results in a 40MB decrease in peak memory during 'stream test'.
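  
  For the curious, the pattern boils down to the following minimal sketch
  (_make_text_key is a hypothetical helper, assuming the file_id and
  revision_id have already been parsed out of the CHK value):
  
      from bzrlib.static_tuple import StaticTuple
  
      def _make_text_key(file_id, revision_id):
          # intern() each component string so duplicates share one str
          # object, then intern() the StaticTuple itself so duplicate
          # keys share a single tuple object as well.
          return StaticTuple(intern(file_id), intern(revision_id)).intern()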
-------------- next part --------------
=== modified file 'bzrlib/chk_map.py'
--- a/bzrlib/chk_map.py	2009-10-23 15:24:44 +0000
+++ b/bzrlib/chk_map.py	2009-10-23 15:36:54 +0000
@@ -1460,7 +1460,6 @@
         #       that just means that we will have *both* a StaticTuple and a
         #       tuple() in memory, referring to the same object. (so a net
         #       increase in memory, not a decrease.)
-        trace.debug_memory('starting a new CHKMapDifference')
         self._store = store
         self._new_root_keys = new_root_keys
         self._old_root_keys = old_root_keys
@@ -1490,7 +1489,6 @@
         # this code. (We may want to evaluate saving the raw bytes into the
         # page cache, which would allow a working tree update after the fetch
         # to not have to read the bytes again.)
-        as_st = StaticTuple.from_sequence
         stream = self._store.get_record_stream(keys, 'unordered', True)
         for record in stream:
             if self._pb is not None:
@@ -1503,15 +1501,23 @@
             if type(node) is InternalNode:
                 # Note we don't have to do node.refs() because we know that
                 # there are no children that have been pushed into this node
-                # TODO: We might want to intern these StaticTuple instances, we
-                #       need to check how much redundancy there is
-                prefix_refs = [as_st(item) for item in node._items.iteritems()]
+                # TODO: Turn these into StaticTuple, and possibly intern them.
+                #       The sha1 pointer (in this case the value) should
+                #       already be a StaticTuple, and properly interned. So
+                #       I'm not sure there is a big win on top of that.
+                prefix_refs = node._items.items()
                 items = []
             else:
                 prefix_refs = []
-                # TODO: We might want to intern these StaticTuple instances, we
-                #       need to check how much redundancy there is
-                items = [as_st(item) for item in node._items.iteritems()]
+                # TODO: Turn these into StaticTuple, and possibly intern them.
+                #       These are (ST(file_id), value) pairs, which in
+                #       reality should be pretty common, because of all the
+                #       leaf nodes that share most of their entries. Note,
+                #       though, that we didn't find a benefit to interning the
+                #       value, so there may not be an actual benefit to
+                #       interning this tuple. The file_key should already be
+                #       interned; if it isn't, we need to look into it.
+                items = node._items.items()
             yield record, node, prefix_refs, items
 
     def _read_old_roots(self):
@@ -1605,8 +1611,6 @@
         # First pass, flush all interesting items and convert to using direct refs
         all_old_chks = self._all_old_chks
         processed_new_refs = self._processed_new_refs
-        # We will be processing these in this pass
-        processed_new_refs.update(refs)
         all_old_items = self._all_old_items
         new_items = [item for item in self._new_item_queue
                            if item not in all_old_items]
@@ -1614,35 +1618,19 @@
         if new_items:
             yield None, new_items
         refs = refs.difference(all_old_chks)
-        trace.debug_memory('sent %d new_items' % (len(new_items),))
         while refs:
             next_refs = set()
             next_refs_update = next_refs.update
             # Inlining _read_nodes_from_store improves 'bzr branch bzr.dev'
             # from 1m54s to 1m51s. Consider it.
-            idx = 0
             for record, _, p_refs, items in self._read_nodes_from_store(refs):
-                idx += 1
-                if idx & 0x7fff == 0:
-                    import sys
-                    from meliae import scanner
-                    #scanner.dump_all_objects('memory_dump-%d.json' % (idx,))
-                    # Generally *everything* is reachable from _getframe
-                    count, size = scanner.get_recursive_size(sys._getframe())
-                    trace.debug_memory('read %d records %d objects %.1fMB'
-                                       % (idx, count, size/ 1024. / 1024))
                 items = [item for item in items
                          if item not in all_old_items]
                 yield record, items
                 next_refs_update([p_r[1] for p_r in p_refs])
-            trace.debug_memory('processed %d refs, shrinking %d'
-                               % (len(refs), len(next_refs)))
             next_refs = next_refs.difference(all_old_chks)
             next_refs = next_refs.difference(processed_new_refs)
             processed_new_refs.update(next_refs)
-            trace.debug_memory('processed %d refs (%d total), working on %d'
-                               % (len(refs), len(processed_new_refs),
-                                  len(next_refs)))
             refs = next_refs
 
     def _process_next_old(self):
@@ -1660,19 +1648,13 @@
     def _process_queues(self):
         while self._old_queue:
             self._process_next_old()
-            trace.debug_memory('processed next old')
-        trace.debug_memory('preparing to flush new queue %d'
-                           % (len(self._new_queue),))
         return self._flush_new_queue()
 
     def process(self):
         for record in self._read_all_roots():
             yield record, []
-        trace.debug_memory('after reading all roots (%d old to proc)'
-                           % (len(self._old_queue)))
         for record, items in self._process_queues():
             yield record, items
-        trace.debug_memory('processed queues')
 
 
 def iter_interesting_nodes(store, interesting_root_keys,

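(A sketch of the interning variant the TODOs above leave open -- whether
interning these tuples actually pays off is exactly the question those
comments raise. "node" is assumed to be a chk_map node with an _items
dict:)

    from bzrlib.static_tuple import StaticTuple

    def _interned_items(node):
        # Convert each (key, value) item to a StaticTuple and intern it,
        # so leaf nodes that share most of their entries also share the
        # tuple objects in memory.
        as_st = StaticTuple.from_sequence
        return [as_st(item).intern() for item in node._items.iteritems()]
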
=== modified file 'bzrlib/groupcompress.py'
--- a/bzrlib/groupcompress.py	2009-10-23 15:24:44 +0000
+++ b/bzrlib/groupcompress.py	2009-10-23 15:36:54 +0000
@@ -1832,9 +1832,6 @@
         self.has_graph = parents
         self._is_locked = is_locked
         self._inconsistency_fatal = inconsistency_fatal
-        # GroupCompress records tend to have the same 'group' start + offset
-        # repeated over and over, this creates a surplus of ints
-        self._int_cache = {}
         if track_external_parent_refs:
             self._key_dependencies = knit._KeyRefs(
                 track_new_keys=track_new_keys)
@@ -2016,17 +2013,13 @@
         """Convert an index value to position details."""
         bits = node[2].split(' ')
         # It would be nice not to read the entire gzip.
-        # Note, start and stop would be good objects to 'intern', they are
-        # likely to be duplicated many times in a given index
+        # TODO: Intern the start and stop integers. They are *very* common
+        #       across all records in the index. See revno 4781.
         start = int(bits[0])
-        start = self._int_cache.setdefault(start, start)
         stop = int(bits[1])
-        stop = self._int_cache.setdefault(stop, stop)
         basis_end = int(bits[2])
         delta_end = int(bits[3])
-        # We can't use StaticTuple here, because node[0] is a BTreeGraphIndex
-        # instance...
-        return (node[0], start, stop, basis_end, delta_end)
+        return node[0], start, stop, basis_end, delta_end
 
     def scan_unvalidated_index(self, graph_index):
         """Inform this _GCGraphIndex that there is an unvalidated index.

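(For reference, the int cache reverted above -- see revno 4781 -- was
essentially a plain dict used as an intern table. A minimal sketch, not
the exact bzrlib code:)

    _int_cache = {}

    def _intern_int(value, _cache=_int_cache):
        # dict.setdefault() hands back the object already stored under an
        # equal key, so repeated start/stop offsets collapse to a single
        # int object each.
        return _cache.setdefault(value, value)

    # Both calls return the very same int object:
    assert _intern_int(100000) is _intern_int(100000)
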
=== modified file 'bzrlib/repofmt/groupcompress_repo.py'
--- a/bzrlib/repofmt/groupcompress_repo.py	2009-10-23 15:24:44 +0000
+++ b/bzrlib/repofmt/groupcompress_repo.py	2009-10-23 15:36:54 +0000
@@ -598,7 +598,6 @@
         #   - and any present parent inventories have their chk root
         #     entries too.
         # And all this should be independent of any fallback repository.
-        trace.debug_memory('starting _check_new_inventories')
         problems = []
         key_deps = self.repo.revisions._index._key_dependencies
         new_revisions_keys = key_deps.get_new_keys()
@@ -640,7 +639,6 @@
                 % (sorted(missing_chk_roots),))
             # Don't bother checking any further.
             return problems
-        trace.debug_memory('after looking for missing_chk_roots')
         # Find all interesting chk_bytes records, and make sure they are
         # present, as well as the text keys they reference.
         chk_bytes_no_fallbacks = self.repo.chk_bytes.without_fallbacks()
@@ -671,7 +669,6 @@
         if missing_text_keys:
             problems.append("missing text keys: %r"
                 % (sorted(missing_text_keys),))
-        trace.debug_memory('after checking for missing text keys')
         return problems
 
     def _execute_pack_operations(self, pack_operations,
@@ -1111,14 +1108,10 @@
         for stream_info in self._fetch_revision_texts(revision_ids):
             yield stream_info
         self._revision_keys = [(rev_id,) for rev_id in revision_ids]
-        trace.debug_memory('Before clearing revisions cache')
         self.from_repository.revisions.clear_cache()
         self.from_repository.signatures.clear_cache()
-        trace.debug_memory('after clearing revisions cache')
         yield self._get_inventory_stream(self._revision_keys)
-        trace.debug_memory('before clearing inventories cache')
         self.from_repository.inventories.clear_cache()
-        trace.debug_memory('after clearing inventories cache')
         # TODO: The keys to exclude might be part of the search recipe
         # For now, exclude all parents that are at the edge of ancestry, for
         # which we have inventories
@@ -1126,15 +1119,10 @@
         parent_keys = from_repo._find_parent_keys_of_revisions(
                         self._revision_keys)
         for stream_info in self._get_filtered_chk_streams(parent_keys):
-            trace.debug_memory('during _get_filtered_chk_streams')
             yield stream_info
-        trace.debug_memory('before clearing chk_bytes')
         self.from_repository.chk_bytes.clear_cache()
-        trace.debug_memory('after clearing chk_bytes')
         yield self._get_text_stream()
-        trace.debug_memory('after text stream')
         self.from_repository.texts.clear_cache()
-        trace.debug_memory('after clearing text cache')
 
     def get_stream_for_missing_keys(self, missing_keys):
         # missing keys can only occur when we are byte copying and not


