Rev 2503: Refactor, so that the inner _fields_to_entries function is the in http://bzr.arbash-meinel.com/branches/bzr/0.17-dev/dirstate_pyrex
John Arbash Meinel
john at arbash-meinel.com
Fri May 4 22:04:53 BST 2007
At http://bzr.arbash-meinel.com/branches/bzr/0.17-dev/dirstate_pyrex
------------------------------------------------------------
revno: 2503
revision-id: john at arbash-meinel.com-20070504210438-cvtzgzh4xbad7kww
parent: john at arbash-meinel.com-20070504200015-yli1te8jfhk3xpjc
committer: John Arbash Meinel <john at arbash-meinel.com>
branch nick: dirstate_pyrex
timestamp: Fri 2007-05-04 16:04:38 -0500
message:
Refactor, so that the inner _fields_to_entries function is the
doing the path comparison, and it will re-use the dirname object,
rather than copying a new string each time.
This should have equivalent performance, but have a rather large
memory savings, because we don't maintain N copies of the dirname
for N files in that directory.
It (theoretically) will speed up some comparisons, too,
because the string hash, etc, will be properly cached.
modified:
bzrlib/compiled/dirstate_helpers.pyx dirstate_helpers.pyx-20070503201057-u425eni465q4idwn-3
-------------- next part --------------
=== modified file 'bzrlib/compiled/dirstate_helpers.pyx'
--- a/bzrlib/compiled/dirstate_helpers.pyx 2007-05-04 20:00:15 +0000
+++ b/bzrlib/compiled/dirstate_helpers.pyx 2007-05-04 21:04:38 +0000
@@ -58,6 +58,7 @@
int PyString_CheckExact(object p)
void Py_INCREF(object)
+ void Py_INCREF_PyObject "Py_INCREF" (PyObject *)
void Py_DECREF(object)
@@ -192,17 +193,31 @@
cdef object _fields_to_entry_0_parents(PyListObject *fields, int offset,
- void **dirname, char **dirname_str):
+ void **p_current_dirname,
+ int *new_block):
cdef object path_name_file_id_key
cdef char *size_str
cdef unsigned long int size
cdef char* executable_str
cdef int is_executable
cdef PyObject **base
+ cdef void* dirname
+ cdef char* dirname_str
+
+ # Is this too abusive?
base = fields.ob_item + offset
- dirname[0] = base[0]
- dirname_str[0] = PyString_AS_STRING_void(base[0])
- path_name_file_id_key = (<object>(base[0]),
+
+ dirname = base[0]
+ dirname_str = PyString_AS_STRING_void(dirname)
+
+ if strcmp(dirname_str,
+ PyString_AS_STRING_void(p_current_dirname[0])) != 0:
+ Py_INCREF_PyObject(<PyObject *>dirname)
+ p_current_dirname[0] = dirname
+ new_block[0] = 1
+ else:
+ new_block[0] = 0
+ path_name_file_id_key = (<object>p_current_dirname[0],
<object>(base[1]),
<object>(base[2]),
)
@@ -229,27 +244,28 @@
int field_count):
cdef object current_block
cdef object entry
- cdef void* dirname
- cdef char* dirname_str
- cdef char* current_dirname_str
+ cdef void * current_dirname
+ cdef int new_block
if not PyList_CheckExact(fields):
raise TypeError('fields must be a list')
state._dirblocks = [('', []), ('', [])]
current_block = state._dirblocks[0][1]
- current_dirname_str = ''
+ obj = ''
+ current_dirname= <void*>obj
+ new_block = 0
while pos < field_count:
entry = _fields_to_entry_0_parents(<PyListObject *>fields, pos,
- &dirname, &dirname_str)
+ ¤t_dirname,
+ &new_block)
pos = pos + entry_size
- if (strcmp(dirname_str, current_dirname_str) != 0):
+ if new_block:
# new block - different dirname
current_block = []
- current_dirname_str = dirname_str
PyList_Append(state._dirblocks,
- (<object>dirname, current_block))
+ (<object>current_dirname, current_block))
PyList_Append(current_block, entry)
state._split_root_dirblock_into_contents()
More information about the bazaar-commits
mailing list