diff options
author | Nicolas Pitre <nico@cam.org> | 2005-05-06 13:48:34 -0400 |
---|---|---|
committer | Linus Torvalds <torvalds@ppc970.osdl.org> | 2005-05-06 11:02:01 -0700 |
commit | bd2c39f58f915af532b488c5bda753314f0db603 (patch) | |
tree | 8c1e85a4af5d77cff94fc2703c271bbfc512778e /blob.c | |
parent | f4f21ce367a5119be1c4396d01271ece6e40ff70 (diff) | |
download | git-bd2c39f58f915af532b488c5bda753314f0db603.tar.gz |
[PATCH] don't load and decompress objects twice with parse_object()
It turns out that parse_object() loads and decompresses the given
object, only to free it just before calling the specific object parsing
function, which mmaps and decompresses the same object again. This
patch introduces the ability to parse specific objects directly from a
memory buffer.
Without this patch, running git-fsck-cache on the kernel repository takes:
real 0m13.006s
user 0m11.421s
sys 0m1.218s
With this patch applied:
real 0m8.060s
user 0m7.071s
sys 0m0.710s
The performance increase is significant, and this is kind of a
prerequisite for sane delta object support with fsck.
Signed-off-by: Nicolas Pitre <nico@cam.org>
Signed-off-by: Linus Torvalds <torvalds@osdl.org>
Diffstat (limited to 'blob.c')
-rw-r--r-- | blob.c | 14 |
1 files changed, 11 insertions, 3 deletions
@@ -22,21 +22,29 @@ struct blob *lookup_blob(unsigned char *sha1)
 	return (struct blob *) obj;
 }
 
+int parse_blob_buffer(struct blob *item, void *buffer, unsigned long size)
+{
+	item->object.parsed = 1;
+	return 0;
+}
+
 int parse_blob(struct blob *item)
 {
 	char type[20];
 	void *buffer;
 	unsigned long size;
+	int ret;
+
 	if (item->object.parsed)
 		return 0;
-	item->object.parsed = 1;
 	buffer = read_sha1_file(item->object.sha1, type, &size);
 	if (!buffer)
 		return error("Could not read %s",
 			     sha1_to_hex(item->object.sha1));
-	free(buffer);
 	if (strcmp(type, blob_type))
 		return error("Object %s not a blob",
 			     sha1_to_hex(item->object.sha1));
-	return 0;
+	ret = parse_blob_buffer(item, buffer, size);
+	free(buffer);
+	return ret;
 }