Signed-off-by: Stefan Beller <[email protected]>
---
>> The reason for my doubt is the potential quadratic behavior for new
>> allocations,
>> in mem_pool_alloc() we walk all mp_blocks to see if we can fit the requested
>> allocation in one of the later blocks.
>> So if we call mem_pool_alloc a million times, we get a O(n) mp_blocks which
>> we'd have to walk in each call.
>
> With the current design, when a new mp_block is allocated, it is
> placed at the head of the linked list. This means that the most
> recently allocated mp_block is the 1st block that is
> searched. The *vast* majority of allocations should be fulfilled
> from this 1st block. It is only when the block is full that we
> search other mp_blocks in the list.
I just measured on git.git and linux.git (both of which are not *huge* by
any standard, but should give a good indication. linux has 6M objects,
and when allocating 1024 at a time, we run into the new block allocation
~6000 times).
I could not measure any meaningful difference.
linux.git $ git count-objects -v
count: 0
size: 0
in-pack: 6036543
packs: 2
size-pack: 2492985
prune-packable: 0
garbage: 0
size-garbage: 0
(with this patch)
Performance counter stats for '/u/git/git count-objects -v' (30 runs):
2.123683 task-clock:u (msec) # 0.831 CPUs utilized
( +- 2.32% )
0 context-switches:u # 0.000 K/sec
0 cpu-migrations:u # 0.000 K/sec
126 page-faults:u # 0.059 M/sec
( +- 0.22% )
895,900 cycles:u # 0.422 GHz
( +- 1.40% )
976,596 instructions:u # 1.09 insn per cycle
( +- 0.01% )
218,256 branches:u # 102.772 M/sec
( +- 0.01% )
8,331 branch-misses:u # 3.82% of all branches
( +- 0.61% )
0.002556203 seconds time elapsed
( +- 2.20% )
Performance counter stats for 'git count-objects -v' (30 runs):
2.410352 task-clock:u (msec) # 0.801 CPUs utilized
( +- 2.79% )
0 context-switches:u # 0.000 K/sec
0 cpu-migrations:u # 0.000 K/sec
131 page-faults:u # 0.054 M/sec
( +- 0.16% )
993,301 cycles:u # 0.412 GHz
( +- 1.99% )
1,087,428 instructions:u # 1.09 insn per cycle
( +- 0.02% )
244,292 branches:u # 101.351 M/sec
( +- 0.02% )
9,264 branch-misses:u # 3.79% of all branches
( +- 0.57% )
0.003010854 seconds time elapsed
( +- 2.54% )
So I think we could just replace it for now and optimize again later, if it
turns out to be a problem. I think the easiest optimisation is to increase
the allocation size of having a lot more objects per mp_block.
> If this is a concern, I think
> we have a couple low cost options to mitigate it (maybe a flag to
> control whether we search past the 1st mp_block for space, or
> logic to move blocks out of the search queue when they are
> full or fall below a threshold for available space).
Instead of a flag I thought of its own struct with its own functions,
which would not just have a different searching behavior, but also
store the size in the struct such that you can just call
fixed_size_mem_pool_alloc(void) to get another pointer.
A flag might be more elegant.
>
> If this is of interest, I could contribute a patch to enable one
> of these behaviors?
I am tempted to just do away with alloc.c for now and use the mem-pool.
Thanks,
Stefan
alloc.c | 60 +++++++++++----------------------------------------------
1 file changed, 11 insertions(+), 49 deletions(-)
diff --git a/alloc.c b/alloc.c
index 12afadfacdd..bf003e161be 100644
--- a/alloc.c
+++ b/alloc.c
@@ -15,6 +15,7 @@
#include "tree.h"
#include "commit.h"
#include "tag.h"
+#include "mem-pool.h"
#define BLOCKING 1024
@@ -26,61 +27,39 @@ union any_object {
struct tag tag;
};
-struct alloc_state {
- int count; /* total number of nodes allocated */
- int nr; /* number of nodes left in current allocation */
- void *p; /* first free node in current allocation */
-};
-
-static inline void *alloc_node(struct alloc_state *s, size_t node_size)
-{
- void *ret;
-
- if (!s->nr) {
- s->nr = BLOCKING;
- s->p = xmalloc(BLOCKING * node_size);
- }
- s->nr--;
- s->count++;
- ret = s->p;
- s->p = (char *)s->p + node_size;
- memset(ret, 0, node_size);
- return ret;
-}
-
-static struct alloc_state blob_state;
+static struct mem_pool blob_state = {NULL, sizeof(struct blob)*1024 -
sizeof(struct mp_block), 0 };
void *alloc_blob_node(void)
{
- struct blob *b = alloc_node(&blob_state, sizeof(struct blob));
+ struct blob *b = mem_pool_alloc(&blob_state, sizeof(struct blob));
b->object.type = OBJ_BLOB;
return b;
}
-static struct alloc_state tree_state;
+static struct mem_pool tree_state = {NULL, sizeof(struct tree)*1024 -
sizeof(struct mp_block), 0 };
void *alloc_tree_node(void)
{
- struct tree *t = alloc_node(&tree_state, sizeof(struct tree));
+ struct tree *t = mem_pool_alloc(&tree_state, sizeof(struct tree));
t->object.type = OBJ_TREE;
return t;
}
-static struct alloc_state tag_state;
+static struct mem_pool tag_state = {NULL, sizeof(struct tag)*1024 -
sizeof(struct mp_block), 0 };
void *alloc_tag_node(void)
{
- struct tag *t = alloc_node(&tag_state, sizeof(struct tag));
+ struct tag *t = mem_pool_alloc(&tag_state, sizeof(struct tag));
t->object.type = OBJ_TAG;
return t;
}
-static struct alloc_state object_state;
+static struct mem_pool object_state = {NULL, sizeof(union any_object)*1024 -
sizeof(struct mp_block), 0 };
void *alloc_object_node(void)
{
- struct object *obj = alloc_node(&object_state, sizeof(union
any_object));
+ struct object *obj = mem_pool_alloc(&object_state, sizeof(union
any_object));
obj->type = OBJ_NONE;
return obj;
}
-static struct alloc_state commit_state;
+static struct mem_pool commit_state = {NULL, sizeof(struct commit)*1024 -
sizeof(struct mp_block), 0 };
unsigned int alloc_commit_index(void)
{
@@ -90,26 +69,9 @@ unsigned int alloc_commit_index(void)
void *alloc_commit_node(void)
{
- struct commit *c = alloc_node(&commit_state, sizeof(struct commit));
+ struct commit *c = mem_pool_alloc(&commit_state, sizeof(struct commit));
c->object.type = OBJ_COMMIT;
c->index = alloc_commit_index();
return c;
}
-static void report(const char *name, unsigned int count, size_t size)
-{
- fprintf(stderr, "%10s: %8u (%"PRIuMAX" kB)\n",
- name, count, (uintmax_t) size);
-}
-
-#define REPORT(name, type) \
- report(#name, name##_state.count, name##_state.count * sizeof(type) >> 10)
-
-void alloc_report(void)
-{
- REPORT(blob, struct blob);
- REPORT(tree, struct tree);
- REPORT(commit, struct commit);
- REPORT(tag, struct tag);
- REPORT(object, union any_object);
-}
--
2.17.0.441.gb46fe60e1d-goog