index-pack: calculate {ref,ofs}_{first,last} early

This is refactoring 2 of 2 to simplify struct base_data.

Whenever we make a struct base_data, immediately calculate its delta
children. This eliminates confusion as to when the
{ref,ofs}_{first,last} fields are initialized.

Before this patch, the delta children were calculated at the last
possible moment. This allowed the members of struct base_data to be
populated in any order, superficially useful when we have the object
contents before the struct object_entry. But this makes reasoning about
the state of struct base_data more complicated, hence this patch.

Signed-off-by: Jonathan Tan <jonathantanmy@google.com>
Signed-off-by: Junio C Hamano <gitster@pobox.com>
This commit is contained in:
Jonathan Tan 2020-08-24 12:16:36 -07:00 committed by Junio C Hamano
parent a7f7e84a49
commit b4718cae51

View file

@ -33,12 +33,15 @@ struct object_stat {
}; };
struct base_data { struct base_data {
/* Initialized by make_base(). */
struct base_data *base; struct base_data *base;
struct object_entry *obj; struct object_entry *obj;
void *data;
unsigned long size;
int ref_first, ref_last; int ref_first, ref_last;
int ofs_first, ofs_last; int ofs_first, ofs_last;
/* Not initialized by make_base(). */
void *data;
unsigned long size;
}; };
struct thread_local { struct thread_local {
@ -362,14 +365,6 @@ static void set_thread_data(struct thread_local *data)
pthread_setspecific(key, data); pthread_setspecific(key, data);
} }
static struct base_data *alloc_base_data(void)
{
struct base_data *base = xcalloc(1, sizeof(struct base_data));
base->ref_last = -1;
base->ofs_last = -1;
return base;
}
static void free_base_data(struct base_data *c) static void free_base_data(struct base_data *c)
{ {
if (c->data) { if (c->data) {
@ -406,19 +401,6 @@ static void prune_base_data(struct base_data *youngest_child)
free(ancestry); free(ancestry);
} }
static void link_base_data(struct base_data *base, struct base_data *c)
{
c->base = base;
if (c->data)
get_thread_data()->base_cache_used += c->size;
prune_base_data(c);
}
static void unlink_base_data(struct base_data *c)
{
free_base_data(c);
}
static int is_delta_type(enum object_type type) static int is_delta_type(enum object_type type)
{ {
return (type == OBJ_REF_DELTA || type == OBJ_OFS_DELTA); return (type == OBJ_REF_DELTA || type == OBJ_OFS_DELTA);
@ -929,10 +911,25 @@ static void *get_base_data(struct base_data *c)
return c->data; return c->data;
} }
static void resolve_delta(struct object_entry *delta_obj, static struct base_data *make_base(struct object_entry *obj,
struct base_data *base, struct base_data *result) struct base_data *parent)
{ {
void *base_data, *delta_data; struct base_data *base = xcalloc(1, sizeof(struct base_data));
base->base = parent;
base->obj = obj;
find_ref_delta_children(&obj->idx.oid,
&base->ref_first, &base->ref_last);
find_ofs_delta_children(obj->idx.offset,
&base->ofs_first, &base->ofs_last);
return base;
}
static struct base_data *resolve_delta(struct object_entry *delta_obj,
struct base_data *base)
{
void *base_data, *delta_data, *result_data;
struct base_data *result;
unsigned long result_size;
if (show_stat) { if (show_stat) {
int i = delta_obj - objects; int i = delta_obj - objects;
@ -946,19 +943,31 @@ static void resolve_delta(struct object_entry *delta_obj,
} }
delta_data = get_data_from_pack(delta_obj); delta_data = get_data_from_pack(delta_obj);
base_data = get_base_data(base); base_data = get_base_data(base);
result->obj = delta_obj; result_data = patch_delta(base_data, base->size,
result->data = patch_delta(base_data, base->size, delta_data, delta_obj->size, &result_size);
delta_data, delta_obj->size, &result->size);
free(delta_data); free(delta_data);
if (!result->data) if (!result_data)
bad_object(delta_obj->idx.offset, _("failed to apply delta")); bad_object(delta_obj->idx.offset, _("failed to apply delta"));
hash_object_file(the_hash_algo, result->data, result->size, hash_object_file(the_hash_algo, result_data, result_size,
type_name(delta_obj->real_type), &delta_obj->idx.oid); type_name(delta_obj->real_type), &delta_obj->idx.oid);
sha1_object(result->data, NULL, result->size, delta_obj->real_type, sha1_object(result_data, NULL, result_size, delta_obj->real_type,
&delta_obj->idx.oid); &delta_obj->idx.oid);
result = make_base(delta_obj, base);
if (result->ref_last == -1 && result->ofs_last == -1) {
free(result_data);
} else {
result->data = result_data;
result->size = result_size;
get_thread_data()->base_cache_used += result->size;
prune_base_data(result);
}
counter_lock(); counter_lock();
nr_resolved_deltas++; nr_resolved_deltas++;
counter_unlock(); counter_unlock();
return result;
} }
/* /*
@ -984,24 +993,9 @@ static int compare_and_swap_type(signed char *type,
static struct base_data *find_unresolved_deltas_1(struct base_data *base, static struct base_data *find_unresolved_deltas_1(struct base_data *base,
struct base_data *prev_base) struct base_data *prev_base)
{ {
if (base->ref_last == -1 && base->ofs_last == -1) {
find_ref_delta_children(&base->obj->idx.oid,
&base->ref_first, &base->ref_last);
find_ofs_delta_children(base->obj->idx.offset,
&base->ofs_first, &base->ofs_last);
if (base->ref_last == -1 && base->ofs_last == -1) {
free(base->data);
return NULL;
}
link_base_data(prev_base, base);
}
if (base->ref_first <= base->ref_last) { if (base->ref_first <= base->ref_last) {
struct object_entry *child = objects + ref_deltas[base->ref_first].obj_no; struct object_entry *child = objects + ref_deltas[base->ref_first].obj_no;
struct base_data *result = alloc_base_data(); struct base_data *result;
if (!compare_and_swap_type(&child->real_type, OBJ_REF_DELTA, if (!compare_and_swap_type(&child->real_type, OBJ_REF_DELTA,
base->obj->real_type)) base->obj->real_type))
@ -1009,7 +1003,7 @@ static struct base_data *find_unresolved_deltas_1(struct base_data *base,
(uintmax_t)child->idx.offset, (uintmax_t)child->idx.offset,
oid_to_hex(&base->obj->idx.oid)); oid_to_hex(&base->obj->idx.oid));
resolve_delta(child, base, result); result = resolve_delta(child, base);
if (base->ref_first == base->ref_last && base->ofs_last == -1) if (base->ref_first == base->ref_last && base->ofs_last == -1)
free_base_data(base); free_base_data(base);
@ -1019,11 +1013,11 @@ static struct base_data *find_unresolved_deltas_1(struct base_data *base,
if (base->ofs_first <= base->ofs_last) { if (base->ofs_first <= base->ofs_last) {
struct object_entry *child = objects + ofs_deltas[base->ofs_first].obj_no; struct object_entry *child = objects + ofs_deltas[base->ofs_first].obj_no;
struct base_data *result = alloc_base_data(); struct base_data *result;
assert(child->real_type == OBJ_OFS_DELTA); assert(child->real_type == OBJ_OFS_DELTA);
child->real_type = base->obj->real_type; child->real_type = base->obj->real_type;
resolve_delta(child, base, result); result = resolve_delta(child, base);
if (base->ofs_first == base->ofs_last) if (base->ofs_first == base->ofs_last)
free_base_data(base); free_base_data(base);
@ -1031,7 +1025,7 @@ static struct base_data *find_unresolved_deltas_1(struct base_data *base,
return result; return result;
} }
unlink_base_data(base); free_base_data(base);
return NULL; return NULL;
} }
@ -1074,9 +1068,8 @@ static int compare_ref_delta_entry(const void *a, const void *b)
static void resolve_base(struct object_entry *obj) static void resolve_base(struct object_entry *obj)
{ {
struct base_data *base_obj = alloc_base_data(); struct base_data *base_obj = make_base(obj, NULL);
base_obj->obj = obj;
base_obj->data = NULL;
find_unresolved_deltas(base_obj); find_unresolved_deltas(base_obj);
} }
@ -1369,22 +1362,26 @@ static void fix_unresolved_deltas(struct hashfile *f)
for (i = 0; i < nr_ref_deltas; i++) { for (i = 0; i < nr_ref_deltas; i++) {
struct ref_delta_entry *d = sorted_by_pos[i]; struct ref_delta_entry *d = sorted_by_pos[i];
enum object_type type; enum object_type type;
struct base_data *base_obj = alloc_base_data(); struct base_data *base;
void *data;
unsigned long size;
struct object_entry *obj;
if (objects[d->obj_no].real_type != OBJ_REF_DELTA) if (objects[d->obj_no].real_type != OBJ_REF_DELTA)
continue; continue;
base_obj->data = read_object_file(&d->oid, &type, data = read_object_file(&d->oid, &type, &size);
&base_obj->size); if (!data)
if (!base_obj->data)
continue; continue;
if (check_object_signature(the_repository, &d->oid, if (check_object_signature(the_repository, &d->oid,
base_obj->data, base_obj->size, data, size,
type_name(type))) type_name(type)))
die(_("local object %s is corrupt"), oid_to_hex(&d->oid)); die(_("local object %s is corrupt"), oid_to_hex(&d->oid));
base_obj->obj = append_obj_to_pack(f, d->oid.hash, obj = append_obj_to_pack(f, d->oid.hash, data, size, type);
base_obj->data, base_obj->size, type); base = make_base(obj, NULL);
find_unresolved_deltas(base_obj); base->data = data;
base->size = size;
find_unresolved_deltas(base);
display_progress(progress, nr_resolved_deltas); display_progress(progress, nr_resolved_deltas);
} }
free(sorted_by_pos); free(sorted_by_pos);