Skip to content

Commit

Permalink
IdDict: support deletion, and support nothing used as a key
Browse files Browse the repository at this point in the history
previously, if we deleted one key or added `nothing` as a key,
we might lose some of the other entries too (until rehash)

fix #26833

(cherry-pick PR #26839, 5e57c21)
  • Loading branch information
vtjnash committed Apr 27, 2018
1 parent 41143e8 commit 6d60f78
Show file tree
Hide file tree
Showing 2 changed files with 61 additions and 23 deletions.
60 changes: 37 additions & 23 deletions src/table.c
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
#define keyhash(k) jl_object_id(k)
#define h2index(hv,sz) (size_t)(((hv) & ((sz)-1))*2)

static void **jl_table_lookup_bp(jl_array_t **pa, void *key);
static int jl_table_assign_bp(jl_array_t **pa, void *key, void *val);

JL_DLLEXPORT jl_array_t *jl_idtable_rehash(jl_array_t *a, size_t newsz)
{
Expand All @@ -23,7 +23,7 @@ JL_DLLEXPORT jl_array_t *jl_idtable_rehash(jl_array_t *a, size_t newsz)
JL_GC_PUSH1(&newa);
for(i=0; i < sz; i+=2) {
if (ol[i+1] != NULL) {
(*jl_table_lookup_bp(&newa, ol[i])) = ol[i+1];
jl_table_assign_bp(&newa, ol[i], ol[i + 1]);
jl_gc_wb(newa, ol[i+1]);
// it is however necessary here because allocation
// can (and will) occur in a recursive call inside table_lookup_bp
Expand All @@ -37,12 +37,12 @@ JL_DLLEXPORT jl_array_t *jl_idtable_rehash(jl_array_t *a, size_t newsz)
return newa;
}

static void **jl_table_lookup_bp(jl_array_t **pa, void *key)
static int jl_table_assign_bp(jl_array_t **pa, void *key, void *val)
{
// pa points to a **rooted** gc frame slot
uint_t hv;
jl_array_t *a = *pa;
size_t orig, index, iter;
size_t orig, index, iter, empty_slot;
size_t newsz, sz = hash_size(a);
assert(sz >= 1);
size_t maxprobe = max_probe(sz);
Expand All @@ -54,23 +54,40 @@ static void **jl_table_lookup_bp(jl_array_t **pa, void *key)
index = h2index(hv,sz);
sz *= 2;
orig = index;
empty_slot = -1;

do {
if (tab[index+1] == NULL) {
tab[index] = key;
jl_gc_wb(a, key);
return &tab[index+1];
if (tab[index] == NULL) {
if (empty_slot == -1)
empty_slot = index;
break;
}
if (jl_egal((jl_value_t *)key, (jl_value_t *)tab[index])) {
if (tab[index + 1] != NULL) {
tab[index + 1] = val;
jl_gc_wb(a, val);
return 0;
}
// `nothing` is our sentinel value for deletion, so need to keep searching if it's also our search key
assert(key == jl_nothing);
if (empty_slot == -1)
empty_slot = index;
}

if (jl_egal((jl_value_t*)key, (jl_value_t*)tab[index]))
return &tab[index+1];

index = (index+2) & (sz-1);
iter++;
if (iter > maxprobe)
break;
} while (index != orig);

if (empty_slot != -1) {
tab[empty_slot] = key;
jl_gc_wb(a, key);
tab[empty_slot + 1] = val;
jl_gc_wb(a, val);
return 1;
}

/* table full */
/* quadruple size, rehash, retry the insert */
/* it's important to grow the table really fast; otherwise we waste */
Expand All @@ -90,12 +107,9 @@ static void **jl_table_lookup_bp(jl_array_t **pa, void *key)
maxprobe = max_probe(sz);

goto retry_bp;

return NULL;
}

/* returns bp if key is in hash, otherwise NULL */
/* if return is non-NULL and *bp == NULL then key was deleted */
static void **jl_table_peek_bp(jl_array_t *a, void *key)
{
size_t sz = hash_size(a);
Expand All @@ -111,8 +125,12 @@ static void **jl_table_peek_bp(jl_array_t *a, void *key)
do {
if (tab[index] == NULL)
return NULL;
if (jl_egal((jl_value_t*)key, (jl_value_t*)tab[index]))
return &tab[index+1];
if (jl_egal((jl_value_t*)key, (jl_value_t*)tab[index])) {
if (tab[index+1] != NULL)
return &tab[index+1];
// `nothing` is our sentinel value for deletion, so need to keep searching if it's also our search key
assert(key == jl_nothing);
}

index = (index+2) & (sz-1);
iter++;
Expand All @@ -128,9 +146,7 @@ jl_array_t *jl_eqtable_put(jl_array_t *h, void *key, void *val)
{
JL_GC_PUSH1(&h);
// &h may be assigned to in jl_idtable_rehash so it need to be rooted
void **bp = jl_table_lookup_bp(&h, key);
*bp = val;
jl_gc_wb(h, val);
jl_table_assign_bp(&h, key, val);
JL_GC_POP();
return h;
}
Expand All @@ -139,16 +155,14 @@ JL_DLLEXPORT
jl_value_t *jl_eqtable_get(jl_array_t *h, void *key, jl_value_t *deflt)
{
void **bp = jl_table_peek_bp(h, key);
if (bp == NULL || *bp == NULL)
return deflt;
return (jl_value_t*)*bp;
return (bp == NULL) ? deflt : (jl_value_t *)*bp;
}

JL_DLLEXPORT
jl_value_t *jl_eqtable_pop(jl_array_t *h, void *key, jl_value_t *deflt)
{
void **bp = jl_table_peek_bp(h, key);
if (bp == NULL || *bp == NULL)
if (bp == NULL)
return deflt;
jl_value_t *val = (jl_value_t*)*bp;
*(bp-1) = jl_nothing; // clear the key
Expand Down
24 changes: 24 additions & 0 deletions test/dict.jl
Original file line number Diff line number Diff line change
Expand Up @@ -413,6 +413,30 @@ let d = @inferred ObjectIdDict(Pair(1,1), Pair(2,2), Pair(3,3))
@test eltype(d) == Pair{Any,Any}
end

@testset "issue #26833, deletion from IdDict" begin
d = ObjectIdDict()
i = 1
# generate many hash collisions
while length(d) < 32 # expected to occur at i <≈ 2^16 * 2^5
if object_id(i) % UInt16 == 0x1111
push!(d, i => true)
end
i += 1
end
k = collect(keys(d))
@test haskey(d, k[1])
delete!(d, k[1])
@test length(d) == 31
@test !haskey(d, k[1])
@test haskey(d, k[end])
push!(d, k[end] => false)
@test length(d) == 31
@test haskey(d, k[end])
@test !pop!(d, k[end])
@test !haskey(d, k[end])
@test length(d) == 30
end

# Issue #7944
let d = Dict{Int,Int}()
get!(d, 0) do
Expand Down

0 comments on commit 6d60f78

Please sign in to comment.