diff options
| author | tompng (tomoya ishida) <tomoyapenguin@gmail.com> | 2021-04-11 19:04:31 +0900 |
|---|---|---|
| committer | Nobuyoshi Nakada <nobu@ruby-lang.org> | 2021-04-11 19:05:26 +0900 |
| commit | 9f9045123efefbd11dd397b4d59596290765feec (patch) | |
| tree | 7b7b4d76d96ca6be82e7c4d26eb3f5e161ea0d18 | |
| parent | 60bdf03b6d982777656acc11bdeb2ca4b4c3f1ef (diff) | |
st.c: skip all deleted entries [Bug #17779]
Update the start entry, skipping all already-deleted entries.
Fixes a performance issue of `Hash#first` in a certain case.
| -rw-r--r-- | benchmark/hash_first.yml | 11 | ||||
| -rw-r--r-- | st.c | 9 |
2 files changed, 18 insertions, 2 deletions
```diff
diff --git a/benchmark/hash_first.yml b/benchmark/hash_first.yml
new file mode 100644
index 0000000000..c26df1a7ed
--- /dev/null
+++ b/benchmark/hash_first.yml
@@ -0,0 +1,11 @@
+prelude: |
+  hash1 = 1_000_000.times.to_h { [rand, true]}
+  hash2 = hash1.dup
+  hash2.keys[1..100_000].each { hash2.delete _1 }
+  hash2.delete hash2.first[0]
+
+benchmark:
+  hash1: hash1.first
+  hash2: hash2.first
+
+loop_count: 100_000
diff --git a/st.c b/st.c
--- a/st.c
+++ b/st.c
@@ -1244,8 +1244,13 @@ update_range_for_deleted(st_table *tab, st_index_t n)
 {
     /* Do not update entries_bound here.  Otherwise, we can fill all
        bins by deleted entry value before rebuilding the table.  */
-    if (tab->entries_start == n)
-        tab->entries_start = n + 1;
+    if (tab->entries_start == n) {
+        st_index_t start = n + 1;
+        st_index_t bound = tab->entries_bound;
+        st_table_entry *entries = tab->entries;
+        while (start < bound && DELETED_ENTRY_P(&entries[start])) start++;
+        tab->entries_start = start;
+    }
 }
 
 /* Delete entry with KEY from table TAB, set up *VALUE (unless
```
