/**
|
* \file
|
* Hashtable implementation
|
*
|
* Author:
|
* Miguel de Icaza (miguel@novell.com)
|
*
|
* (C) 2006 Novell, Inc.
|
*
|
* Permission is hereby granted, free of charge, to any person obtaining
|
* a copy of this software and associated documentation files (the
|
* "Software"), to deal in the Software without restriction, including
|
* without limitation the rights to use, copy, modify, merge, publish,
|
* distribute, sublicense, and/or sell copies of the Software, and to
|
* permit persons to whom the Software is furnished to do so, subject to
|
* the following conditions:
|
*
|
* The above copyright notice and this permission notice shall be
|
* included in all copies or substantial portions of the Software.
|
*
|
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
* NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE
|
* LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION
|
* OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
* WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
*/
|
#include <config.h>
|
#include <stdio.h>
|
#include <math.h>
|
#include <glib.h>
|
#include "mono-hash.h"
|
#include "metadata/gc-internals.h"
|
#include "metadata/il2cpp-compat-metadata.h"
|
#include <mono/utils/checked-build.h>
|
#include <mono/utils/mono-threads-coop.h>
|
#include <mono/utils/unlocked.h>
|
|
void il2cpp_mono_gc_wbarrier_generic_store (void* ptr, MonoObject* value);
|
|
gint32 mono_g_hash_table_max_chain_length;
|
|
struct _MonoGHashTable {
|
GHashFunc hash_func;
|
GEqualFunc key_equal_func;
|
|
MonoObject **keys;
|
MonoObject **values;
|
int table_size;
|
int in_use;
|
GDestroyNotify value_destroy_func, key_destroy_func;
|
MonoGHashGCType gc_type;
|
MonoGCRootSource source;
|
void *key;
|
const char *msg;
|
};
|
|
#if UNUSED
|
static gboolean
|
test_prime (int x)
|
{
|
if ((x & 1) != 0) {
|
int n;
|
for (n = 3; n< (int)sqrt (x); n += 2) {
|
if ((x % n) == 0)
|
return FALSE;
|
}
|
return TRUE;
|
}
|
// There is only one even prime - 2.
|
return (x == 2);
|
}
|
|
static int
|
calc_prime (int x)
|
{
|
int i;
|
|
for (i = (x & (~1))-1; i< G_MAXINT32; i += 2) {
|
if (test_prime (i))
|
return i;
|
}
|
return x;
|
}
|
#endif
|
|
#define HASH_TABLE_MAX_LOAD_FACTOR 0.7f
|
/* We didn't really do compaction before, keep it lenient for now */
|
#define HASH_TABLE_MIN_LOAD_FACTOR 0.05f
|
/* We triple the table size at rehash time, similar with previous implementation */
|
#define HASH_TABLE_RESIZE_RATIO 3
|
|
static inline void mono_g_hash_table_key_store (MonoGHashTable *hash, int slot, MonoObject* key)
|
{
|
MonoObject **key_addr = &hash->keys [slot];
|
if (hash->gc_type & MONO_HASH_KEY_GC)
|
mono_gc_wbarrier_generic_store (key_addr, key);
|
else
|
*key_addr = key;
|
}
|
|
static inline void mono_g_hash_table_value_store (MonoGHashTable *hash, int slot, MonoObject* value)
|
{
|
MonoObject **value_addr = &hash->values [slot];
|
if (hash->gc_type & MONO_HASH_VALUE_GC)
|
mono_gc_wbarrier_generic_store (value_addr, value);
|
else
|
*value_addr = value;
|
}
|
|
/* Returns position of key or of an empty slot for it */
|
static inline int mono_g_hash_table_find_slot (MonoGHashTable *hash, const MonoObject *key)
|
{
|
guint start = ((*hash->hash_func) (key)) % hash->table_size;
|
guint i = start;
|
|
if (hash->key_equal_func) {
|
GEqualFunc equal = hash->key_equal_func;
|
|
while (hash->keys [i] && !(*equal) (hash->keys [i], key)) {
|
i++;
|
if (i == hash->table_size)
|
i = 0;
|
}
|
} else {
|
while (hash->keys [i] && hash->keys [i] != key) {
|
i++;
|
if (i == hash->table_size)
|
i = 0;
|
}
|
}
|
|
gint32 max_length = UnlockedRead (&mono_g_hash_table_max_chain_length);
|
if (i > start && (i - start) > max_length)
|
UnlockedWrite (&mono_g_hash_table_max_chain_length, i - start);
|
else if (i < start && (hash->table_size - (start - i)) > max_length)
|
UnlockedWrite (&mono_g_hash_table_max_chain_length, hash->table_size - (start - i));
|
|
return i;
|
}
|
|
|
MonoGHashTable *
|
mono_g_hash_table_new_type (GHashFunc hash_func, GEqualFunc key_equal_func, MonoGHashGCType type, MonoGCRootSource source, void *key, const char *msg)
|
{
|
MonoGHashTable *hash;
|
|
if (!hash_func)
|
hash_func = g_direct_hash;
|
|
hash = g_new0 (MonoGHashTable, 1);
|
|
hash->hash_func = hash_func;
|
hash->key_equal_func = key_equal_func;
|
|
hash->table_size = g_spaced_primes_closest (1);
|
hash->keys = g_new0 (MonoObject*, hash->table_size);
|
hash->values = g_new0 (MonoObject*, hash->table_size);
|
|
hash->gc_type = type;
|
hash->source = source;
|
hash->key = key;
|
hash->msg = msg;
|
|
if (type > MONO_HASH_KEY_VALUE_GC)
|
g_error ("wrong type for gc hashtable");
|
|
if (hash->gc_type & MONO_HASH_KEY_GC)
|
mono_gc_register_root_wbarrier ((char*)hash->keys, sizeof (MonoObject*) * hash->table_size, mono_gc_make_vector_descr (), hash->source, hash->key, hash->msg);
|
if (hash->gc_type & MONO_HASH_VALUE_GC)
|
mono_gc_register_root_wbarrier ((char*)hash->values, sizeof (MonoObject*) * hash->table_size, mono_gc_make_vector_descr (), hash->source, hash->key, hash->msg);
|
|
return hash;
|
}
|
|
typedef struct {
|
MonoGHashTable *hash;
|
int new_size;
|
MonoObject **keys;
|
MonoObject **values;
|
} RehashData;
|
|
static void*
|
do_rehash (void *_data)
|
{
|
RehashData *data = (RehashData *)_data;
|
MonoGHashTable *hash = data->hash;
|
int current_size, i;
|
MonoObject **old_keys;
|
MonoObject **old_values;
|
|
current_size = hash->table_size;
|
hash->table_size = data->new_size;
|
old_keys = hash->keys;
|
old_values = hash->values;
|
hash->keys = data->keys;
|
hash->values = data->values;
|
|
for (i = 0; i < current_size; i++) {
|
if (old_keys [i]) {
|
int slot = mono_g_hash_table_find_slot (hash, old_keys [i]);
|
mono_g_hash_table_key_store (hash, slot, old_keys [i]);
|
mono_g_hash_table_value_store (hash, slot, old_values [i]);
|
}
|
}
|
return NULL;
|
}
|
|
static void
|
rehash (MonoGHashTable *hash)
|
{
|
MONO_REQ_GC_UNSAFE_MODE; //we must run in unsafe mode to make rehash safe
|
|
RehashData data;
|
void *old_keys = hash->keys;
|
void *old_values = hash->values;
|
|
data.hash = hash;
|
/*
|
* Rehash to a size that can fit the current elements. Rehash relative to in_use
|
* to allow also for compaction.
|
*/
|
data.new_size = g_spaced_primes_closest (hash->in_use / HASH_TABLE_MAX_LOAD_FACTOR * HASH_TABLE_RESIZE_RATIO);
|
data.keys = g_new0 (MonoObject*, data.new_size);
|
data.values = g_new0 (MonoObject*, data.new_size);
|
|
if (hash->gc_type & MONO_HASH_KEY_GC)
|
mono_gc_register_root_wbarrier ((char*)data.keys, sizeof (MonoObject*) * data.new_size, mono_gc_make_vector_descr (), hash->source, hash->key, hash->msg);
|
if (hash->gc_type & MONO_HASH_VALUE_GC)
|
mono_gc_register_root_wbarrier ((char*)data.values, sizeof (MonoObject*) * data.new_size, mono_gc_make_vector_descr (), hash->source, hash->key, hash->msg);
|
|
if (!mono_threads_is_coop_enabled ()) {
|
mono_gc_invoke_with_gc_lock (do_rehash, &data);
|
} else {
|
/* We cannot be preempted */
|
do_rehash (&data);
|
}
|
|
if (hash->gc_type & MONO_HASH_KEY_GC)
|
mono_gc_deregister_root ((char*)old_keys);
|
if (hash->gc_type & MONO_HASH_VALUE_GC)
|
mono_gc_deregister_root ((char*)old_values);
|
|
g_free (old_keys);
|
g_free (old_values);
|
}
|
|
/**
|
* mono_g_hash_table_size:
|
*/
|
guint
|
mono_g_hash_table_size (MonoGHashTable *hash)
|
{
|
g_return_val_if_fail (hash != NULL, 0);
|
|
return hash->in_use;
|
}
|
|
/**
|
* mono_g_hash_table_lookup:
|
*/
|
gpointer
|
mono_g_hash_table_lookup (MonoGHashTable *hash, gconstpointer key)
|
{
|
gpointer orig_key, value;
|
|
if (mono_g_hash_table_lookup_extended (hash, key, &orig_key, &value))
|
return value;
|
else
|
return NULL;
|
}
|
|
/**
|
* mono_g_hash_table_lookup_extended:
|
*/
|
gboolean
|
mono_g_hash_table_lookup_extended (MonoGHashTable *hash, gconstpointer key, gpointer *orig_key, gpointer *value)
|
{
|
int slot;
|
|
g_return_val_if_fail (hash != NULL, FALSE);
|
|
slot = mono_g_hash_table_find_slot (hash, key);
|
|
if (hash->keys [slot]) {
|
*orig_key = hash->keys [slot];
|
*value = hash->values [slot];
|
return TRUE;
|
}
|
|
return FALSE;
|
}
|
|
/**
|
* mono_g_hash_table_foreach:
|
*/
|
void
|
mono_g_hash_table_foreach (MonoGHashTable *hash, GHFunc func, gpointer user_data)
|
{
|
int i;
|
|
g_return_if_fail (hash != NULL);
|
g_return_if_fail (func != NULL);
|
|
for (i = 0; i < hash->table_size; i++) {
|
if (hash->keys [i])
|
(*func)(hash->keys [i], hash->values [i], user_data);
|
}
|
}
|
|
gpointer
|
mono_g_hash_table_find (MonoGHashTable *hash, GHRFunc predicate, gpointer user_data)
|
{
|
int i;
|
|
g_return_val_if_fail (hash != NULL, NULL);
|
g_return_val_if_fail (predicate != NULL, NULL);
|
|
for (i = 0; i < hash->table_size; i++) {
|
if (hash->keys [i] && (*predicate)(hash->keys [i], hash->values [i], user_data))
|
return hash->values [i];
|
}
|
return NULL;
|
}
|
|
/**
|
* mono_g_hash_table_remove:
|
*/
|
gboolean
|
mono_g_hash_table_remove (MonoGHashTable *hash, gconstpointer key)
|
{
|
int slot, last_clear_slot;
|
|
g_return_val_if_fail (hash != NULL, FALSE);
|
slot = mono_g_hash_table_find_slot (hash, key);
|
|
if (!hash->keys [slot])
|
return FALSE;
|
|
if (hash->key_destroy_func)
|
(*hash->key_destroy_func)(hash->keys [slot]);
|
hash->keys [slot] = NULL;
|
if (hash->value_destroy_func)
|
(*hash->value_destroy_func)(hash->values [slot]);
|
hash->values [slot] = NULL;
|
hash->in_use--;
|
|
/*
|
* When we insert in the hashtable, if the required position is occupied we
|
* consecutively try out following positions. In order to be able to find
|
* if a key exists or not in the array (without traversing the entire hash)
|
* we maintain the constraint that there can be no free slots between two
|
* entries that are hashed to the same position. This means that, at search
|
* time, when we encounter a free slot we can stop looking for collissions.
|
* Similarly, at remove time, we need to shift all following slots to their
|
* normal slot, until we reach an empty slot.
|
*/
|
last_clear_slot = slot;
|
slot = (slot + 1) % hash->table_size;
|
while (hash->keys [slot]) {
|
guint hashcode = ((*hash->hash_func)(hash->keys [slot])) % hash->table_size;
|
/*
|
* We try to move the current element to last_clear_slot, but only if
|
* it brings it closer to its normal position (hashcode)
|
*/
|
if ((last_clear_slot < slot && (hashcode > slot || hashcode <= last_clear_slot)) ||
|
(last_clear_slot > slot && (hashcode > slot && hashcode <= last_clear_slot))) {
|
mono_g_hash_table_key_store (hash, last_clear_slot, hash->keys [slot]);
|
mono_g_hash_table_value_store (hash, last_clear_slot, hash->values [slot]);
|
hash->keys [slot] = NULL;
|
hash->values [slot] = NULL;
|
last_clear_slot = slot;
|
}
|
slot++;
|
if (slot == hash->table_size)
|
slot = 0;
|
}
|
return TRUE;
|
}
|
|
/**
|
* mono_g_hash_table_foreach_remove:
|
*/
|
guint
|
mono_g_hash_table_foreach_remove (MonoGHashTable *hash, GHRFunc func, gpointer user_data)
|
{
|
int i;
|
int count = 0;
|
|
g_return_val_if_fail (hash != NULL, 0);
|
g_return_val_if_fail (func != NULL, 0);
|
|
for (i = 0; i < hash->table_size; i++) {
|
if (hash->keys [i] && (*func)(hash->keys [i], hash->values [i], user_data)) {
|
mono_g_hash_table_remove (hash, hash->keys [i]);
|
count++;
|
/* Retry current slot in case the removal shifted elements */
|
i--;
|
}
|
}
|
if (hash->in_use < hash->table_size * HASH_TABLE_MIN_LOAD_FACTOR)
|
rehash (hash);
|
return count;
|
}
|
|
/**
|
* mono_g_hash_table_destroy:
|
*/
|
void
|
mono_g_hash_table_destroy (MonoGHashTable *hash)
|
{
|
int i;
|
|
g_return_if_fail (hash != NULL);
|
|
if (hash->gc_type & MONO_HASH_KEY_GC)
|
mono_gc_deregister_root ((char*)hash->keys);
|
if (hash->gc_type & MONO_HASH_VALUE_GC)
|
mono_gc_deregister_root ((char*)hash->values);
|
|
for (i = 0; i < hash->table_size; i++) {
|
if (hash->keys [i]) {
|
if (hash->key_destroy_func)
|
(*hash->key_destroy_func)(hash->keys [i]);
|
if (hash->value_destroy_func)
|
(*hash->value_destroy_func)(hash->values [i]);
|
}
|
}
|
g_free (hash->keys);
|
g_free (hash->values);
|
g_free (hash);
|
}
|
|
static void
|
mono_g_hash_table_insert_replace (MonoGHashTable *hash, gpointer key, gpointer value, gboolean replace)
|
{
|
int slot;
|
g_return_if_fail (hash != NULL);
|
|
if (hash->in_use > (hash->table_size * HASH_TABLE_MAX_LOAD_FACTOR))
|
rehash (hash);
|
|
slot = mono_g_hash_table_find_slot (hash, key);
|
|
if (hash->keys [slot]) {
|
if (replace) {
|
if (hash->key_destroy_func)
|
(*hash->key_destroy_func)(hash->keys [slot]);
|
mono_g_hash_table_key_store (hash, slot, (MonoObject*)key);
|
}
|
if (hash->value_destroy_func)
|
(*hash->value_destroy_func) (hash->values [slot]);
|
mono_g_hash_table_value_store (hash, slot, (MonoObject*)value);
|
} else {
|
mono_g_hash_table_key_store (hash, slot, (MonoObject*)key);
|
mono_g_hash_table_value_store (hash, slot, (MonoObject*)value);
|
hash->in_use++;
|
}
|
}
|
|
/**
|
* mono_g_hash_table_insert:
|
*/
|
void
|
mono_g_hash_table_insert (MonoGHashTable *h, gpointer k, gpointer v)
|
{
|
mono_g_hash_table_insert_replace (h, k, v, FALSE);
|
}
|
|
/**
|
* mono_g_hash_table_replace:
|
*/
|
void
|
mono_g_hash_table_replace(MonoGHashTable *h, gpointer k, gpointer v)
|
{
|
mono_g_hash_table_insert_replace (h, k, v, TRUE);
|
}
|
|
void
|
mono_g_hash_table_print_stats (MonoGHashTable *hash)
|
{
|
int i = 0, chain_size = 0, max_chain_size = 0;
|
gboolean wrapped_around = FALSE;
|
|
while (TRUE) {
|
if (hash->keys [i]) {
|
chain_size++;
|
} else {
|
max_chain_size = MAX(max_chain_size, chain_size);
|
chain_size = 0;
|
if (wrapped_around)
|
break;
|
}
|
|
if (i == (hash->table_size - 1)) {
|
wrapped_around = TRUE;
|
i = 0;
|
} else {
|
i++;
|
}
|
}
|
/* Rehash to a size that can fit the current elements */
|
printf ("Size: %d Table Size: %d Max Chain Length: %d\n", hash->in_use, hash->table_size, max_chain_size);
|
}
|