libaaruformat 1.0
Aaru Data Preservation Suite - Format Library
Loading...
Searching...
No Matches
hash_map.c
Go to the documentation of this file.
1/*
2 * This file is part of the Aaru Data Preservation Suite.
3 * Copyright (c) 2019-2026 Natalia Portillo.
4 *
5 * This library is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU Lesser General Public License as
7 * published by the Free Software Foundation; either version 2.1 of the
8 * License, or (at your option) any later version.
9 *
10 * This library is distributed in the hope that it will be useful, but
11 * WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
13 * Lesser General Public License for more details.
14 *
15 * You should have received a copy of the GNU Lesser General Public
16 * License along with this library; if not, see <http://www.gnu.org/licenses/>.
17 */
18
19#include <stdbool.h>
20#include <stdint.h>
21#include <stdlib.h>
22
23#include "hash_map.h"
24
25#define INITIAL_SIZE 1024
26#define LOAD_FACTOR 0.75
27#define LARGE_MAP_THRESHOLD (2ULL * 1024 * 1024 * 1024 / sizeof(kv_pair_t)) // ~2GB worth of entries
28#define LARGE_GROWTH_FACTOR 1.25 // 25% growth for large maps
29
52{
53 // Enforce minimum size to prevent division by zero in modulo operations
54 if(size < INITIAL_SIZE) size = INITIAL_SIZE;
55
56 hash_map_t *map = malloc(sizeof(hash_map_t));
57 map->table = calloc(size, sizeof(kv_pair_t));
58 map->size = size;
59 map->count = 0;
60
61 return map;
62}
63
79{
80 free(map->table);
81 free(map);
82}
83
103static size_t calculate_new_size(size_t current_size)
104{
105 if(current_size < LARGE_MAP_THRESHOLD) return current_size * 2;
106
107 return (size_t)((double)current_size * LARGE_GROWTH_FACTOR);
108}
109
133static void resize_map(hash_map_t *map, size_t new_size)
134{
135 kv_pair_t *old_table = map->table;
136 size_t old_size = map->size;
137
138 map->table = calloc(new_size, sizeof(kv_pair_t));
139 map->size = new_size;
140 map->count = 0;
141
142 for(size_t i = 0; i < old_size; i++)
143 if(old_table[i].key != 0)
144 {
145 // Re-insert
146 size_t idx = old_table[i].key % new_size;
147
148 while(map->table[idx].key != 0) idx = (idx + 1) % new_size;
149
150 map->table[idx] = old_table[i];
151 map->count++;
152 }
153
154 free(old_table);
155}
156
185bool insert_map(hash_map_t *map, uint64_t key, uint64_t value)
186{
187 if((double)map->count / map->size > LOAD_FACTOR) resize_map(map, calculate_new_size(map->size));
188
189 size_t idx = key % map->size;
190
191 while(map->table[idx].key != 0 && map->table[idx].key != key) idx = (idx + 1) % map->size;
192
193 if(map->table[idx].key == key) return false; // Already present
194
195 map->table[idx].key = key;
196 map->table[idx].value = value;
197 map->count++;
198
199 return true;
200}
201
228bool lookup_map(const hash_map_t *map, uint64_t key, uint64_t *out_value)
229{
230 size_t idx = key % map->size;
231
232 while(map->table[idx].key != 0)
233 {
234 if(map->table[idx].key == key)
235 {
236 *out_value = map->table[idx].value;
237 return true;
238 }
239
240 idx = (idx + 1) % map->size;
241 }
242
243 return false;
244}
bool lookup_map(const hash_map_t *map, uint64_t key, uint64_t *out_value)
Looks up a value by key in the hash map.
Definition hash_map.c:228
static size_t calculate_new_size(size_t current_size)
Calculates the new size for hash map resizing.
Definition hash_map.c:103
#define LARGE_GROWTH_FACTOR
Definition hash_map.c:28
#define INITIAL_SIZE
Definition hash_map.c:25
hash_map_t * create_map(size_t size)
Creates a new hash map with the specified initial size.
Definition hash_map.c:51
bool insert_map(hash_map_t *map, uint64_t key, uint64_t value)
Inserts a key-value pair into the hash map.
Definition hash_map.c:185
#define LARGE_MAP_THRESHOLD
Definition hash_map.c:27
#define LOAD_FACTOR
Definition hash_map.c:26
void free_map(hash_map_t *map)
Frees all memory associated with a hash map.
Definition hash_map.c:78
static void resize_map(hash_map_t *map, size_t new_size)
Resizes the hash map to a new size and rehashes all entries.
Definition hash_map.c:133
Minimal open-addressing hash map for 64-bit key/value pairs used in deduplication lookup.
Definition hash_map.h:50
size_t count
Number of active (filled) entries.
Definition hash_map.h:53
size_t size
Allocated slot capacity of table.
Definition hash_map.h:52
kv_pair_t * table
Array of key/value slots of length == size.
Definition hash_map.h:51
Single key/value slot used internally by the open-addressing hash map.
Definition hash_map.h:33
uint64_t value
Associated value payload (64-bit) stored alongside the key.
Definition hash_map.h:35
uint64_t key
Stored key (64-bit). May use a reserved sentinel to denote an empty slot.
Definition hash_map.h:34