lifted the hash maps and the string cache to the grime package

This commit is contained in:
2024-05-31 20:51:30 -04:00
parent e84ec719b3
commit 9ba718254c
10 changed files with 111 additions and 84 deletions

View File

@@ -0,0 +1,3 @@
# Sectr's Grime
This just contains the mappings file and some stuff I haven't felt like lifting to the grime package yet.

View File

@@ -1,278 +0,0 @@
/*
This is an alternative to Odin's default map type.
The only reason I may need this is due to issues with allocator callbacks or something else going on
with hot-reloads...
---------------------------------------------------------------------------------------------------------
5-21-2024 Update: Still haven't taken the time to see why, but for context: the original case for the above
was, I believe, exclusively when I didn't set the base address of vmem,
OR when I was attempting to use Casey's brute-force replay feature with memory.
5-26-2024 Update:
TODO(Ed): There is a Raw_Map structure defined in base:runtime/core.odin.
We could use the regular dynamic map instead.
---------------------------------------------------------------------------------------------------------
This implementation uses two ZPL-based arrays to hold the entries and the actual hash table.
Instead of using separate chains, it maintains linked entries within the entries array.
Each entry contains a next field, which is an index pointing to the next entry in the same array.
Growing this hashtable is destructive, so it should usually be kept to a fixed size unless
the populating operations only occur in one place and from then on it's read-only.
*/
package sectr
import "core:slice"
// Note(Ed) : See core:hash for hashing procs.
HMapZPL_MapProc :: #type proc( $ Type : typeid, key : u64, value : Type )
HMapZPL_MapMutProc :: #type proc( $ Type : typeid, key : u64, value : ^ Type )
HMapZPL_CritialLoadScale :: 0.70
HMapZPL_HashToEntryRatio :: 1.50
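// Note: hamp_zpl_full (below) treats the table as full once entries.num exceeds
// HMapZPL_CritialLoadScale * table.num; e.g. a 1024-slot table triggers a (destructive)
// grow once more than 716 entries are occupied.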
HMapZPL_FindResult :: struct {
hash_index : i64,
prev_index : i64,
entry_index : i64,
}
HMapZPL_Entry :: struct ( $ Type : typeid) {
key : u64,
next : i64,
value : Type,
}
HMapZPL :: struct ( $ Type : typeid ) {
table : Array( i64 ),
entries : Array( HMapZPL_Entry(Type) ),
}
hmap_zpl_init :: proc
( $HMapZPL_Type : typeid / HMapZPL($Type), num : u64, allocator := context.allocator, dbg_name : string = "" ) -> ( HMapZPL( Type), AllocatorError )
{
result : HMapZPL(Type)
table_result, entries_result : AllocatorError
result.table, table_result = make( Array(i64), num, dbg_name = dbg_name, allocator = allocator )
if table_result != AllocatorError.None {
ensure( false, "Failed to allocate table array" )
return result, table_result
}
array_resize( & result.table, num )
slice.fill( slice_ptr( result.table.data, cast(int) result.table.num), -1 )
result.entries, entries_result = make( Array( HMapZPL_Entry(Type) ), num, dbg_name = dbg_name, allocator = allocator )
if entries_result != AllocatorError.None {
ensure( false, "Failed to allocate entries array" )
return result, entries_result
}
return result, AllocatorError.None
}
hamp_zpl_clear :: proc( using self : ^ HMapZPL( $ Type ) ) {
	for id := 0; id < table.num; id += 1 {
		table[id] = -1
	}
	array_clear( entries )
}
hamp_zpl_destroy :: proc( using self : ^ HMapZPL( $ Type ) ) {
if table.data != nil && table.capacity > 0 {
array_free( table )
array_free( entries )
}
}
hamp_zpl_get :: proc ( using self : ^ HMapZPL( $ Type ), key : u64 ) -> ^ Type
{
// profile(#procedure)
id := hamp_zpl_find( self, key ).entry_index
if id >= 0 {
return & entries.data[id].value
}
return nil
}
hamp_zpl_map :: proc( using self : ^ HMapZPL( $ Type), map_proc : HMapZPL_MapProc ) {
ensure( map_proc != nil, "Mapping procedure must not be null" )
for id := 0; id < entries.num; id += 1 {
map_proc( Type, entries[id].key, entries[id].value )
}
}
hamp_zpl_map_mut :: proc( using self : ^ HMapZPL( $ Type), map_proc : HMapZPL_MapMutProc ) {
ensure( map_proc != nil, "Mapping procedure must not be null" )
for id := 0; id < entries.num; id += 1 {
map_proc( Type, entries[id].key, & entries[id].value )
}
}
hamp_zpl_grow :: proc( using self : ^ HMapZPL( $ Type ) ) -> AllocatorError {
new_num := array_grow_formula( entries.num )
return hamp_zpl_rehash( self, new_num )
}
hamp_zpl_rehash :: proc( ht : ^ HMapZPL( $ Type ), new_num : u64 ) -> AllocatorError
{
profile(#procedure)
// For now the prototype should never allow this to happen.
ensure( false, "ZPL HMAP IS REHASHING" )
last_added_index : i64
new_ht, init_result := hmap_zpl_init( HMapZPL(Type), new_num, ht.table.backing, ht.table.dbg_name )
if init_result != AllocatorError.None {
ensure( false, "New hamp_zpl failed to allocate" )
return init_result
}
for id : u64 = 0; id < ht.entries.num; id += 1 {
find_result : HMapZPL_FindResult
entry := & ht.entries.data[id]
find_result = hamp_zpl_find( & new_ht, entry.key )
last_added_index = hamp_zpl_add_entry( & new_ht, entry.key )
if find_result.prev_index < 0 {
new_ht.table.data[ find_result.hash_index ] = last_added_index
}
else {
new_ht.entries.data[ find_result.prev_index ].next = last_added_index
}
new_ht.entries.data[ last_added_index ].next = find_result.entry_index
new_ht.entries.data[ last_added_index ].value = entry.value
}
hamp_zpl_destroy( ht )
(ht ^) = new_ht
return AllocatorError.None
}
hamp_zpl_rehash_fast :: proc( using self : ^ HMapZPL( $ Type ) )
{
for id := 0; id < entries.num; id += 1 {
entries[id].next = -1
}
for id := 0; id < table.num; id += 1 {
table[id] = -1
}
for id := 0; id < entries.num; id += 1 {
entry := & entries[id]
find_result := hamp_zpl_find( self, entry.key )
if find_result.prev_index < 0 {
table[ find_result.hash_index ] = id
}
else {
entries[ find_result.prev_index ].next = id
}
}
}
// Used when the address space of the allocator changes and the backing reference must be updated
hamp_zpl_reload :: proc( using self : ^HMapZPL($Type), new_backing : Allocator ) {
table.backing = new_backing
entries.backing = new_backing
}
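// For instance, after a hot-reload remaps the backing arena, something like:
//   hamp_zpl_reload( & state.some_map, persistent_allocator() )
// (`state.some_map` is illustrative; persistent_allocator is how the rest of the codebase
//  hands out the persistent arena's allocator)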
hamp_zpl_remove :: proc( using self : ^ HMapZPL( $ Type ), key : u64 ) {
	find_result := hamp_zpl_find( self, key )
if find_result.entry_index >= 0 {
array_remove_at( & entries, find_result.entry_index )
hamp_zpl_rehash_fast( self )
}
}
hamp_zpl_remove_entry :: proc( using self : ^ HMapZPL( $ Type ), id : i64 ) {
array_remove_at( & entries, id )
}
hamp_zpl_set :: proc( using self : ^ HMapZPL( $ Type), key : u64, value : Type ) -> (^ Type, AllocatorError)
{
// profile(#procedure)
id : i64 = 0
find_result : HMapZPL_FindResult
if hamp_zpl_full( self )
{
grow_result := hamp_zpl_grow( self )
if grow_result != AllocatorError.None {
return nil, grow_result
}
}
find_result = hamp_zpl_find( self, key )
if find_result.entry_index >= 0 {
id = find_result.entry_index
}
else
{
id = hamp_zpl_add_entry( self, key )
if find_result.prev_index >= 0 {
entries.data[ find_result.prev_index ].next = id
}
else {
table.data[ find_result.hash_index ] = id
}
}
entries.data[id].value = value
if hamp_zpl_full( self ) {
alloc_error := hamp_zpl_grow( self )
return & entries.data[id].value, alloc_error
}
return & entries.data[id].value, AllocatorError.None
}
hamp_zpl_slot :: proc( using self : ^ HMapZPL( $ Type), key : u64 ) -> i64 {
for id : i64 = 0; id < table.num; id += 1 {
if table.data[id] == key {
return id
}
}
return -1
}
hamp_zpl_add_entry :: proc( using self : ^ HMapZPL( $ Type), key : u64 ) -> i64 {
entry : HMapZPL_Entry(Type) = { key, -1, {} }
id := cast(i64) entries.num
array_append( & entries, entry )
return id
}
hamp_zpl_find :: proc( using self : ^ HMapZPL( $ Type), key : u64 ) -> HMapZPL_FindResult
{
// profile(#procedure)
result : HMapZPL_FindResult = { -1, -1, -1 }
if table.num > 0 {
result.hash_index = cast(i64)( key % table.num )
result.entry_index = table.data[ result.hash_index ]
verify( result.entry_index < i64(entries.num), "Entry index is larger than the number of entries" )
for ; result.entry_index >= 0; {
entry := & entries.data[ result.entry_index ]
if entry.key == key {
break
}
result.prev_index = result.entry_index
result.entry_index = entry.next
}
}
return result
}
hamp_zpl_full :: proc( using self : ^ HMapZPL( $ Type) ) -> b32 {
critical_load := u64(HMapZPL_CritialLoadScale * cast(f64) table.num)
result : b32 = entries.num > critical_load
return result
}
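// Minimal usage sketch: keys are pre-hashed u64 values (see core:hash). The crc32 call,
// context.allocator, and the sizes below are illustrative assumptions, not requirements
// of the container; size the table generously up-front since growth is destructive.
hmap_zpl_usage_example :: proc()
{
	ht, init_error := hmap_zpl_init( HMapZPL(int), 1024, context.allocator, "example table" )
	ensure( init_error == AllocatorError.None, "Failed to initialize the example table" )

	content : string = "some_key"
	key     := u64( crc32( transmute([]byte) content ) )

	// Insert (or overwrite) the value stored for the hashed key.
	_, set_error := hamp_zpl_set( & ht, key, 42 )
	ensure( set_error == AllocatorError.None, "Failed to insert into the example table" )

	// Lookups return a pointer into the entries array, or nil when the key is absent.
	if found := hamp_zpl_get( & ht, key ); found != nil {
		(found ^) = 100
	}

	hamp_zpl_remove( & ht, key )
	hamp_zpl_destroy( & ht )
}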

View File

@@ -174,6 +174,13 @@ import "codebase:grime"
hmap_chained_set :: grime.hmap_chained_set
hmap_chained_reload :: grime.hmap_chained_reload
HMapZPL :: grime.HMapZPL
hmap_zpl_init :: grime.hmap_zpl_init
hmap_zpl_get :: grime.hmap_zpl_get
hmap_zpl_reload :: grime.hmap_zpl_reload
hmap_zpl_set :: grime.hmap_zpl_set
Pool :: grime.Pool
Slab :: grime.Slab
@@ -234,12 +241,25 @@ import "codebase:grime"
memtracker_register_auto_name_slice :: grime.memtracker_register_auto_name_slice
memtracker_unregister :: grime.memtracker_unregister
calc_padding_with_header :: grime.calc_padding_with_header
memory_after_header :: grime.memory_after_header
memory_after :: grime.memory_after
swap :: grime.swap
// strings
StrRunesPair :: grime.StrRunesPair
StringCache :: grime.StringCache
str_cache_init :: grime.str_cache_init
str_cache_reload :: grime.str_cache_reload
str_cache_set_module_ctx :: grime.str_cache_set_module_ctx
// str_intern_key :: grime.str_intern_key
// str_intern_lookup :: grime.str_intern_lookup
str_intern :: grime.str_intern
str_intern_fmt :: grime.str_intern_fmt
to_str_runes_pair_via_string :: grime.to_str_runes_pair_via_string
to_str_runes_pair_via_runes :: grime.to_str_runes_pair_via_runes
// profiler
SpallProfiler :: grime.SpallProfiler

View File

@@ -1,122 +0,0 @@
/*
String Interning Table using its own dedicated slab & chained hashtable
If linear probing, the hash node list per table bucket is stored with the strings in the same arena.
If open addressing, we just keep the open-addressed array of node slots in the general slab (but hopefully with better perf).
TODO(Ed): Move the string cache to its own virtual arena?
It's going to be used heavily and we can better utilize memory that way.
The arena can deal with alignment just fine, or we can pad in a minimum amount per string.
*/
package sectr
import "base:runtime"
import "core:mem"
import "core:slice"
import "core:strings"
StringKey :: distinct u64
RunesCached :: []rune
// TODO(Ed): There doesn't seem to be a need for caching the runes.
// It seems like no one has had a bottleneck just iterating through the code points on demand when needed.
// So we should probably scrap storing them that way.
StrRunesPair :: struct {
str : string,
runes : []rune,
}
to_str_runes_pair_via_string :: #force_inline proc ( content : string ) -> StrRunesPair { return { content, to_runes(content) } }
to_str_runes_pair_via_runes :: #force_inline proc ( content : []rune ) -> StrRunesPair { return { to_string(content), content } }
StringCache :: struct {
slab : Slab,
table : HMapZPL(StrRunesPair),
}
str_cache_init :: proc( /*allocator : Allocator*/ ) -> ( cache : StringCache ) {
alignment := uint(mem.DEFAULT_ALIGNMENT)
policy : SlabPolicy
policy_ptr := & policy
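// Each SlabSizeClass below presumably pairs a block size with a cell (allocation) size and
// an alignment: classes step from 8-byte cells in 64 KB blocks up to 32 KB cells in 32 MB blocks,
// so interned strings of any practical length land in a reasonably sized pool.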
push( policy_ptr, SlabSizeClass { 64 * Kilobyte, 8, alignment })
push( policy_ptr, SlabSizeClass { 64 * Kilobyte, 16, alignment })
push( policy_ptr, SlabSizeClass { 128 * Kilobyte, 32, alignment })
push( policy_ptr, SlabSizeClass { 128 * Kilobyte, 64, alignment })
push( policy_ptr, SlabSizeClass { 64 * Kilobyte, 128, alignment })
push( policy_ptr, SlabSizeClass { 64 * Kilobyte, 256, alignment })
push( policy_ptr, SlabSizeClass { 64 * Kilobyte, 512, alignment })
push( policy_ptr, SlabSizeClass { 1 * Megabyte, 1 * Kilobyte, alignment })
push( policy_ptr, SlabSizeClass { 4 * Megabyte, 4 * Kilobyte, alignment })
push( policy_ptr, SlabSizeClass { 16 * Megabyte, 16 * Kilobyte, alignment })
push( policy_ptr, SlabSizeClass { 32 * Megabyte, 32 * Kilobyte, alignment })
// push( policy_ptr, SlabSizeClass { 64 * Megabyte, 64 * Kilobyte, alignment })
// push( policy_ptr, SlabSizeClass { 64 * Megabyte, 128 * Kilobyte, alignment })
// push( policy_ptr, SlabSizeClass { 64 * Megabyte, 256 * Kilobyte, alignment })
// push( policy_ptr, SlabSizeClass { 64 * Megabyte, 512 * Kilobyte, alignment })
// push( policy_ptr, SlabSizeClass { 64 * Megabyte, 1 * Megabyte, alignment })
header_size :: size_of( Slab )
@static dbg_name := "StringCache slab"
state := get_state()
alloc_error : AllocatorError
cache.slab, alloc_error = slab_init( & policy, dbg_name = dbg_name, allocator = persistent_allocator() )
verify(alloc_error == .None, "Failed to initialize the string cache" )
cache.table, alloc_error = make( HMapZPL(StrRunesPair), 4 * Megabyte, persistent_allocator(), dbg_name )
verify(alloc_error == .None, "Failed to initialize the string cache table" )
return
}
str_intern_key :: #force_inline proc( content : string ) -> StringKey { return cast(StringKey) crc32( transmute([]byte) content ) }
str_intern_lookup :: #force_inline proc( key : StringKey ) -> (^StrRunesPair) { return hamp_zpl_get( & get_state().string_cache.table, transmute(u64) key ) }
str_intern :: proc( content : string ) -> StrRunesPair
{
// profile(#procedure)
cache := & get_state().string_cache
key := str_intern_key(content)
result := hamp_zpl_get( & cache.table, transmute(u64) key )
if result != nil {
return (result ^)
}
// profile_begin("new entry")
{
length := len(content)
// str_mem, alloc_error := alloc( length, mem.DEFAULT_ALIGNMENT )
str_mem, alloc_error := slab_alloc( cache.slab, uint(length), uint(mem.DEFAULT_ALIGNMENT), zero_memory = false )
verify( alloc_error == .None, "String cache had a backing allocator error" )
// copy_non_overlapping( str_mem, raw_data(content), length )
copy_non_overlapping( raw_data(str_mem), raw_data(content), length )
runes : []rune
// runes, alloc_error = to_runes( content, persistent_allocator() )
runes, alloc_error = to_runes( content, slab_allocator(cache.slab) )
verify( alloc_error == .None, "String cache had a backing allocator error" )
slab_validate_pools( get_state().persistent_slab )
// result, alloc_error = hamp_zpl_set( & cache.table, key, StrRunesPair { transmute(string) byte_slice(str_mem, length), runes } )
result, alloc_error = hamp_zpl_set( & cache.table, transmute(u64) key, StrRunesPair { transmute(string) str_mem, runes } )
verify( alloc_error == .None, "String cache had a backing allocator error" )
slab_validate_pools( get_state().persistent_slab )
}
// profile_end()
return (result ^)
}
str_intern_fmt :: #force_inline proc( format : string, args : ..any, allocator := context.allocator ) -> StrRunesPair {
return str_intern(str_fmt(format, ..args, allocator = allocator))
}
// runes_intern :: proc( content : []rune ) -> StrRunesPair
// {
// cache := get_state().string_cache
// }
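// Minimal usage sketch: assumes the module state and string cache have already been
// initialized (str_cache_init / str_cache_set_module_ctx); the literal content is illustrative.
str_cache_usage_example :: proc()
{
	first  := str_intern( "hello" )
	second := str_intern( "hello" )

	// The second call should hit the table via the crc32 key and return the same
	// slab-backed string rather than allocating a new copy.
	verify( raw_data(first.str) == raw_data(second.str), "Interned strings should share storage" )

	// The cached runes sit alongside the string in the pair.
	verify( len(first.runes) == 5, "Expected 5 code points" )
}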