hakmem/core/hakmem_tiny_ace_guard_box.inc

// ============================================================================
// ACE Learning Layer: Runtime parameter setters
// ============================================================================

void hkm_ace_set_drain_threshold(int class_idx, uint32_t threshold) {
    // Validate inputs
    if (class_idx < 0 || class_idx >= TINY_NUM_CLASSES) {
        return;
    }
    if (threshold < 16 || threshold > 2048) {
        return;
    }

    // Set per-class threshold (used by remote free drain logic)
    g_remote_drain_thresh_per_class[class_idx] = (int)threshold;
}
#include "tiny_fc_api.h"
int tiny_fc_room(int class_idx) {
    if (class_idx < 0 || class_idx >= TINY_NUM_CLASSES) return 0;
    TinyFastCache* fc = &g_fast_cache[class_idx];
    // Effective per-class cap comes from g_fast_cap (env-tunable),
    // clamped by the static storage capacity TINY_FASTCACHE_CAP.
    uint16_t eff_cap = g_fast_cap[class_idx];
    if (eff_cap > TINY_FASTCACHE_CAP) eff_cap = TINY_FASTCACHE_CAP;
    int room = (int)eff_cap - fc->top;
    return room > 0 ? room : 0;
}

int tiny_fc_push_bulk(int class_idx, void** arr, int n) {
    if (!arr || n <= 0) return 0;
    if (class_idx < 0 || class_idx >= TINY_NUM_CLASSES) return 0;
    TinyFastCache* fc = &g_fast_cache[class_idx];
    uint16_t eff_cap = g_fast_cap[class_idx];
    if (eff_cap > TINY_FASTCACHE_CAP) eff_cap = TINY_FASTCACHE_CAP;
    int room = (int)eff_cap - fc->top;
    if (room <= 0) return 0;
    int take = n < room ? n : room;
    // Forward fill with light unrolling to reduce branch overhead
    int i = 0;
    for (; i + 3 < take; i += 4) {
        fc->items[fc->top++] = arr[i];
        fc->items[fc->top++] = arr[i + 1];
        fc->items[fc->top++] = arr[i + 2];
        fc->items[fc->top++] = arr[i + 3];
    }
    for (; i < take; i++) {
        fc->items[fc->top++] = arr[i];
    }
    return take;
}

// ========= Tiny Guard (targeted debug; low overhead when disabled) =========
static int g_tiny_guard_enabled = -1;
static int g_tiny_guard_class = 2;
static int g_tiny_guard_limit = 8;
static __thread int g_tiny_guard_seen = 0;

static inline int tiny_guard_enabled_runtime(void) {
    if (__builtin_expect(g_tiny_guard_enabled == -1, 0)) {
        // Enabled via HAKMEM_DEBUG_LEVEL >= 4 (DEBUG level)
        // Legacy: HAKMEM_TINY_GUARD=1 still works for compatibility
        g_tiny_guard_enabled = hak_debug_check_level("HAKMEM_TINY_GUARD", 4);

        // Special-purpose parameters (kept for targeted debugging)
        const char* ec = getenv("HAKMEM_TINY_GUARD_CLASS");
        if (ec && *ec) g_tiny_guard_class = atoi(ec);
        const char* el = getenv("HAKMEM_TINY_GUARD_MAX");
        if (el && *el) g_tiny_guard_limit = atoi(el);
        if (g_tiny_guard_limit <= 0) g_tiny_guard_limit = 8;
    }
    return g_tiny_guard_enabled;
}

int tiny_guard_is_enabled(void) { return tiny_guard_enabled_runtime(); }

static void tiny_guard_dump_bytes(const char* tag, const uint8_t* p, size_t n) {
    fprintf(stderr, "[TGUARD] %s:", tag);
    for (size_t i = 0; i < n; i++) fprintf(stderr, " %02x", p[i]);
    fprintf(stderr, "\n");
}

void tiny_guard_on_alloc(int cls, void* base, void* user, size_t stride) {
    if (!tiny_guard_enabled_runtime() || cls != g_tiny_guard_class) return;
    if (g_tiny_guard_seen++ >= g_tiny_guard_limit) return;
    uint8_t* b = (uint8_t*)base;
    fprintf(stderr, "[TGUARD] alloc cls=%d base=%p user=%p stride=%zu hdr=%02x\n",
            cls, base, user, stride, b[0]);
    // 隣接ヘッダ可視化（前後）
    tiny_guard_dump_bytes("around_base", b, (stride >= 8 ? 8 : stride));
    tiny_guard_dump_bytes("next_header", b + stride, 4);
}

void tiny_guard_on_invalid(void* user_ptr, uint8_t hdr) {
    if (!tiny_guard_enabled_runtime()) return;
    if (g_tiny_guard_seen++ >= g_tiny_guard_limit) return;
    uint8_t* u = (uint8_t*)user_ptr;
    fprintf(stderr, "[TGUARD] invalid header at user=%p hdr=%02x prev=%02x next=%02x\n",
            user_ptr, hdr, *(u - 2), *(u));
    tiny_guard_dump_bytes("dump_before", u - 8, 8);
    tiny_guard_dump_bytes("dump_after", u, 8);
}
Refactor: Extract 5 Box modules from hakmem_tiny.c (-52% size reduction) Split hakmem_tiny.c (2081 lines) into focused modules for better maintainability. ## Changes hakmem_tiny.c: 2081 → 995 lines (-1086 lines, -52% reduction) ## Extracted Modules (5 boxes) 1. config_box (211 lines) - Size class tables, integrity counters - Debug flags, benchmark macros - HAK_RET_ALLOC/HAK_STAT_FREE instrumentation 2. publish_box (419 lines) - Publish/Adopt counters and statistics - Bench mailbox, partial ring - Live cap/Hot slot management - TLS helper functions (tiny_tls_default_) 3. globals_box* (256 lines) - Global variable declarations (~70 variables) - TinyPool instance and initialization flag - TLS variables (g_tls_lists, g_fast_head, g_fast_count) - SuperSlab configuration (partial ring, empty reserves) - Adopt gate functions 4. phase6_wrappers_box (122 lines) - Phase 6 Box Theory wrapper layer - hak_tiny_alloc_fast_wrapper() - hak_tiny_free_fast_wrapper() - Diagnostic instrumentation 5. ace_guard_box (100 lines) - ACE Learning Layer (hkm_ace_set_drain_threshold) - FastCache API (tiny_fc_room, tiny_fc_push_bulk) - Tiny Guard debugging system (5 functions) ## Benefits - Readability: Giant 2k file → focused 1k core + 5 coherent modules - Maintainability: Each box has clear responsibility and boundaries - Build: All modules compile successfully ✅ ## Technical Details - Phase 1: ChatGPT extracted config_box + publish_box (-625 lines) - Phase 2-4: Claude extracted globals_box + phase6_wrappers_box + ace_guard_box (-461 lines) - All extractions use .inc files (same translation unit, preserves static/TLS linkage) - Fixed Makefile: Added tiny_sizeclass_hist_box.o to OBJS_BASE and BENCH_HAKMEM_OBJS_BASE 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> 2025-11-21 01:16:45 +09:00			`// ============================================================================`
			`// ACE Learning Layer: Runtime parameter setters`
			`// ============================================================================`

			`void hkm_ace_set_drain_threshold(int class_idx, uint32_t threshold) {`
			`// Validate inputs`
			`if (class_idx < 0 \|\| class_idx >= TINY_NUM_CLASSES) {`
			`return;`
			`}`
			`if (threshold < 16 \|\| threshold > 2048) {`
			`return;`
			`}`

			`// Set per-class threshold (used by remote free drain logic)`
			`g_remote_drain_thresh_per_class[class_idx] = (int)threshold;`
			`}`
			`#include "tiny_fc_api.h"`
			`int tiny_fc_room(int class_idx) {`
			`if (class_idx < 0 \|\| class_idx >= TINY_NUM_CLASSES) return 0;`
			`TinyFastCache* fc = &g_fast_cache[class_idx];`
			`// Effective per-class cap comes from g_fast_cap (env-tunable),`
			`// clamped by the static storage capacity TINY_FASTCACHE_CAP.`
			`uint16_t eff_cap = g_fast_cap[class_idx];`
			`if (eff_cap > TINY_FASTCACHE_CAP) eff_cap = TINY_FASTCACHE_CAP;`
			`int room = (int)eff_cap - fc->top;`
			`return room > 0 ? room : 0;`
			`}`

			`int tiny_fc_push_bulk(int class_idx, void** arr, int n) {`
			`if (!arr \|\| n <= 0) return 0;`
			`if (class_idx < 0 \|\| class_idx >= TINY_NUM_CLASSES) return 0;`
			`TinyFastCache* fc = &g_fast_cache[class_idx];`
			`uint16_t eff_cap = g_fast_cap[class_idx];`
			`if (eff_cap > TINY_FASTCACHE_CAP) eff_cap = TINY_FASTCACHE_CAP;`
			`int room = (int)eff_cap - fc->top;`
			`if (room <= 0) return 0;`
			`int take = n < room ? n : room;`
			`// Forward fill with light unrolling to reduce branch overhead`
			`int i = 0;`
			`for (; i + 3 < take; i += 4) {`
			`fc->items[fc->top++] = arr[i];`
			`fc->items[fc->top++] = arr[i + 1];`
			`fc->items[fc->top++] = arr[i + 2];`
			`fc->items[fc->top++] = arr[i + 3];`
			`}`
			`for (; i < take; i++) {`
			`fc->items[fc->top++] = arr[i];`
			`}`
			`return take;`
			`}`

			`// ========= Tiny Guard (targeted debug; low overhead when disabled) =========`
			`static int g_tiny_guard_enabled = -1;`
			`static int g_tiny_guard_class = 2;`
			`static int g_tiny_guard_limit = 8;`
			`static __thread int g_tiny_guard_seen = 0;`

			`static inline int tiny_guard_enabled_runtime(void) {`
			`if (__builtin_expect(g_tiny_guard_enabled == -1, 0)) {`
Cleanup: Consolidate debug ENV vars to HAKMEM_DEBUG_LEVEL Integrated 4 new debug environment variables added during bug fixes into the existing unified HAKMEM_DEBUG_LEVEL system (expanded to 0-5 levels). Changes: 1. Expanded HAKMEM_DEBUG_LEVEL from 0-3 to 0-5 levels: - 0 = OFF (production) - 1 = ERROR (critical errors) - 2 = WARN (warnings) - 3 = INFO (allocation paths, header validation, stats) - 4 = DEBUG (guard instrumentation, failfast) - 5 = TRACE (verbose tracing) 2. Integrated 4 environment variables: - HAKMEM_ALLOC_PATH_TRACE → HAKMEM_DEBUG_LEVEL >= 3 (INFO) - HAKMEM_TINY_SLL_VALIDATE_HDR → HAKMEM_DEBUG_LEVEL >= 3 (INFO) - HAKMEM_TINY_REFILL_FAILFAST → HAKMEM_DEBUG_LEVEL >= 4 (DEBUG) - HAKMEM_TINY_GUARD → HAKMEM_DEBUG_LEVEL >= 4 (DEBUG) 3. Kept 2 special-purpose variables (fine-grained control): - HAKMEM_TINY_GUARD_CLASS (target class for guard) - HAKMEM_TINY_GUARD_MAX (max guard events) 4. Backward compatibility: - Legacy ENV vars still work via hak_debug_check_level() - New code uses unified system - No behavior changes for existing users Updated files: - core/hakmem_debug_master.h (level 0-5 expansion) - core/hakmem_tiny_superslab_internal.h (alloc path trace) - core/box/tls_sll_box.h (header validation) - core/tiny_failfast.c (failfast level) - core/tiny_refill_opt.h (failfast guard) - core/hakmem_tiny_ace_guard_box.inc (guard enable) - core/hakmem_tiny.c (include hakmem_debug_master.h) Impact: - Simpler debug control: HAKMEM_DEBUG_LEVEL=3 instead of 4 separate ENVs - Easier to discover/use - Consistent debug levels across codebase - Reduces ENV variable proliferation (43+ vars surveyed) Future work: - Consolidate remaining 39+ debug variables (documented in survey) - Gradual migration over 2-3 releases 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> 2025-11-29 06:57:03 +09:00			`// Enabled via HAKMEM_DEBUG_LEVEL >= 4 (DEBUG level)`
			`// Legacy: HAKMEM_TINY_GUARD=1 still works for compatibility`
			`g_tiny_guard_enabled = hak_debug_check_level("HAKMEM_TINY_GUARD", 4);`

			`// Special-purpose parameters (kept for targeted debugging)`
Refactor: Extract 5 Box modules from hakmem_tiny.c (-52% size reduction) Split hakmem_tiny.c (2081 lines) into focused modules for better maintainability. ## Changes hakmem_tiny.c: 2081 → 995 lines (-1086 lines, -52% reduction) ## Extracted Modules (5 boxes) 1. config_box (211 lines) - Size class tables, integrity counters - Debug flags, benchmark macros - HAK_RET_ALLOC/HAK_STAT_FREE instrumentation 2. publish_box (419 lines) - Publish/Adopt counters and statistics - Bench mailbox, partial ring - Live cap/Hot slot management - TLS helper functions (tiny_tls_default_) 3. globals_box* (256 lines) - Global variable declarations (~70 variables) - TinyPool instance and initialization flag - TLS variables (g_tls_lists, g_fast_head, g_fast_count) - SuperSlab configuration (partial ring, empty reserves) - Adopt gate functions 4. phase6_wrappers_box (122 lines) - Phase 6 Box Theory wrapper layer - hak_tiny_alloc_fast_wrapper() - hak_tiny_free_fast_wrapper() - Diagnostic instrumentation 5. ace_guard_box (100 lines) - ACE Learning Layer (hkm_ace_set_drain_threshold) - FastCache API (tiny_fc_room, tiny_fc_push_bulk) - Tiny Guard debugging system (5 functions) ## Benefits - Readability: Giant 2k file → focused 1k core + 5 coherent modules - Maintainability: Each box has clear responsibility and boundaries - Build: All modules compile successfully ✅ ## Technical Details - Phase 1: ChatGPT extracted config_box + publish_box (-625 lines) - Phase 2-4: Claude extracted globals_box + phase6_wrappers_box + ace_guard_box (-461 lines) - All extractions use .inc files (same translation unit, preserves static/TLS linkage) - Fixed Makefile: Added tiny_sizeclass_hist_box.o to OBJS_BASE and BENCH_HAKMEM_OBJS_BASE 🤖 Generated with [Claude Code](https://claude.com/claude-code) Co-Authored-By: Claude <noreply@anthropic.com> 2025-11-21 01:16:45 +09:00			`const char* ec = getenv("HAKMEM_TINY_GUARD_CLASS");`
			`if (ec && *ec) g_tiny_guard_class = atoi(ec);`
			`const char* el = getenv("HAKMEM_TINY_GUARD_MAX");`
			`if (el && *el) g_tiny_guard_limit = atoi(el);`
			`if (g_tiny_guard_limit <= 0) g_tiny_guard_limit = 8;`
			`}`
			`return g_tiny_guard_enabled;`
			`}`

			`int tiny_guard_is_enabled(void) { return tiny_guard_enabled_runtime(); }`

			`static void tiny_guard_dump_bytes(const char* tag, const uint8_t* p, size_t n) {`
			`fprintf(stderr, "[TGUARD] %s:", tag);`
			`for (size_t i = 0; i < n; i++) fprintf(stderr, " %02x", p[i]);`
			`fprintf(stderr, "\n");`
			`}`

			`void tiny_guard_on_alloc(int cls, void* base, void* user, size_t stride) {`
			`if (!tiny_guard_enabled_runtime() \|\| cls != g_tiny_guard_class) return;`
			`if (g_tiny_guard_seen++ >= g_tiny_guard_limit) return;`
			`uint8_t* b = (uint8_t*)base;`
			`fprintf(stderr, "[TGUARD] alloc cls=%d base=%p user=%p stride=%zu hdr=%02x\n",`
			`cls, base, user, stride, b[0]);`
			`// 隣接ヘッダ可視化（前後）`
			`tiny_guard_dump_bytes("around_base", b, (stride >= 8 ? 8 : stride));`
			`tiny_guard_dump_bytes("next_header", b + stride, 4);`
			`}`

			`void tiny_guard_on_invalid(void* user_ptr, uint8_t hdr) {`
			`if (!tiny_guard_enabled_runtime()) return;`
			`if (g_tiny_guard_seen++ >= g_tiny_guard_limit) return;`
			`uint8_t* u = (uint8_t*)user_ptr;`
			`fprintf(stderr, "[TGUARD] invalid header at user=%p hdr=%02x prev=%02x next=%02x\n",`
			`user_ptr, hdr, (u - 2), (u));`
			`tiny_guard_dump_bytes("dump_before", u - 8, 8);`
			`tiny_guard_dump_bytes("dump_after", u, 8);`
			`}`