Files
hakorune/src/llvm_py/instructions/newbox.py

110 lines
3.5 KiB
Python
Raw Normal View History

"""
NewBox instruction lowering
Handles box creation (new StringBox(), new IntegerBox(), etc.)
"""
import llvmlite.ir as ir
from typing import Dict, List, Optional
def lower_newbox(
    builder: ir.IRBuilder,
    module: ir.Module,
    box_type: str,
    args: List[int],
    dst_vid: int,
    vmap: Dict[int, ir.Value],
    resolver=None
) -> None:
    """
    Lower a MIR NewBox instruction.

    Creates a new box instance via the NyRT runtime shims and stores the
    resulting i64 handle into ``vmap[dst_vid]``.

    Args:
        builder: Current LLVM IR builder positioned at the insertion point
        module: LLVM module (functions/globals are declared here on demand)
        box_type: Box type name (e.g., "StringBox", "IntegerBox")
        args: Constructor argument value IDs.
            NOTE(review): currently unused — the variadic shim below is always
            called with argc=0 and zeroed slots; confirm whether constructor
            args should be forwarded from ``vmap``.
        dst_vid: Destination value ID that receives the box handle
        vmap: Value map (value ID -> LLVM value)
        resolver: Optional resolver for type handling (currently unused)
    """
    # Use NyRT shim: prefer birth_h for core boxes, otherwise env.box.new_i64x
    i64 = ir.IntType(64)
    i8p = ir.IntType(8).as_pointer()

    # Core fast paths: ArrayBox/MapBox have dedicated zero-argument birth shims.
    if box_type in ("ArrayBox", "MapBox"):
        birth_name = "nyash.array.birth_h" if box_type == "ArrayBox" else "nyash.map.birth_h"
        birth = next((f for f in module.functions if f.name == birth_name), None)
        if birth is None:
            # Declare on first use: () -> i64 handle
            birth = ir.Function(module, ir.FunctionType(i64, []), name=birth_name)
        vmap[dst_vid] = builder.call(birth, [], name=f"birth_{box_type}")
        return

    # Generic path — variadic shim:
    # nyash.env.box.new_i64x(type_name, argc, a1, a2, a3, a4) -> i64 handle
    new_i64x = next((f for f in module.functions if f.name == "nyash.env.box.new_i64x"), None)
    if new_i64x is None:
        new_i64x = ir.Function(
            module,
            ir.FunctionType(i64, [i8p, i64, i64, i64, i64, i64]),
            name="nyash.env.box.new_i64x",
        )

    # Build a NUL-terminated C-string global holding the type name.
    sbytes = (box_type + "\0").encode('utf-8')
    arr_ty = ir.ArrayType(ir.IntType(8), len(sbytes))

    # Name the global per enclosing function + dst_vid; fall back gracefully
    # if the builder has no parent function attached yet.
    try:
        fn = builder.block.parent
        fn_name = getattr(fn, 'name', 'fn')
    except Exception:
        fn_name = 'fn'
    base = f".box_ty_{fn_name}_{dst_vid}"

    # Ensure the global name is unique within the module.
    existing = {g.name for g in module.global_values}
    name = base
    n = 1
    while name in existing:
        name = f"{base}.{n}"
        n += 1

    g = ir.GlobalVariable(module, arr_ty, name=name)
    g.linkage = 'private'
    g.global_constant = True
    g.initializer = ir.Constant(arr_ty, bytearray(sbytes))

    # GEP to the first byte: i8* pointer to the type-name string.
    c0 = ir.Constant(ir.IntType(32), 0)
    ptr = builder.gep(g, [c0, c0], inbounds=True)

    zero = ir.Constant(i64, 0)
    handle = builder.call(new_i64x, [ptr, zero, zero, zero, zero, zero], name=f"new_{box_type}")
    vmap[dst_vid] = handle
def lower_newbox_generic(
    builder: ir.IRBuilder,
    module: ir.Module,
    dst_vid: int,
    vmap: Dict[int, ir.Value]
) -> None:
    """
    Create a generic box via runtime allocation.

    Used when the box type is not statically known: calls the runtime
    allocator ``ny_alloc_box`` with a fixed default size and records the
    returned handle in ``vmap[dst_vid]``.

    Args:
        builder: Current LLVM IR builder positioned at the insertion point
        module: LLVM module (the allocator is declared here if missing)
        dst_vid: Destination value ID that receives the box handle
        vmap: Value map (value ID -> LLVM value)
    """
    # Find an existing declaration of the generic allocator, if any.
    alloc_func = next(
        (f for f in module.functions if f.name == "ny_alloc_box"),
        None,
    )
    if alloc_func is None:
        # Declare ny_alloc_box(size: i64) -> i64 on first use.
        i64 = ir.IntType(64)
        alloc_func = ir.Function(
            module,
            ir.FunctionType(i64, [i64]),
            name="ny_alloc_box",
        )

    # Default box size (e.g., 64 bytes).
    default_size = ir.Constant(ir.IntType(64), 64)
    vmap[dst_vid] = builder.call(alloc_func, [default_size], name="new_box")