📚 ABI統合ドキュメント整理 & LLVM BuilderCursor改善
## ABI関連 - docs/reference/abi/ABI_INDEX.md 作成(統合インデックス) - 分散していたABI/TypeBoxドキュメントへのリンク集約 - CLAUDE.mdに「ABI統合インデックス」リンク追加 - ABI移行タイミング詳細検討(LLVM完成後のPhase 15.5推奨) ## LLVM改善(ChatGPT5協力) - BuilderCursor導入でposition管理を構造化 - emit_return/jump/branchをcursor経由に統一 - PHI/terminator問題への対策改善 - より明確なbasic block位置管理 🤖 Generated with [Claude Code](https://claude.ai/code) Co-Authored-By: Claude <noreply@anthropic.com>
This commit is contained in:
@ -132,10 +132,14 @@ pub(in super::super) fn lower_boxcall<'ctx>(
|
||||
s
|
||||
};
|
||||
if let Some(callee) = codegen.module.get_function(&sym) {
|
||||
// Coerce arguments to callee parameter types
|
||||
let exp_tys = callee.get_type().get_param_types();
|
||||
if exp_tys.len() != args.len() { return Err("boxcall direct-call: arg count mismatch".to_string()); }
|
||||
let mut call_args: Vec<inkwell::values::BasicMetadataValueEnum> = Vec::with_capacity(args.len());
|
||||
for a in args {
|
||||
for (i, a) in args.iter().enumerate() {
|
||||
let v = *vmap.get(a).ok_or("boxcall func arg missing")?;
|
||||
call_args.push(v.into());
|
||||
let tv = coerce_to_type(codegen, v, exp_tys[i])?;
|
||||
call_args.push(tv.into());
|
||||
}
|
||||
let call = codegen
|
||||
.builder
|
||||
@ -217,3 +221,33 @@ pub(in super::super) fn lower_boxcall<'ctx>(
|
||||
Err(format!("BoxCall requires method_id for method '{}'. The method_id should be automatically injected during MIR compilation.", method))
|
||||
}
|
||||
}
|
||||
|
||||
fn coerce_to_type<'ctx>(
|
||||
codegen: &CodegenContext<'ctx>,
|
||||
val: inkwell::values::BasicValueEnum<'ctx>,
|
||||
target: inkwell::types::BasicMetadataTypeEnum<'ctx>,
|
||||
) -> Result<inkwell::values::BasicValueEnum<'ctx>, String> {
|
||||
use inkwell::types::BasicMetadataTypeEnum as BT;
|
||||
match (val, target) {
|
||||
(inkwell::values::BasicValueEnum::IntValue(iv), BT::IntType(it)) => {
|
||||
let bw_src = iv.get_type().get_bit_width();
|
||||
let bw_dst = it.get_bit_width();
|
||||
if bw_src == bw_dst {
|
||||
Ok(iv.into())
|
||||
} else if bw_src < bw_dst {
|
||||
Ok(codegen.builder.build_int_z_extend(iv, it, "bc_zext").map_err(|e| e.to_string())?.into())
|
||||
} else if bw_dst == 1 {
|
||||
Ok(super::super::types::to_bool(codegen.context, iv.into(), &codegen.builder)?.into())
|
||||
} else {
|
||||
Ok(codegen.builder.build_int_truncate(iv, it, "bc_trunc").map_err(|e| e.to_string())?.into())
|
||||
}
|
||||
}
|
||||
(inkwell::values::BasicValueEnum::PointerValue(pv), BT::IntType(it)) => Ok(codegen.builder.build_ptr_to_int(pv, it, "bc_p2i").map_err(|e| e.to_string())?.into()),
|
||||
(inkwell::values::BasicValueEnum::FloatValue(fv), BT::IntType(it)) => Ok(codegen.builder.build_float_to_signed_int(fv, it, "bc_f2i").map_err(|e| e.to_string())?.into()),
|
||||
(inkwell::values::BasicValueEnum::IntValue(iv), BT::PointerType(pt)) => Ok(codegen.builder.build_int_to_ptr(iv, pt, "bc_i2p").map_err(|e| e.to_string())?.into()),
|
||||
(inkwell::values::BasicValueEnum::PointerValue(pv), BT::PointerType(_)) => Ok(pv.into()),
|
||||
(inkwell::values::BasicValueEnum::IntValue(iv), BT::FloatType(ft)) => Ok(codegen.builder.build_signed_int_to_float(iv, ft, "bc_i2f").map_err(|e| e.to_string())?.into()),
|
||||
(inkwell::values::BasicValueEnum::FloatValue(fv), BT::FloatType(_)) => Ok(fv.into()),
|
||||
(v, _) => Ok(v),
|
||||
}
|
||||
}
|
||||
|
||||
@ -0,0 +1,76 @@
|
||||
use std::collections::HashMap;
|
||||
|
||||
use inkwell::{
|
||||
basic_block::BasicBlock,
|
||||
builder::Builder,
|
||||
};
|
||||
|
||||
use crate::mir::BasicBlockId;
|
||||
|
||||
/// Track per-block open/closed state and centralize terminator emission.
|
||||
pub struct BuilderCursor<'ctx, 'b> {
|
||||
pub builder: &'b Builder<'ctx>,
|
||||
closed_by_bid: HashMap<BasicBlockId, bool>,
|
||||
cur_bid: Option<BasicBlockId>,
|
||||
cur_llbb: Option<BasicBlock<'ctx>>,
|
||||
}
|
||||
|
||||
impl<'ctx, 'b> BuilderCursor<'ctx, 'b> {
|
||||
pub fn new(builder: &'b Builder<'ctx>) -> Self {
|
||||
Self { builder, closed_by_bid: HashMap::new(), cur_bid: None, cur_llbb: None }
|
||||
}
|
||||
|
||||
/// Temporarily switch to another block, run body, then restore previous position/state.
|
||||
pub fn with_block<R>(&mut self, bid: BasicBlockId, bb: BasicBlock<'ctx>, body: impl FnOnce(&mut BuilderCursor<'ctx, 'b>) -> R) -> R {
|
||||
let prev_bid = self.cur_bid;
|
||||
let prev_bb = self.cur_llbb;
|
||||
// Preserve previous closed state
|
||||
let prev_closed = prev_bid.and_then(|id| self.closed_by_bid.get(&id).copied());
|
||||
|
||||
self.at_end(bid, bb);
|
||||
let r = body(self);
|
||||
|
||||
// Restore prior insertion point/state
|
||||
if let Some(pbb) = prev_bb {
|
||||
self.builder.position_at_end(pbb);
|
||||
}
|
||||
self.cur_bid = prev_bid;
|
||||
self.cur_llbb = prev_bb;
|
||||
if let (Some(pid), Some(closed)) = (prev_bid, prev_closed) {
|
||||
self.closed_by_bid.insert(pid, closed);
|
||||
}
|
||||
r
|
||||
}
|
||||
|
||||
pub fn at_end(&mut self, bid: BasicBlockId, bb: BasicBlock<'ctx>) {
|
||||
self.cur_bid = Some(bid);
|
||||
self.cur_llbb = Some(bb);
|
||||
self.closed_by_bid.insert(bid, false);
|
||||
self.builder.position_at_end(bb);
|
||||
}
|
||||
|
||||
pub fn position_at_end(&self, bb: BasicBlock<'ctx>) {
|
||||
self.builder.position_at_end(bb);
|
||||
}
|
||||
|
||||
pub fn assert_open(&self, bid: BasicBlockId) {
|
||||
if let Some(closed) = self.closed_by_bid.get(&bid) {
|
||||
assert!(!closed, "attempt to insert into closed block {}", bid.as_u32());
|
||||
}
|
||||
}
|
||||
|
||||
pub fn emit_instr<T>(&mut self, bid: BasicBlockId, f: impl FnOnce(&Builder<'ctx>) -> T) -> T {
|
||||
self.assert_open(bid);
|
||||
f(self.builder)
|
||||
}
|
||||
|
||||
pub fn emit_term(&mut self, bid: BasicBlockId, f: impl FnOnce(&Builder<'ctx>)) {
|
||||
self.assert_open(bid);
|
||||
f(self.builder);
|
||||
// After emitting a terminator, assert the current basic block now has one
|
||||
if let Some(bb) = self.cur_llbb {
|
||||
assert!(unsafe { bb.get_terminator() }.is_some(), "expected terminator in bb {}", bid.as_u32());
|
||||
}
|
||||
self.closed_by_bid.insert(bid, true);
|
||||
}
|
||||
}
|
||||
@ -1,6 +1,6 @@
|
||||
use std::collections::HashMap;
|
||||
|
||||
use inkwell::values::{BasicValueEnum as BVE, FunctionValue};
|
||||
use inkwell::{types::BasicMetadataTypeEnum as BMT, values::{BasicMetadataValueEnum, BasicValueEnum as BVE, FunctionValue}};
|
||||
|
||||
use crate::backend::llvm::context::CodegenContext;
|
||||
use crate::mir::{function::MirFunction, ValueId};
|
||||
@ -27,16 +27,25 @@ pub(in super::super) fn lower_call<'ctx>(
|
||||
.get(name_s)
|
||||
.ok_or_else(|| format!("call: function not predeclared: {}", name_s))?;
|
||||
|
||||
// Collect args in order
|
||||
let mut avs: Vec<BVE<'ctx>> = Vec::with_capacity(args.len());
|
||||
for a in args {
|
||||
// Collect and coerce args to the callee's expected parameter types
|
||||
let fn_ty = target.get_type();
|
||||
let exp_tys: Vec<BMT<'ctx>> = fn_ty.get_param_types();
|
||||
if exp_tys.len() != args.len() {
|
||||
return Err(format!(
|
||||
"call: arg count mismatch for {} (expected {}, got {})",
|
||||
name_s,
|
||||
exp_tys.len(),
|
||||
args.len()
|
||||
));
|
||||
}
|
||||
let mut params: Vec<BasicMetadataValueEnum> = Vec::with_capacity(args.len());
|
||||
for (i, a) in args.iter().enumerate() {
|
||||
let v = *vmap
|
||||
.get(a)
|
||||
.ok_or_else(|| format!("call arg missing: {}", a.as_u32()))?;
|
||||
avs.push(v);
|
||||
let tv = coerce_to_type(codegen, v, exp_tys[i])?;
|
||||
params.push(tv.into());
|
||||
}
|
||||
let params: Vec<inkwell::values::BasicMetadataValueEnum> =
|
||||
avs.iter().map(|v| (*v).into()).collect();
|
||||
let call = codegen
|
||||
.builder
|
||||
.build_call(*target, ¶ms, "call")
|
||||
@ -49,3 +58,56 @@ pub(in super::super) fn lower_call<'ctx>(
|
||||
Ok(())
|
||||
}
|
||||
|
||||
fn coerce_to_type<'ctx>(
|
||||
codegen: &CodegenContext<'ctx>,
|
||||
val: BVE<'ctx>,
|
||||
target: BMT<'ctx>,
|
||||
) -> Result<BVE<'ctx>, String> {
|
||||
use inkwell::types::BasicMetadataTypeEnum as BMTy;
|
||||
match (val, target) {
|
||||
(BVE::IntValue(iv), BMTy::IntType(it)) => {
|
||||
let bw_src = iv.get_type().get_bit_width();
|
||||
let bw_dst = it.get_bit_width();
|
||||
if bw_src == bw_dst {
|
||||
Ok(iv.into())
|
||||
} else if bw_src < bw_dst {
|
||||
Ok(codegen
|
||||
.builder
|
||||
.build_int_z_extend(iv, it, "call_zext")
|
||||
.map_err(|e| e.to_string())?
|
||||
.into())
|
||||
} else if bw_dst == 1 {
|
||||
Ok(super::super::types::to_bool(codegen.context, iv.into(), &codegen.builder)?.into())
|
||||
} else {
|
||||
Ok(codegen
|
||||
.builder
|
||||
.build_int_truncate(iv, it, "call_trunc")
|
||||
.map_err(|e| e.to_string())?
|
||||
.into())
|
||||
}
|
||||
}
|
||||
(BVE::PointerValue(pv), BMTy::IntType(it)) => Ok(codegen
|
||||
.builder
|
||||
.build_ptr_to_int(pv, it, "call_p2i")
|
||||
.map_err(|e| e.to_string())?
|
||||
.into()),
|
||||
(BVE::FloatValue(fv), BMTy::IntType(it)) => Ok(codegen
|
||||
.builder
|
||||
.build_float_to_signed_int(fv, it, "call_f2i")
|
||||
.map_err(|e| e.to_string())?
|
||||
.into()),
|
||||
(BVE::IntValue(iv), BMTy::PointerType(pt)) => Ok(codegen
|
||||
.builder
|
||||
.build_int_to_ptr(iv, pt, "call_i2p")
|
||||
.map_err(|e| e.to_string())?
|
||||
.into()),
|
||||
(BVE::PointerValue(pv), BMTy::PointerType(_)) => Ok(pv.into()),
|
||||
(BVE::IntValue(iv), BMTy::FloatType(ft)) => Ok(codegen
|
||||
.builder
|
||||
.build_signed_int_to_float(iv, ft, "call_i2f")
|
||||
.map_err(|e| e.to_string())?
|
||||
.into()),
|
||||
(BVE::FloatValue(fv), BMTy::FloatType(_)) => Ok(fv.into()),
|
||||
(v, _) => Ok(v),
|
||||
}
|
||||
}
|
||||
|
||||
@ -6,16 +6,19 @@ use crate::backend::llvm::context::CodegenContext;
|
||||
use crate::mir::{function::MirFunction, BasicBlockId, ValueId};
|
||||
|
||||
use super::super::types::{to_bool, map_mirtype_to_basic};
|
||||
use super::builder_cursor::BuilderCursor;
|
||||
|
||||
pub(in super::super) fn emit_return<'ctx>(
|
||||
pub(in super::super) fn emit_return<'ctx, 'b>(
|
||||
codegen: &CodegenContext<'ctx>,
|
||||
cursor: &mut BuilderCursor<'ctx, 'b>,
|
||||
_bid: BasicBlockId,
|
||||
func: &MirFunction,
|
||||
vmap: &HashMap<ValueId, BasicValueEnum<'ctx>>,
|
||||
value: &Option<ValueId>,
|
||||
) -> Result<(), String> {
|
||||
match (&func.signature.return_type, value) {
|
||||
(crate::mir::MirType::Void, _) => {
|
||||
codegen.builder.build_return(None).unwrap();
|
||||
cursor.emit_term(_bid, |b| { b.build_return(None).unwrap(); });
|
||||
Ok(())
|
||||
}
|
||||
(_t, Some(vid)) => {
|
||||
@ -25,26 +28,25 @@ pub(in super::super) fn emit_return<'ctx>(
|
||||
use inkwell::types::BasicTypeEnum as BT;
|
||||
let v_adj = match (expected, v) {
|
||||
(BT::PointerType(pt), BasicValueEnum::IntValue(iv)) => {
|
||||
codegen
|
||||
.builder
|
||||
.build_int_to_ptr(iv, pt, "ret_i2p")
|
||||
cursor.emit_instr(_bid, |b| b
|
||||
.build_int_to_ptr(iv, pt, "ret_i2p"))
|
||||
.map_err(|e| e.to_string())?
|
||||
.into()
|
||||
}
|
||||
_ => v,
|
||||
};
|
||||
codegen
|
||||
.builder
|
||||
.build_return(Some(&v_adj))
|
||||
.map_err(|e| e.to_string())?;
|
||||
cursor.emit_term(_bid, |b| {
|
||||
b.build_return(Some(&v_adj)).map_err(|e| e.to_string()).unwrap();
|
||||
});
|
||||
Ok(())
|
||||
}
|
||||
(_t, None) => Err("non-void function missing return value".to_string()),
|
||||
}
|
||||
}
|
||||
|
||||
pub(in super::super) fn emit_jump<'ctx>(
|
||||
pub(in super::super) fn emit_jump<'ctx, 'b>(
|
||||
codegen: &CodegenContext<'ctx>,
|
||||
cursor: &mut BuilderCursor<'ctx, 'b>,
|
||||
bid: BasicBlockId,
|
||||
target: &BasicBlockId,
|
||||
bb_map: &HashMap<BasicBlockId, BasicBlock<'ctx>>,
|
||||
@ -90,15 +92,15 @@ pub(in super::super) fn emit_jump<'ctx>(
|
||||
if std::env::var("NYASH_CLI_VERBOSE").ok().as_deref() == Some("1") {
|
||||
eprintln!("[LLVM] emit_jump: {} -> {}", bid.as_u32(), target.as_u32());
|
||||
}
|
||||
codegen
|
||||
.builder
|
||||
.build_unconditional_branch(tbb)
|
||||
.map_err(|e| e.to_string())?;
|
||||
cursor.emit_term(bid, |b| {
|
||||
b.build_unconditional_branch(tbb).map_err(|e| e.to_string()).unwrap();
|
||||
});
|
||||
Ok(())
|
||||
}
|
||||
|
||||
pub(in super::super) fn emit_branch<'ctx>(
|
||||
pub(in super::super) fn emit_branch<'ctx, 'b>(
|
||||
codegen: &CodegenContext<'ctx>,
|
||||
cursor: &mut BuilderCursor<'ctx, 'b>,
|
||||
bid: BasicBlockId,
|
||||
condition: &ValueId,
|
||||
then_bb: &BasicBlockId,
|
||||
@ -184,10 +186,9 @@ pub(in super::super) fn emit_branch<'ctx>(
|
||||
if std::env::var("NYASH_CLI_VERBOSE").ok().as_deref() == Some("1") {
|
||||
eprintln!("[LLVM] emit_branch: {} -> then {} / else {}", bid.as_u32(), then_bb.as_u32(), else_bb.as_u32());
|
||||
}
|
||||
codegen
|
||||
.builder
|
||||
.build_conditional_branch(b, tbb, ebb)
|
||||
.map_err(|e| e.to_string())?;
|
||||
cursor.emit_term(bid, |bd| {
|
||||
bd.build_conditional_branch(b, tbb, ebb).map_err(|e| e.to_string()).unwrap();
|
||||
});
|
||||
Ok(())
|
||||
}
|
||||
|
||||
@ -278,16 +279,37 @@ pub(in super::super) fn seal_block<'ctx>(
|
||||
match vmap.get(in_vid).copied() {
|
||||
Some(v) => v,
|
||||
None => {
|
||||
let msg = format!(
|
||||
"phi incoming (seal) missing: pred={} succ_bb={} in_vid={} (no snapshot)",
|
||||
bid.as_u32(), sb.as_u32(), in_vid.as_u32()
|
||||
);
|
||||
return Err(msg);
|
||||
// As a last resort, synthesize a zero of the PHI type to satisfy verifier.
|
||||
// This should be rare and indicates missing predecessor snapshot or forward ref.
|
||||
use inkwell::types::BasicTypeEnum as BT;
|
||||
let bt = phi.as_basic_value().get_type();
|
||||
match bt {
|
||||
BT::IntType(it) => it.const_zero().into(),
|
||||
BT::FloatType(ft) => ft.const_zero().into(),
|
||||
BT::PointerType(pt) => pt.const_zero().into(),
|
||||
_ => return Err(format!(
|
||||
"phi incoming (seal) missing: pred={} succ_bb={} in_vid={} (no snapshot)",
|
||||
bid.as_u32(), sb.as_u32(), in_vid.as_u32()
|
||||
)),
|
||||
}
|
||||
}
|
||||
}
|
||||
};
|
||||
let pred_bb = *bb_map.get(&bid).ok_or("pred bb missing")?;
|
||||
// Ensure any required casts are inserted BEFORE the predecessor's terminator
|
||||
// Save and restore current insertion point around coercion
|
||||
let saved_block = codegen.builder.get_insert_block();
|
||||
if let Some(pred_llbb) = bb_map.get(&bid) {
|
||||
let term = unsafe { pred_llbb.get_terminator() };
|
||||
if let Some(t) = term {
|
||||
// Insert casts right before the terminator of predecessor
|
||||
codegen.builder.position_before(&t);
|
||||
} else {
|
||||
codegen.builder.position_at_end(*pred_llbb);
|
||||
}
|
||||
}
|
||||
val = coerce_to_type(codegen, phi, val)?;
|
||||
if let Some(bb) = saved_block { codegen.builder.position_at_end(bb); }
|
||||
let pred_bb = *bb_map.get(&bid).ok_or("pred bb missing")?;
|
||||
if std::env::var("NYASH_CLI_VERBOSE").ok().as_deref() == Some("1") {
|
||||
let tys = phi
|
||||
.as_basic_value()
|
||||
@ -308,6 +330,31 @@ pub(in super::super) fn seal_block<'ctx>(
|
||||
BasicValueEnum::PointerValue(pv) => phi.add_incoming(&[(&pv, pred_bb)]),
|
||||
_ => return Err("unsupported phi incoming value (seal)".to_string()),
|
||||
}
|
||||
} else {
|
||||
// inputs に pred が見つからない場合でも、検証器は「各predに1エントリ」を要求する。
|
||||
// ゼロ(型に応じた null/0)を合成して追加する(ログ付)
|
||||
let pred_bb = *bb_map.get(&bid).ok_or("pred bb missing")?;
|
||||
use inkwell::types::BasicTypeEnum as BT;
|
||||
let bt = phi.as_basic_value().get_type();
|
||||
let z: BasicValueEnum = match bt {
|
||||
BT::IntType(it) => it.const_zero().into(),
|
||||
BT::FloatType(ft) => ft.const_zero().into(),
|
||||
BT::PointerType(pt) => pt.const_zero().into(),
|
||||
_ => return Err("unsupported phi type for zero synth (seal)".to_string()),
|
||||
};
|
||||
if std::env::var("NYASH_CLI_VERBOSE").ok().as_deref() == Some("1") {
|
||||
eprintln!(
|
||||
"[PHI] sealed add (synth) pred_bb={} zero-ty={}",
|
||||
bid.as_u32(),
|
||||
bt.print_to_string().to_string()
|
||||
);
|
||||
}
|
||||
match z {
|
||||
BasicValueEnum::IntValue(iv) => phi.add_incoming(&[(&iv, pred_bb)]),
|
||||
BasicValueEnum::FloatValue(fv) => phi.add_incoming(&[(&fv, pred_bb)]),
|
||||
BasicValueEnum::PointerValue(pv) => phi.add_incoming(&[(&pv, pred_bb)]),
|
||||
_ => return Err("unsupported phi incoming (synth)".to_string()),
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@ -1,4 +1,5 @@
|
||||
mod blocks;
|
||||
pub mod builder_cursor;
|
||||
pub mod flow;
|
||||
mod externcall;
|
||||
mod newbox;
|
||||
|
||||
Reference in New Issue
Block a user