2025-11-08 00:46:34 +09:00
// tools/hako_parser/parser_core.hako — HakoParserCoreBox (token-based MVP)
2025-11-07 19:32:44 +09:00
using selfhost.shared.common.string_helpers as Str
2025-11-08 00:46:34 +09:00
using tools.hako_parser.tokenizer as HakoTokenizerBox
2025-11-07 19:32:44 +09:00
static box HakoParserCoreBox {
  // Parse .hako source text into a minimal AST map.
  //
  // The scan is a single tolerant pass over the token stream: any token that
  // does not start a recognised construct is skipped, and a malformed
  // construct is abandoned at the first unexpected token.
  //
  // Returned map:
  // {
  //   uses:     Array<String>  lexeme of the STRING token that follows `using`
  //   includes: Array<String>  line number (stringified) of the STRING token
  //                            that follows `include`
  //   boxes:    Array<{name, is_static, span_line,
  //                    methods: Array<{name, arity, span}>}>
  // }
  //
  // Notes:
  // - Only `STATIC BOX IDENT LBRACE ...` sequences are registered as boxes.
  // - Only members introduced by a METHOD token are recorded as methods.
  // - `span` is the line of the METHOD token; `span_line` is the line of the
  //   box name token (falling back to the STATIC token's line).
  // - `includes` stores the line, not the path.
  //   NOTE(review): presumably consumed by a lint that only needs the
  //   location; confirm against callers before changing.
  //
  // text: source string; null yields an AST with three empty arrays.
  parse(text) {
    local ast = new MapBox()
    ast.set("uses", new ArrayBox())
    ast.set("boxes", new ArrayBox())
    ast.set("includes", new ArrayBox())
    if text == null { return ast }

    local toks = HakoTokenizerBox.tokenize(text)
    // Defensive: without a token list there is nothing to scan.
    if toks == null { return ast }

    local p = 0
    local N = toks.size()

    while p < N {
      local t = me._peek(toks, p, N)

      // using "mod" (as Alias)?
      if me._eq(t, "USING") == 1 {
        p = me._advance(p, N)
        local t1 = me._peek(toks, p, N)
        if me._eq(t1, "STRING") == 1 {
          ast.get("uses").push(t1.get("lexeme"))
          p = me._advance(p, N)
          // Optional `as Alias`: consumed but not recorded.
          local t2 = me._peek(toks, p, N)
          if me._eq(t2, "AS") == 1 {
            p = me._advance(p, N)
            local t3 = me._peek(toks, p, N)
            if me._eq(t3, "IDENT") == 1 { p = me._advance(p, N) }
          }
        }
        // Malformed using (no STRING): the USING token is already consumed,
        // so the outer loop resumes at whatever followed it.
        continue
      }

      // include "path"
      if me._eq(t, "INCLUDE") == 1 {
        p = me._advance(p, N)
        local s = me._peek(toks, p, N)
        if me._eq(s, "STRING") == 1 {
          ast.get("includes").push(Str.int_to_str(s.get("line")))
          p = me._advance(p, N)
        }
        continue
      }

      // static box Name { methods }
      // STATIC BOX IDENT LBRACE ... RBRACE
      if me._eq(t, "STATIC") == 1 {
        local static_tok = t
        p = me._advance(p, N) // STATIC

        // Each early `continue` below leaves p just past the tokens that did
        // match, so the outer loop always makes progress.
        local tb = me._peek(toks, p, N)
        if me._eq(tb, "BOX") == 0 { continue }
        p = me._advance(p, N) // BOX

        local tn = me._peek(toks, p, N)
        if me._eq(tn, "IDENT") == 0 { continue }
        local box_name = tn.get("lexeme")
        local box_line = tn.get("line")
        if box_line == null { box_line = static_tok.get("line") }
        p = me._advance(p, N) // IDENT

        // expect '{'
        local tl = me._peek(toks, p, N)
        if me._eq(tl, "LBRACE") == 0 { continue }
        p = me._advance(p, N) // LBRACE

        // Register the box before scanning its body so that a truncated body
        // still leaves the box in the AST.
        local b = new MapBox()
        b.set("name", box_name)
        b.set("is_static", true)
        b.set("span_line", box_line)
        b.set("methods", new ArrayBox())
        ast.get("boxes").push(b)

        // Scan until the matching RBRACE, tracking brace depth only.
        // METHOD tokens are recognised at any depth inside the box.
        local depth = 1
        while p < N && depth > 0 {
          local tk = me._peek(toks, p, N)

          if me._eq(tk, "LBRACE") == 1 {
            depth = depth + 1
            p = me._advance(p, N)
            continue
          }

          if me._eq(tk, "RBRACE") == 1 {
            depth = depth - 1
            p = me._advance(p, N)
            if depth == 0 { break }
            continue
          }

          if me._eq(tk, "METHOD") == 1 {
            local mline = tk.get("line")
            p = me._advance(p, N) // METHOD

            local mid = me._peek(toks, p, N)
            if me._eq(mid, "IDENT") == 0 { continue }
            local mname = mid.get("lexeme")
            p = me._advance(p, N) // IDENT

            local lp = me._peek(toks, p, N)
            if me._eq(lp, "LPAREN") == 0 { continue }
            p = me._advance(p, N) // LPAREN

            // Count commas until RPAREN (no nesting inside params for MVP).
            local commas = 0
            local has_tokens = 0
            while p < N {
              local tt = me._peek(toks, p, N)
              if me._eq(tt, "RPAREN") == 1 {
                p = me._advance(p, N)
                break
              }
              if me._eq(tt, "COMMA") == 1 { commas = commas + 1 }
              // Every token before RPAREN (commas included) marks the
              // parameter list as non-empty.
              has_tokens = 1
              p = me._advance(p, N)
            }

            // arity = comma count + 1 when the list is non-empty, else 0
            local arity = commas
            if has_tokens == 1 { arity = arity + 1 }

            local m = new MapBox()
            m.set("name", mname)
            m.set("arity", arity)
            m.set("span", mline)
            b.get("methods").push(m)
            continue
          }

          // Any other token inside the box body is skipped.
          p = me._advance(p, N)
        }
        continue
      }

      // skip unhandled token
      p = me._advance(p, N)
    }

    return ast
  }

  // Token at idx, or null when idx is at or past the end (N = toks.size()).
  _peek(toks, idx, N) {
    if idx >= N { return null }
    return toks.get(idx)
  }

  // 1 when token t is non-null and its "type" equals kind, otherwise 0.
  _eq(t, kind) {
    if t == null { return 0 }
    if t.get("type") == kind { return 1 }
    return 0
  }

  // Next position after p, never moving once p has reached N.
  _advance(p, N) {
    if p < N { return p + 1 }
    return p
  }
}
// Entry-point box: main ignores its arguments and always returns 0.
static box HakoParserCoreMain {
  method main(args) {
    return 0
  }
}