2025-08-09 15:14:44 +09:00
|
|
|
|
/*!
|
|
|
|
|
|
* Nyash Parser - Rust Implementation
|
|
|
|
|
|
*
|
|
|
|
|
|
* Python版nyashc_v4.pyのNyashParserをRustで完全再実装
|
|
|
|
|
|
* Token列をAST (Abstract Syntax Tree) に変換
|
|
|
|
|
|
*
|
2025-08-16 12:26:17 +09:00
|
|
|
|
* モジュール構造:
|
|
|
|
|
|
* - common.rs: 共通ユーティリティとトレイト (ParserUtils)
|
2025-08-09 15:14:44 +09:00
|
|
|
|
* - expressions.rs: 式パーサー (parse_expression, parse_or, parse_and等)
|
|
|
|
|
|
* - statements.rs: 文パーサー (parse_statement, parse_if, parse_loop等)
|
2025-08-16 12:26:17 +09:00
|
|
|
|
* - declarations/: Box宣言パーサー (box_definition, static_box, dependency_helpers)
|
|
|
|
|
|
* - items/: トップレベル宣言 (global_vars, functions, static_items)
|
|
|
|
|
|
*
|
|
|
|
|
|
* 2025-08-16: 大規模リファクタリング完了
|
|
|
|
|
|
* - 1530行 → 227行 (85%削減)
|
|
|
|
|
|
* - 機能ごとにモジュール分離で保守性向上
|
2025-08-09 15:14:44 +09:00
|
|
|
|
*/
|
|
|
|
|
|
|
|
|
|
|
|
// サブモジュール宣言
|
2025-08-16 11:35:57 +09:00
|
|
|
|
mod common;
|
2025-08-09 15:14:44 +09:00
|
|
|
|
mod expressions;
|
|
|
|
|
|
mod statements;
|
2025-08-16 12:19:58 +09:00
|
|
|
|
mod declarations;
|
2025-08-16 12:24:23 +09:00
|
|
|
|
mod items;
|
2025-09-05 05:16:21 +09:00
|
|
|
|
pub mod sugar; // Phase 12.7-B: desugar pass (basic)
|
|
|
|
|
|
pub mod entry_sugar; // helper to parse with sugar level
|
|
|
|
|
|
pub mod sugar_gate; // thread-local gate for sugar parsing (tests/docs)
|
2025-08-09 15:14:44 +09:00
|
|
|
|
// mod errors;
|
|
|
|
|
|
|
2025-08-16 11:35:57 +09:00
|
|
|
|
use common::ParserUtils;
|
|
|
|
|
|
|
2025-08-09 15:14:44 +09:00
|
|
|
|
use crate::tokenizer::{Token, TokenType, TokenizeError};
|
|
|
|
|
|
use crate::ast::{ASTNode, Span};
|
|
|
|
|
|
use thiserror::Error;
|
|
|
|
|
|
|
2025-09-05 05:16:21 +09:00
|
|
|
|
#[inline]
|
|
|
|
|
|
fn is_sugar_enabled() -> bool { crate::parser::sugar_gate::is_enabled() }
|
|
|
|
|
|
|
2025-08-10 11:32:32 +09:00
|
|
|
|
// ===== 🔥 Debug Macros =====
|
|
|
|
|
|
|
|
|
|
|
|
/// Infinite loop detection macro - must be called in every loop that advances tokens
|
|
|
|
|
|
/// Prevents parser from hanging due to token consumption bugs
|
|
|
|
|
|
/// Uses parser's debug_fuel field for centralized fuel management
|
2025-08-16 11:35:57 +09:00
|
|
|
|
#[macro_export]
|
2025-08-10 11:32:32 +09:00
|
|
|
|
macro_rules! must_advance {
|
|
|
|
|
|
($parser:expr, $fuel:expr, $location:literal) => {
|
|
|
|
|
|
// デバッグ燃料がSomeの場合のみ制限チェック
|
|
|
|
|
|
if let Some(ref mut limit) = $parser.debug_fuel {
|
|
|
|
|
|
if *limit == 0 {
|
|
|
|
|
|
eprintln!("🚨 PARSER INFINITE LOOP DETECTED at {}", $location);
|
|
|
|
|
|
eprintln!("🔍 Current token: {:?} at line {}", $parser.current_token().token_type, $parser.current_token().line);
|
|
|
|
|
|
eprintln!("🔍 Parser position: {}/{}", $parser.current, $parser.tokens.len());
|
2025-08-16 11:35:57 +09:00
|
|
|
|
return Err($crate::parser::ParseError::InfiniteLoop {
|
2025-08-10 11:32:32 +09:00
|
|
|
|
location: $location.to_string(),
|
|
|
|
|
|
token: $parser.current_token().token_type.clone(),
|
|
|
|
|
|
line: $parser.current_token().line,
|
|
|
|
|
|
});
|
|
|
|
|
|
}
|
|
|
|
|
|
*limit -= 1;
|
|
|
|
|
|
}
|
|
|
|
|
|
// None の場合は無制限なのでチェックしない
|
|
|
|
|
|
};
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// Initialize debug fuel for loop monitoring
|
2025-08-16 11:35:57 +09:00
|
|
|
|
#[macro_export]
|
2025-08-10 11:32:32 +09:00
|
|
|
|
macro_rules! debug_fuel {
|
|
|
|
|
|
() => {
|
|
|
|
|
|
100_000 // Default: 100k iterations should be enough for any reasonable program
|
|
|
|
|
|
};
|
|
|
|
|
|
}
|
|
|
|
|
|
|
2025-08-09 15:14:44 +09:00
|
|
|
|
// Two-phase parser structures are no longer needed - simplified to direct parsing
|
|
|
|
|
|
|
|
|
|
|
|
/// パースエラー
|
|
|
|
|
|
#[derive(Error, Debug)]
|
|
|
|
|
|
pub enum ParseError {
|
|
|
|
|
|
#[error("Unexpected token {found:?}, expected {expected} at line {line}")]
|
|
|
|
|
|
UnexpectedToken { found: TokenType, expected: String, line: usize },
|
|
|
|
|
|
|
|
|
|
|
|
#[error("Unexpected end of file")]
|
|
|
|
|
|
UnexpectedEOF,
|
|
|
|
|
|
|
|
|
|
|
|
#[error("Invalid expression at line {line}")]
|
|
|
|
|
|
InvalidExpression { line: usize },
|
|
|
|
|
|
|
|
|
|
|
|
#[error("Invalid statement at line {line}")]
|
|
|
|
|
|
InvalidStatement { line: usize },
|
|
|
|
|
|
|
|
|
|
|
|
#[error("Circular dependency detected between static boxes: {cycle}")]
|
|
|
|
|
|
CircularDependency { cycle: String },
|
|
|
|
|
|
|
2025-08-10 11:32:32 +09:00
|
|
|
|
#[error("🚨 Infinite loop detected in parser at {location} - token: {token:?} at line {line}")]
|
|
|
|
|
|
InfiniteLoop { location: String, token: TokenType, line: usize },
|
|
|
|
|
|
|
2025-08-15 11:47:46 +00:00
|
|
|
|
#[error("🔥 Transparency system removed: {suggestion} at line {line}")]
|
|
|
|
|
|
TransparencySystemRemoved { suggestion: String, line: usize },
|
|
|
|
|
|
|
2025-08-16 01:12:10 +09:00
|
|
|
|
#[error("Unsupported namespace '{name}' at line {line}. Only 'nyashstd' is supported in Phase 0.")]
|
|
|
|
|
|
UnsupportedNamespace { name: String, line: usize },
|
|
|
|
|
|
|
|
|
|
|
|
#[error("Expected identifier at line {line}")]
|
|
|
|
|
|
ExpectedIdentifier { line: usize },
|
|
|
|
|
|
|
2025-08-09 15:14:44 +09:00
|
|
|
|
#[error("Tokenize error: {0}")]
|
|
|
|
|
|
TokenizeError(#[from] TokenizeError),
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// Nyashパーサー - トークン列をASTに変換
|
|
|
|
|
|
pub struct NyashParser {
|
2025-08-16 11:35:57 +09:00
|
|
|
|
pub(super) tokens: Vec<Token>,
|
|
|
|
|
|
pub(super) current: usize,
|
2025-08-09 15:14:44 +09:00
|
|
|
|
/// 🔥 Static box依存関係追跡(循環依存検出用)
|
2025-08-16 11:35:57 +09:00
|
|
|
|
pub(super) static_box_dependencies: std::collections::HashMap<String, std::collections::HashSet<String>>,
|
2025-08-10 11:32:32 +09:00
|
|
|
|
/// 🔥 デバッグ燃料:無限ループ検出用制限値 (None = 無制限)
|
2025-08-16 11:35:57 +09:00
|
|
|
|
pub(super) debug_fuel: Option<usize>,
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// Implement ParserUtils trait
|
|
|
|
|
|
impl ParserUtils for NyashParser {
|
|
|
|
|
|
fn tokens(&self) -> &Vec<Token> {
|
|
|
|
|
|
&self.tokens
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
fn current(&self) -> usize {
|
|
|
|
|
|
self.current
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
fn current_mut(&mut self) -> &mut usize {
|
|
|
|
|
|
&mut self.current
|
|
|
|
|
|
}
|
2025-08-09 15:14:44 +09:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
impl NyashParser {
|
|
|
|
|
|
/// 新しいパーサーを作成
|
|
|
|
|
|
pub fn new(tokens: Vec<Token>) -> Self {
|
|
|
|
|
|
Self {
|
|
|
|
|
|
tokens,
|
|
|
|
|
|
current: 0,
|
|
|
|
|
|
static_box_dependencies: std::collections::HashMap::new(),
|
2025-08-10 11:32:32 +09:00
|
|
|
|
debug_fuel: Some(100_000), // デフォルト値
|
2025-08-09 15:14:44 +09:00
|
|
|
|
}
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// 文字列からパース (トークナイズ + パース)
|
|
|
|
|
|
pub fn parse_from_string(input: impl Into<String>) -> Result<ASTNode, ParseError> {
|
2025-08-10 11:32:32 +09:00
|
|
|
|
Self::parse_from_string_with_fuel(input, Some(100_000))
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// 文字列からパース (デバッグ燃料指定版)
|
|
|
|
|
|
/// fuel: Some(n) = n回まで、None = 無制限
|
|
|
|
|
|
pub fn parse_from_string_with_fuel(input: impl Into<String>, fuel: Option<usize>) -> Result<ASTNode, ParseError> {
|
2025-08-09 15:14:44 +09:00
|
|
|
|
let mut tokenizer = crate::tokenizer::NyashTokenizer::new(input);
|
|
|
|
|
|
let tokens = tokenizer.tokenize()?;
|
|
|
|
|
|
|
|
|
|
|
|
let mut parser = Self::new(tokens);
|
2025-08-10 11:32:32 +09:00
|
|
|
|
parser.debug_fuel = fuel;
|
2025-08-10 07:54:03 +09:00
|
|
|
|
let result = parser.parse();
|
|
|
|
|
|
result
|
2025-08-09 15:14:44 +09:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
/// パース実行 - Program ASTを返す
|
|
|
|
|
|
pub fn parse(&mut self) -> Result<ASTNode, ParseError> {
|
|
|
|
|
|
self.parse_program()
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// ===== パース関数群 =====
|
|
|
|
|
|
|
|
|
|
|
|
/// プログラム全体をパース
|
|
|
|
|
|
fn parse_program(&mut self) -> Result<ASTNode, ParseError> {
|
|
|
|
|
|
let mut statements = Vec::new();
|
2025-08-16 17:39:04 +09:00
|
|
|
|
let mut _statement_count = 0;
|
2025-08-09 15:14:44 +09:00
|
|
|
|
|
|
|
|
|
|
while !self.is_at_end() {
|
2025-08-10 07:54:03 +09:00
|
|
|
|
|
2025-08-09 15:14:44 +09:00
|
|
|
|
// EOF tokenはスキップ
|
|
|
|
|
|
if matches!(self.current_token().token_type, TokenType::EOF) {
|
|
|
|
|
|
break;
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
// NEWLINE tokenはスキップ(文の区切りとして使用)
|
|
|
|
|
|
if matches!(self.current_token().token_type, TokenType::NEWLINE) {
|
|
|
|
|
|
self.advance();
|
|
|
|
|
|
continue;
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
let statement = self.parse_statement()?;
|
|
|
|
|
|
statements.push(statement);
|
2025-08-16 17:39:04 +09:00
|
|
|
|
_statement_count += 1;
|
2025-08-09 15:14:44 +09:00
|
|
|
|
}
|
|
|
|
|
|
|
2025-08-10 07:54:03 +09:00
|
|
|
|
|
2025-08-09 15:14:44 +09:00
|
|
|
|
// 🔥 すべてのstatic box解析後に循環依存検出
|
|
|
|
|
|
self.check_circular_dependencies()?;
|
|
|
|
|
|
|
|
|
|
|
|
Ok(ASTNode::Program { statements, span: Span::unknown() })
|
|
|
|
|
|
}
|
|
|
|
|
|
// Statement parsing methods are now in statements.rs module
|
|
|
|
|
|
|
2025-08-16 12:19:58 +09:00
|
|
|
|
/// 代入文または関数呼び出しをパース
|
|
|
|
|
|
fn parse_assignment_or_function_call(&mut self) -> Result<ASTNode, ParseError> {
|
2025-08-09 15:14:44 +09:00
|
|
|
|
|
2025-08-16 12:19:58 +09:00
|
|
|
|
// まず左辺を式としてパース
|
|
|
|
|
|
let expr = self.parse_expression()?;
|
2025-08-09 15:14:44 +09:00
|
|
|
|
|
2025-09-05 05:16:21 +09:00
|
|
|
|
// 次のトークンが = または 複合代入演算子 なら代入文
|
2025-08-16 12:19:58 +09:00
|
|
|
|
if self.match_token(&TokenType::ASSIGN) {
|
|
|
|
|
|
self.advance(); // consume '='
|
|
|
|
|
|
let value = Box::new(self.parse_expression()?);
|
2025-08-12 08:29:25 +00:00
|
|
|
|
|
2025-08-16 12:19:58 +09:00
|
|
|
|
// 左辺が代入可能な形式かチェック
|
|
|
|
|
|
match &expr {
|
|
|
|
|
|
ASTNode::Variable { .. } |
|
|
|
|
|
|
ASTNode::FieldAccess { .. } => {
|
|
|
|
|
|
Ok(ASTNode::Assignment {
|
|
|
|
|
|
target: Box::new(expr),
|
|
|
|
|
|
value,
|
|
|
|
|
|
span: Span::unknown(),
|
|
|
|
|
|
})
|
2025-08-12 08:29:25 +00:00
|
|
|
|
}
|
2025-08-16 12:19:58 +09:00
|
|
|
|
_ => {
|
2025-08-09 15:14:44 +09:00
|
|
|
|
let line = self.current_token().line;
|
2025-08-16 12:19:58 +09:00
|
|
|
|
Err(ParseError::InvalidStatement { line })
|
2025-08-09 15:14:44 +09:00
|
|
|
|
}
|
|
|
|
|
|
}
|
2025-09-05 05:16:21 +09:00
|
|
|
|
} else if self.match_token(&TokenType::PLUS_ASSIGN) ||
|
|
|
|
|
|
self.match_token(&TokenType::MINUS_ASSIGN) ||
|
|
|
|
|
|
self.match_token(&TokenType::MUL_ASSIGN) ||
|
|
|
|
|
|
self.match_token(&TokenType::DIV_ASSIGN) {
|
|
|
|
|
|
if !is_sugar_enabled() {
|
|
|
|
|
|
let line = self.current_token().line;
|
|
|
|
|
|
return Err(ParseError::UnexpectedToken {
|
|
|
|
|
|
found: self.current_token().token_type.clone(),
|
|
|
|
|
|
expected: "enable NYASH_SYNTAX_SUGAR_LEVEL=basic|full for '+=' and friends".to_string(),
|
|
|
|
|
|
line,
|
|
|
|
|
|
});
|
|
|
|
|
|
}
|
|
|
|
|
|
// determine operator
|
|
|
|
|
|
let op = match &self.current_token().token_type {
|
|
|
|
|
|
TokenType::PLUS_ASSIGN => crate::ast::BinaryOperator::Add,
|
|
|
|
|
|
TokenType::MINUS_ASSIGN => crate::ast::BinaryOperator::Subtract,
|
|
|
|
|
|
TokenType::MUL_ASSIGN => crate::ast::BinaryOperator::Multiply,
|
|
|
|
|
|
TokenType::DIV_ASSIGN => crate::ast::BinaryOperator::Divide,
|
|
|
|
|
|
_ => unreachable!(),
|
|
|
|
|
|
};
|
|
|
|
|
|
self.advance(); // consume 'op='
|
|
|
|
|
|
let rhs = self.parse_expression()?;
|
|
|
|
|
|
// 左辺が代入可能な形式かチェック
|
|
|
|
|
|
match &expr {
|
|
|
|
|
|
ASTNode::Variable { .. } | ASTNode::FieldAccess { .. } => {
|
|
|
|
|
|
let left_clone = expr.clone();
|
|
|
|
|
|
let value = ASTNode::BinaryOp { operator: op, left: Box::new(left_clone), right: Box::new(rhs), span: Span::unknown() };
|
|
|
|
|
|
Ok(ASTNode::Assignment { target: Box::new(expr), value: Box::new(value), span: Span::unknown() })
|
|
|
|
|
|
}
|
|
|
|
|
|
_ => {
|
|
|
|
|
|
let line = self.current_token().line;
|
|
|
|
|
|
Err(ParseError::InvalidStatement { line })
|
|
|
|
|
|
}
|
|
|
|
|
|
}
|
2025-08-09 15:14:44 +09:00
|
|
|
|
} else {
|
2025-08-16 12:19:58 +09:00
|
|
|
|
// 代入文でなければ式文として返す
|
|
|
|
|
|
Ok(expr)
|
2025-08-11 10:14:47 +09:00
|
|
|
|
}
|
2025-08-09 15:14:44 +09:00
|
|
|
|
}
|
|
|
|
|
|
|
2025-08-16 12:19:58 +09:00
|
|
|
|
// Expression parsing methods are now in expressions.rs module
|
|
|
|
|
|
// Utility methods are now in common.rs module via ParserUtils trait
|
2025-08-16 12:24:23 +09:00
|
|
|
|
// Item parsing methods are now in items.rs module
|
2025-08-09 15:14:44 +09:00
|
|
|
|
|
2025-08-16 12:19:58 +09:00
|
|
|
|
// ===== 🔥 Static Box循環依存検出 =====
|
2025-08-11 10:14:47 +09:00
|
|
|
|
}
|