Canon/Canon.Core/Abstractions/IGrammarParser.cs

using Canon.Core.Enums;
using Canon.Core.GrammarParser;
using Canon.Core.LexicalParser;
using Canon.Core.SyntaxNodes;

namespace Canon.Core.Abstractions;

/// <summary>
/// Grammar parser abstraction. The implementing type supplies the initial state and the
/// start non-terminator; <see cref="Analyse"/> then drives a table-based shift/reduce loop
/// over them to build the syntax tree.
/// </summary>
public interface IGrammarParser
{
    /// <summary>
    /// State pushed onto the bottom of the analysis stack before any token is consumed.
    /// </summary>
    public ITransformer BeginTransformer { get; }

    /// <summary>
    /// Non-terminator whose reduction ends the analysis successfully.
    /// </summary>
    public NonTerminator Begin { get; }

    /// <summary>
    /// Analyses the given lexical token stream and builds the corresponding syntax tree.
    /// </summary>
    /// <param name="tokens">Input lexical token stream.</param>
    /// <returns>Root node of the syntax tree.</returns>
    /// <exception cref="ArgumentNullException"><paramref name="tokens"/> is <c>null</c>.</exception>
    /// <exception cref="InvalidOperationException">
    /// Grammar analysis failed: the token stream is empty, it ends before the start symbol is
    /// reduced, the current token allows neither a reduction nor a shift, or the state exposed
    /// after a reduction has no transition for the reduced non-terminator.
    /// </exception>
    public ProgramStruct Analyse(IEnumerable<SemanticToken> tokens)
    {
        ArgumentNullException.ThrowIfNull(tokens);

        // The bottom of the stack pairs the initial state with a placeholder node.
        Stack<AnalyseState> stack = [];
        stack.Push(new AnalyseState(BeginTransformer, SyntaxNodeBase.Create(SemanticToken.End)));

        using IEnumerator<SemanticToken> enumerator = tokens.GetEnumerator();
        if (!enumerator.MoveNext())
        {
            throw new InvalidOperationException("Input token list is empty");
        }

        while (true)
        {
            AnalyseState top = stack.Peek();
            SemanticToken current = enumerator.Current;

            // Reductions are attempted first.
            if (top.State.ReduceTable.TryGetValue(current, out ReduceInformation? information))
            {
                if (information.Left == Begin)
                {
                    // Reducing to the start symbol means the input is accepted:
                    // return the node on top of the stack instead of reducing further.
                    return top.Node.Convert<ProgramStruct>();
                }

                // Pop one stack entry per symbol on the right-hand side of the production.
                List<SyntaxNodeBase> children = [];
                for (int i = 0; i < information.Length; i++)
                {
                    children.Add(stack.Pop().Node);
                }

                // Entries come off the stack last-to-first; restore production order.
                children.Reverse();

                // The state uncovered by the pops decides where to go for the reduced
                // non-terminator. Use TryGetValue so a missing entry is reported as a
                // documented analysis error rather than a KeyNotFoundException.
                if (!stack.Peek().State.ShiftTable.TryGetValue(information.Left, out ITransformer? target))
                {
                    throw new InvalidOperationException("Failed to analyse input grammar");
                }

                stack.Push(new AnalyseState(target, SyntaxNodeBase.Create(information.Left.Type, children)));
                continue;
            }

            // No reduction applies, so try to shift the current token.
            if (!top.State.ShiftTable.TryGetValue(current, out ITransformer? next))
            {
                throw new InvalidOperationException("Failed to analyse input grammar");
            }

            stack.Push(new AnalyseState(next, SyntaxNodeBase.Create(current)));

            // Acceptance only happens through a reduction, so running out of tokens
            // right after a shift means the input ended too early.
            if (!enumerator.MoveNext())
            {
                throw new InvalidOperationException("Run out of token but not accept");
            }
        }
    }

    /// <summary>
    /// One entry of the analysis stack: a parser state and the syntax node pushed with it.
    /// </summary>
    private record AnalyseState(ITransformer State, SyntaxNodeBase Node);
}
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								using Canon.Core.Enums;
 								using Canon.Core.GrammarParser;
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								using Canon.Core.LexicalParser;
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								using Canon.Core.SyntaxNodes;
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
 								namespace Canon.Core.Abstractions;
 								/// <summary>
 								/// 语法分析器接口
 								/// </summary>
-												refact: 将编译中各个阶段接口化 (#35)

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/35

											
										
										
											2024-04-12 19:01:37 +08:00
+								public interface IGrammarParser
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								{
-												refact: 将编译中各个阶段接口化 (#35)

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/35

											
										
										
											2024-04-12 19:01:37 +08:00
+								    public ITransformer BeginTransformer { get; }
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
-												refact: 将编译中各个阶段接口化 (#35)

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/35

											
										
										
											2024-04-12 19:01:37 +08:00
+								    public NonTerminator Begin { get; }
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
-												refact: 将编译中各个阶段接口化 (#35)

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/35

											
										
										
											2024-04-12 19:01:37 +08:00
+								    /// <summary>
 								    /// 分析指定的词法记号流并构建对应的语法树
 								    /// </summary>
 								    /// <param name="tokens">输入的词法记号流</param>
 								    /// <returns>语法树的根节点</returns>
 								    /// <exception cref="InvalidOperationException">语法分析错误</exception>
 								    public ProgramStruct Analyse(IEnumerable<SemanticToken> tokens)
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								    {
 								        Stack<AnalyseState> stack = [];
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								        stack.Push(new AnalyseState(BeginTransformer, SyntaxNodeBase.Create(SemanticToken.End)));
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
 								        using IEnumerator<SemanticToken> enumerator = tokens.GetEnumerator();
 								        if (!enumerator.MoveNext())
 								        {
 								            throw new InvalidOperationException("Input token list is empty");
 								        }
 								        while (true)
 								        {
 								            AnalyseState top = stack.Peek();
 								            // 首先尝试进行归约
 								            if (top.State.ReduceTable.TryGetValue(enumerator.Current, out ReduceInformation? information))
 								            {
 								                if (information.Left == Begin)
 								                {
 								                    // 如果是归约到起始符
 								                    // 那么就直接返回不继续进行归约
-												refact: 将编译中各个阶段接口化 (#35)

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/35

											
										
										
											2024-04-12 19:01:37 +08:00
+								                    return top.Node.Convert<ProgramStruct>();
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								                }
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								                List<SyntaxNodeBase> children = [];
 								                NonTerminatorType leftType = information.Left.Type;
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								                for (int i = 0; i < information.Length; i++)
 								                {
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								                    children.Add(stack.Pop().Node);
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								                }
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								                // 为了符合生成式的顺序而倒序
 								                children.Reverse();
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								                stack.Push(new AnalyseState(stack.Peek().State.ShiftTable[information.Left],
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								                    SyntaxNodeBase.Create(leftType, children)));
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								                continue;
 								            }
 								            // 如果没有成功归约就进行移进
 								            if (top.State.ShiftTable.TryGetValue(enumerator.Current, out ITransformer? next))
 								            {
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								                stack.Push(new AnalyseState(next, SyntaxNodeBase.Create(enumerator.Current)));
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								                if (enumerator.MoveNext())
 								                {
 								                    continue;
 								                }
 								                else
 								                {
 								                    throw new InvalidOperationException("Run out of token but not accept");
 								                }
 								            }
 								            throw new InvalidOperationException("Failed to analyse input grammar");
 								        }
 								    }
-												refact: syntax-node (#23)

重构语法树的部分，使用单独的类来抽象不同的非终结符节点。
**同时**，将`Pascal`语法的定义从测试项目中移动到核心项目中，在项目中只维护一份对于`Pascal`语法的定义。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/23

											
										
										
											2024-04-07 16:47:28 +08:00
+								    private record AnalyseState(ITransformer State, SyntaxNodeBase Node);
-												feat: 添加语法分析基类抽象 (#8)

增加语法分析基类和状态转换接口抽象，为直接生成语法分析器做准备，同时也提前释放一些大对象，降低内存消耗。

Reviewed-on: https://git.rrricardo.top/PostGuard/Canon/pulls/8

											
										
										
											2024-03-13 16:41:44 +08:00
+								}