2021-10-30 01:57:19 +00:00
|
|
|
with ada.text_io;
|
|
|
|
|
|
|
|
package body H3.Compilers is
|
2021-10-31 16:03:11 +00:00
|
|
|
-- rune sequence used as the text of the token emitted at end of input
-- (see the TK_EOF handling in Feed_Char_Code).
LB_EOF: constant S.Rune_Array := (R.V.Left_Arrow,R.V.UC_E,R.V.UC_O,R.V.UC_F,R.V.Right_Arrow); -- <EOF>
|
|
|
|
|
2021-10-30 01:57:19 +00:00
|
|
|
-- switch the lexer to the given state.
-- the token buffer and the token id are left untouched.
procedure Set_Lexer_State (C: in out Compiler; State: in Lexer_State) is
begin
	C.Lx.State := State;
end Set_Lexer_State;
|
|
|
|
|
|
|
|
-- switch the lexer to the given state and restart the token buffer
-- so that it holds only the rune Ch.
procedure Set_Lexer_State (C: in out Compiler; State: in Lexer_State; Ch: in R.Rune) is
begin
	-- the state change itself is handled by the plain two-argument variant.
	Set_Lexer_State (C, State);

	-- drop whatever the previous token left behind, then seed the
	-- buffer with the first rune of the new token.
	C.Tk.Buf.Clear;
	C.Tk.Buf.Append (Ch);
end Set_Lexer_State;
|
|
|
|
|
|
|
|
-- same as the rune variant, but takes the first character as a code.
-- the code is converted with R.To_Rune before it is stored.
procedure Set_Lexer_State (C: in out Compiler; State: in Lexer_State; Code: in R.Code) is
begin
	Set_Lexer_State (C => C, State => State, Ch => R.To_Rune(Code));
end Set_Lexer_State;
|
|
|
|
|
|
|
|
-- handle a completed token held in C.Tk.
-- for now this only dumps the token id and the token text to the
-- standard output and then dispatches on the token id, where every
-- alternative is still a placeholder.
procedure Got_Token (C: in out Compiler) is
	-- highest position number that Standard.Character can represent.
	Max_Char_Pos: constant := Standard.Character'Pos(Standard.Character'Last);
begin
	--case C.P.State IS
	--	when START =>
	--		null;
	--end case;

	-- debug dump: "<token id> <token text>"
	ada.text_io.put (C.Tk.Id'Img);
	ada.text_io.put (" ");
	for i in C.Tk.Buf.Get_First_Index .. C.Tk.Buf.Get_Last_Index loop
		declare
			Pos: constant Natural := S.Rune'Pos(C.Tk.Buf.Get_Item(i));
		begin
			-- Character'Val raises Constraint_Error for a position beyond
			-- Character'Last. a rune outside that range is shown as '?'
			-- so that the dump never aborts the lexer.
			if Pos <= Max_Char_Pos then
				ada.text_io.put (standard.character'val(Pos));
			else
				ada.text_io.put ('?');
			end if;
		end;
	end loop;
	ada.text_io.put_line("");

	case C.Tk.Id is
		when TK_BSTR =>
			null;
		when TK_BYTE =>
			null;
		when TK_CHAR =>
			null;
		when TK_CSTR =>
			null;
		when TK_DIRECTIVE =>
			--Push_Feed_Layer (...
			null;
		when TK_EOF =>
			null;
		when TK_EOL =>
			null;
		when TK_GE =>
			null;
		when TK_GT =>
			null;
		when TK_IDENT =>
			null;
		when TK_LE =>
			null;
		when TK_LT =>
			null;
		when TK_SEMICOLON =>
			null;
	end case;
end Got_Token;
|
|
|
|
|
|
|
|
-- begin a new, empty token.
procedure Start_Token (C: in out Compiler) is
begin
	-- TK_EOF doubles as the "token id not set yet" marker here.
	C.Tk.Id := TK_EOF;

	-- TODO: store token location.

	-- discard the text of the previous token.
	C.Tk.Buf.Clear;
end Start_Token;
|
|
|
|
|
|
|
|
-- begin a new token whose text starts with the rune Ch.
procedure Start_Token (C: in out Compiler; Ch: in R.Rune) is
begin
	-- reset the token first, then store the first rune.
	Start_Token (C);
	C.Tk.Buf.Append (Ch);
end Start_Token;
|
|
|
|
|
|
|
|
-- begin a new token whose text starts with the given character code.
-- the code is converted with R.To_Rune before it is stored.
procedure Start_Token (C: in out Compiler; Code: in R.Code) is
begin
	Start_Token (C => C, Ch => R.To_Rune(Code));
end Start_Token;
|
|
|
|
|
|
|
|
-- begin a new token whose text is initialized with the rune array Str.
procedure Start_Token (C: in out Compiler; Str: in S.Rune_Array) is
begin
	-- reset the token first, then store the whole array.
	Start_Token (C);
	C.Tk.Buf.Append (Str);
end Start_Token;
|
|
|
|
|
|
|
|
-- add the rune Ch to the end of the text of the current token.
procedure Feed_Token (C: in out Compiler; Ch: in R.Rune) is
begin
	C.Tk.Buf.Append (Ch);
end Feed_Token;
|
|
|
|
|
|
|
|
-- add a character code to the end of the text of the current token.
-- the code is converted with R.To_Rune before it is stored.
procedure Feed_Token (C: in out Compiler; Code: in R.Code) is
begin
	Feed_Token (C => C, Ch => R.To_Rune(Code));
end Feed_Token;
|
|
|
|
|
|
|
|
-- finish the current token: tag it with Id, hand it over to Got_Token
-- and put the lexer back to LX_START.
procedure End_Token (C: in out Compiler; Id: in Token_Id) is
begin
	C.Tk.Id := Id;
	Got_Token (C);
	Set_Lexer_State (C => C, State => LX_START);
end End_Token;
|
|
|
|
|
|
|
|
-- finish the current token after adding the rune Ch as its last rune.
procedure End_Token (C: in out Compiler; Id: in Token_Id; Ch: in R.Rune) is
begin
	-- the final rune goes in first so that Got_Token sees the full text.
	C.Tk.Buf.Append (Ch);

	-- tagging, delivery and the switch back to LX_START are shared
	-- with the variant that takes no extra rune.
	End_Token (C, Id);
end End_Token;
|
|
|
|
|
|
|
|
-- finish the current token after adding a character code as its last
-- rune. the code is converted with R.To_Rune before it is stored.
procedure End_Token (C: in out Compiler; Id: in Token_Id; Code: in R.Code) is
begin
	End_Token (C => C, Id => Id, Ch => R.To_Rune(Code));
end End_Token;
|
|
|
|
|
|
|
|
-- feed a single character code to the lexer.
-- the code is interpreted according to the current lexer state.
-- when the code terminates the token being collected, the token is
-- ended and the same code is processed again from LX_START.
-- Syntax_Error is raised when a code that cannot start any token is
-- seen in LX_START.
procedure Feed_Char_Code (C: in out Compiler; Code: in R.Code) is
begin
<<Start_Over>>
	-- debug trace of the code being processed. it is printed again each
	-- time the code is reprocessed through Start_Over.
	if R.Is_Eof(Code) then
		ada.text_io.put_line ("EOF");
	else
		ada.text_io.put_line (R.To_Rune(Code)'Img);
	end if;

	case C.Lx.State is
		when LX_START =>
			if R.Is_Eof(Code) then
				Start_Token (C, LB_EOF);
				End_Token (C, TK_EOF);
				-- this procedure doesn't prevent you from feeding more
				-- after EOF. but it's not desirable to feed more after EOF.
			elsif R.Is_Space(Code) then
				-- ignore. carry on
				null;
			elsif R.Is_Alpha(Code) then
				Set_Lexer_State (C, LX_IDENT, Code);
			elsif R.Is_Digit(Code) then
				Set_Lexer_State (C, LX_NUMBER, Code);
			elsif R.Is_Rune(Code, R.V.Semicolon) then
				Start_Token (C, Code);
				End_Token (C, TK_SEMICOLON);
			elsif R.Is_Rune(Code, R.V.Left_Arrow) then
				Set_Lexer_State (C, LX_OP_LESS, Code);
			elsif R.Is_Rune(Code, R.V.Right_Arrow) then
				Set_Lexer_State (C, LX_OP_GREATER, Code);
			elsif R.Is_Rune(Code, R.V.Number_Sign) then
				-- restart the token buffer with the number sign, like every
				-- other multi-rune token does. without this the buffer still
				-- holds the text of the previous token and the directive
				-- name gets appended to it.
				Set_Lexer_State (C, LX_DIRECTIVE, Code);
			else
				raise Syntax_Error;
			end if;

		when LX_DIRECTIVE =>
			if R.Is_Alnum(Code) or else R.Is_Rune(Code, R.V.Underline) then
				Feed_Token (C, Code);
			else
				-- the code is not part of the directive. reprocess it.
				End_Token (C, TK_DIRECTIVE);
				goto Start_Over;
			end if;

		when LX_OP_GREATER =>
			if R.Is_Rune(Code, R.V.Equal_Sign) then
				End_Token (C, TK_GE, Code);
			else
				-- the code is not part of the operator. reprocess it.
				End_Token (C, TK_GT);
				goto Start_Over;
			end if;

		when LX_OP_LESS =>
			if R.Is_Rune(Code, R.V.Equal_Sign) then
				End_Token (C, TK_LE, Code);
			else
				-- the code is not part of the operator. reprocess it.
				End_Token (C, TK_LT);
				goto Start_Over;
			end if;

		when LX_COMMENT =>
			null;

		when LX_IDENT =>
			if R.Is_Alnum(Code) or else R.Is_Rune(Code, R.V.Underline) then
				Feed_Token (C, Code);
			else
				-- the code is not part of the identifier. reprocess it.
				End_Token (C, TK_IDENT);
				goto Start_Over;
			end if;

		when LX_NUMBER =>
			if R.Is_Digit(Code) then
				Feed_Token (C, Code);
			else
				End_Token (C, TK_IDENT); -- TODO: change this
				goto Start_Over;
			end if;
	end case;
end Feed_Char_Code;
|
|
|
|
|
|
|
|
-- feed every rune in Data to the lexer, in order, one at a time.
procedure Feed (C: in out Compiler; Data: in S.Rune_Array) is
begin
	for Index in Data'First .. Data'Last loop
		-- the lexer works on character codes, not on runes.
		Feed_Char_Code (C => C, Code => R.To_Code(Data(Index)));
	end loop;
end Feed;
|
|
|
|
|
|
|
|
-- signal the end of input by feeding the EOF code to the lexer.
procedure End_Feed (C: in out Compiler) is
begin
	Feed_Char_Code (C => C, Code => R.P.EOF);
end End_Feed;
|
|
|
|
|
|
|
|
end H3.Compilers;
|