start local static declarations

This commit is contained in:
pommicket 2022-02-05 15:50:49 -05:00
parent 267b52814e
commit c5e2556d31
2 changed files with 234 additions and 196 deletions

View file

@ -38,6 +38,24 @@ function structure_is_union
; parse a translation unit
function parse_tokens
argument tokens
local token
token = tokens
:parse_tokens_loop
if *1token == TOKEN_EOF goto parse_tokens_eof
parse_toplevel_declaration(&token, global_variables)
goto parse_tokens_loop
:parse_tokens_eof
return
; also handles static declarations inside functions
; advances *p_token past semicolon
; static_vars = where to put static variables
function parse_toplevel_declaration
argument p_token
argument static_vars
local token
local ident
local type
@ -55,206 +73,221 @@ function parse_tokens
local is_extern
local out
token = tokens
:parse_tokens_loop
is_extern = 0
if *1token == TOKEN_EOF goto parse_tokens_eof
if *1token == KEYWORD_STATIC goto parse_static_toplevel_decl
if *1token == KEYWORD_EXTERN goto parse_extern_toplevel_decl
if *1token == KEYWORD_TYPEDEF goto parse_typedef
b = token_is_type(token)
if b != 0 goto parse_toplevel_decl
token_error(token, .str_bad_statement)
:str_bad_statement
string Bad statement.
byte 0
:parse_static_toplevel_decl
token += 16 ; we don't care that this is static
goto parse_toplevel_decl
:parse_extern_toplevel_decl
token = *8p_token
is_extern = 0
if *1token == KEYWORD_STATIC goto parse_static_toplevel_decl
if *1token == KEYWORD_EXTERN goto parse_extern_toplevel_decl
if *1token == KEYWORD_TYPEDEF goto parse_typedef
b = token_is_type(token)
if b != 0 goto parse_toplevel_decl
token_error(token, .str_bad_decl)
:str_bad_decl
string Bad declaration.
byte 0
:parse_tld_ret
*8p_token = token
return
:parse_static_toplevel_decl
token += 16 ; we don't care that this is static
goto parse_toplevel_decl
:parse_extern_toplevel_decl
token += 16
is_extern = 1
goto parse_toplevel_decl
:parse_toplevel_decl
base_type = token
base_type_end = type_get_base_end(token)
token = base_type_end
:tl_decl_loop
prefix = token
prefix_end = type_get_prefix_end(prefix)
if *1prefix_end != TOKEN_IDENTIFIER goto tl_decl_no_ident
name = prefix_end + 8
name = *8name
suffix = prefix_end + 16
suffix_end = type_get_suffix_end(prefix)
type = types_bytes_used
parse_type_declarators(prefix, prefix_end, suffix, suffix_end)
parse_base_type(base_type, base_type_end)
; ensure rwdata_end_addr is aligned to 8 bytes
; otherwise addresses could be screwed up
rwdata_end_addr += 7
rwdata_end_addr >= 3
rwdata_end_addr <= 3
token = suffix_end
if *1token == SYMBOL_LBRACE goto parse_function_definition
if is_extern != 0 goto parse_tl_decl_cont ; ignore external variable declarations
; deal with the initializer if there is one
if *1token == SYMBOL_SEMICOLON goto parse_tld_no_initializer
if *1token == SYMBOL_COMMA goto parse_tld_no_initializer
if *1token == SYMBOL_EQ goto parse_tld_initializer
token_error(token, .str_unrecognized_stuff_after_declaration)
:str_unrecognized_stuff_after_declaration
string Declaration should be followed by one of: { , =
byte 32
byte 59 ; semicolon
byte 0
:parse_tl_decl_cont
if *1token == SYMBOL_SEMICOLON goto tl_decl_loop_done
if *1token != SYMBOL_COMMA goto tld_bad_stuff_after_decl
token += 16
is_extern = 1
goto parse_toplevel_decl
:parse_toplevel_decl
base_type = token
base_type_end = type_get_base_end(token)
token = base_type_end
:tl_decl_loop
prefix = token
prefix_end = type_get_prefix_end(prefix)
if *1prefix_end != TOKEN_IDENTIFIER goto tl_decl_no_ident
name = prefix_end + 8
name = *8name
suffix = prefix_end + 16
suffix_end = type_get_suffix_end(prefix)
type = types_bytes_used
parse_type_declarators(prefix, prefix_end, suffix, suffix_end)
parse_base_type(base_type, base_type_end)
; ensure rwdata_end_addr is aligned to 8 bytes
; otherwise addresses could be screwed up
rwdata_end_addr += 7
rwdata_end_addr >= 3
rwdata_end_addr <= 3
token = suffix_end
if *1token == SYMBOL_LBRACE goto parse_function_definition
if is_extern != 0 goto parse_tl_decl_cont ; ignore external variable declarations
; deal with the initializer if there is one
if *1token == SYMBOL_SEMICOLON goto parse_tld_no_initializer
if *1token == SYMBOL_COMMA goto parse_tld_no_initializer
if *1token == SYMBOL_EQ goto parse_tld_initializer
token_error(token, .str_unrecognized_stuff_after_declaration)
:str_unrecognized_stuff_after_declaration
string Declaration should be followed by one of: { , =
byte 32
byte 59 ; semicolon
byte 0
:parse_tl_decl_cont
if *1token == SYMBOL_SEMICOLON goto tl_decl_loop_done
if *1token != SYMBOL_COMMA goto tld_bad_stuff_after_decl
token += 16
goto tl_decl_loop
:tl_decl_loop_done
token += 16 ; skip semicolon
goto parse_tokens_loop
:tl_decl_no_ident
token_error(prefix_end, .str_tl_decl_no_ident)
:str_tl_decl_no_ident
string No identifier in top-level declaration.
byte 0
:tld_bad_stuff_after_decl
token_error(token, .str_tld_bad_stuff_after_decl)
:str_tld_bad_stuff_after_decl
string Declarations should be immediately followed by a comma or semicolon.
byte 0
:parse_tld_no_initializer
p = types + type
if *1p == TYPE_FUNCTION goto parse_tl_decl_cont ; ignore function declarations -- we do two passes anyways
b = ident_list_lookup(global_variables, name)
if b != 0 goto global_redefinition
c = type < 32
c |= rwdata_end_addr
ident_list_add(global_variables, name, c)
; just skip forward by the size of this variable -- it'll automatically be filled with 0s.
rwdata_end_addr += type_sizeof(type)
goto parse_tl_decl_cont
:parse_tld_initializer
if *1p == TYPE_FUNCTION goto function_initializer
b = ident_list_lookup(global_variables, name)
if b != 0 goto global_redefinition
token += 16 ; skip =
c = type < 32
c |= rwdata_end_addr
ident_list_add(global_variables, name, c)
parse_constant_initializer(&token, type)
goto parse_tl_decl_cont
:global_redefinition
token_error(token, .str_global_redefinition)
:str_global_redefinition
string Redefinition of global variable.
goto tl_decl_loop
:tl_decl_loop_done
token += 16 ; skip semicolon
goto parse_tld_ret
:tl_decl_no_ident
token_error(prefix_end, .str_tl_decl_no_ident)
:str_tl_decl_no_ident
string No identifier in top-level declaration.
byte 0
:function_initializer
token_error(token, .str_function_initializer)
:str_function_initializer
string Functions should not have initializers.
:tld_bad_stuff_after_decl
token_error(token, .str_tld_bad_stuff_after_decl)
:str_tld_bad_stuff_after_decl
string Declarations should be immediately followed by a comma or semicolon.
byte 0
:parse_function_definition
p = types + type
; @TODO: parameters
; @NOTE: remember to turn array members into pointers
if *1p != TYPE_FUNCTION goto lbrace_after_declaration
global function_stmt_data ; initialized in main
global function_stmt_data_bytes_used
p = function_stmt_data + function_stmt_data_bytes_used
out = p
parse_statement(&token, &out)
if block_depth != 0 goto stmtdepth_internal_err
function_stmt_data_bytes_used = out - function_stmt_data
ident_list_add(function_statements, name, p)
print_statement(p)
goto parse_tokens_loop
:stmtdepth_internal_err
token_error(token, .str_stmtdepth_internal_err)
:str_stmtdepth_internal_err
string Internal compiler error: parse_stmt_depth is not 0 after parsing function body.
byte 0
:lbrace_after_declaration
token_error(token, .str_lbrace_after_declaration)
:str_lbrace_after_declaration
string Opening { after declaration of non-function.
byte 0
:parse_typedef
base_type = token + 16
base_type_end = type_get_base_end(base_type)
token = base_type_end
:typedef_loop
prefix = token
prefix_end = type_get_prefix_end(prefix)
if *1prefix_end != TOKEN_IDENTIFIER goto typedef_no_ident
ident = prefix_end + 8
ident = *8ident
suffix = prefix_end + 16
suffix_end = type_get_suffix_end(prefix)
;putc('B)
;putc(':)
;print_tokens(base_type, base_type_end)
;putc('P)
;putc(':)
;print_tokens(prefix, prefix_end)
;putc('S)
;putc(':)
;print_tokens(suffix, suffix_end)
type = types_bytes_used
parse_type_declarators(prefix, prefix_end, suffix, suffix_end)
parse_base_type(base_type)
puts(.str_typedef)
putc(32)
print_type(type)
putc(10)
b = ident_list_lookup(typedefs, ident)
if b != 0 goto typedef_redefinition
ident_list_add(typedefs, ident, type)
token = suffix_end
if *1token == SYMBOL_SEMICOLON goto typedef_loop_end
if *1token != SYMBOL_COMMA goto bad_typedef
token += 16 ; skip comma
goto typedef_loop
:typedef_loop_end
token += 16 ; skip semicolon
goto parse_tokens_loop
:typedef_no_ident
token_error(token, .str_typedef_no_ident)
:str_typedef_no_ident
string No identifier in typedef declaration.
:parse_tld_no_initializer
p = types + type
if *1p == TYPE_FUNCTION goto parse_tl_decl_cont ; ignore function declarations -- we do two passes anyways
b = ident_list_lookup(static_vars, name)
if b != 0 goto global_redefinition
c = type < 32
c |= rwdata_end_addr
ident_list_add(static_vars, name, c)
; just skip forward by the size of this variable -- it'll automatically be filled with 0s.
rwdata_end_addr += type_sizeof(type)
goto parse_tl_decl_cont
:parse_tld_initializer
p = types + type
if *1p == TYPE_FUNCTION goto function_initializer
b = ident_list_lookup(static_vars, name)
if b != 0 goto global_redefinition
token += 16 ; skip =
c = type < 32
c |= rwdata_end_addr
ident_list_add(static_vars, name, c)
parse_constant_initializer(&token, type)
goto parse_tl_decl_cont
:global_redefinition
token_error(token, .str_global_redefinition)
:str_global_redefinition
string Redefinition of global variable.
byte 0
:function_initializer
token_error(token, .str_function_initializer)
:str_function_initializer
string Functions should not have initializers.
byte 0
:parse_function_definition
if block_depth != 0 goto nested_function
p = types + type
; @TODO: parameters
; @NOTE: remember to turn array members into pointers
if *1p != TYPE_FUNCTION goto lbrace_after_declaration
global function_stmt_data ; initialized in main
global function_stmt_data_bytes_used
p = function_stmt_data + function_stmt_data_bytes_used
out = p
parse_statement(&token, &out)
if block_depth != 0 goto stmtdepth_internal_err
function_stmt_data_bytes_used = out - function_stmt_data
ident_list_add(function_statements, name, p)
print_statement(p)
goto parse_tld_ret
:stmtdepth_internal_err
token_error(token, .str_stmtdepth_internal_err)
:str_stmtdepth_internal_err
string Internal compiler error: parse_stmt_depth is not 0 after parsing function body.
byte 0
:bad_typedef
token_error(token, .str_bad_typedef)
:str_bad_typedef
string Bad typedef.
:lbrace_after_declaration
token_error(token, .str_lbrace_after_declaration)
:str_lbrace_after_declaration
string Opening { after declaration of non-function.
byte 0
:typedef_redefinition
token_error(token, .str_typedef_redefinition)
:str_typedef_redefinition
string typedef redefinition.
:nested_function
token_error(token, .str_nested_function)
:str_nested_function
string Nested function.
byte 0
:parse_tokens_eof
return
:parse_typedef
if block_depth > 0 goto local_typedef
base_type = token + 16
base_type_end = type_get_base_end(base_type)
token = base_type_end
:typedef_loop
prefix = token
prefix_end = type_get_prefix_end(prefix)
if *1prefix_end != TOKEN_IDENTIFIER goto typedef_no_ident
ident = prefix_end + 8
ident = *8ident
suffix = prefix_end + 16
suffix_end = type_get_suffix_end(prefix)
;putc('B)
;putc(':)
;print_tokens(base_type, base_type_end)
;putc('P)
;putc(':)
;print_tokens(prefix, prefix_end)
;putc('S)
;putc(':)
;print_tokens(suffix, suffix_end)
type = types_bytes_used
parse_type_declarators(prefix, prefix_end, suffix, suffix_end)
parse_base_type(base_type)
puts(.str_typedef)
putc(32)
print_type(type)
putc(10)
b = ident_list_lookup(typedefs, ident)
if b != 0 goto typedef_redefinition
ident_list_add(typedefs, ident, type)
token = suffix_end
if *1token == SYMBOL_SEMICOLON goto typedef_loop_end
if *1token != SYMBOL_COMMA goto bad_typedef
token += 16 ; skip comma
goto typedef_loop
:typedef_loop_end
token += 16 ; skip semicolon
goto parse_tld_ret
:local_typedef
; @NONSTANDARD
; we could add an extra "typedefs" argument to this function to fix this.
token_error(token, .str_local_typedef)
:str_local_typedef
string typedefs inside functions are not supported.
byte 0
:typedef_no_ident
token_error(token, .str_typedef_no_ident)
:str_typedef_no_ident
string No identifier in typedef declaration.
byte 0
:bad_typedef
token_error(token, .str_bad_typedef)
:str_bad_typedef
string Bad typedef.
byte 0
:typedef_redefinition
token_error(token, .str_typedef_redefinition)
:str_typedef_redefinition
string typedef redefinition.
byte 0
; write type, file, and line info for statement
function write_statement_header
@ -281,7 +314,6 @@ function parse_statement
local c
local n
out = *8p_out
token = *8p_token
@ -321,7 +353,10 @@ function parse_statement
*8p_out = out
return
:stmt_static_declaration
byte 0xcc ; @TODO
p = block_static_variables
p += block_depth < 3
parse_toplevel_declaration(&token, *8p)
goto parse_statement_ret
:stmt_break
write_statement_header(out, STATEMENT_BREAK, token)
token += 16