const std = @import("std");
const Allocator = std.mem.Allocator;
const assert = std.debug.assert;
const library = @import("../library.zig");
const Arena = library.Arena;
const byte_equal = library.byte_equal;
const BlockList = library.BlockList;
const BoundedArray = library.BoundedArray;
const enumFromString = library.enumFromString;
const PinnedArray = library.PinnedArray;
const MyAllocator = library.MyAllocator;
const lexer = @import("lexer.zig");
const Compilation = @import("../Compilation.zig");
const write = Compilation.write;
const logln = Compilation.logln;
const Token = Compilation.Token;
pub const Result = struct {
main_node_index: Node.Index,
time: u64,
};
pub const Logger = enum {
file,
token_errors,
symbol_declaration,
node_creation,
node_creation_detailed,
main_node,
container_members,
block,
assign,
suffix,
precedence,
@"switch",
pointer_like_type_expression,
switch_case,
consume_token,
pub var bitset = std.EnumSet(Logger).initMany(&.{
.file,
.token_errors,
.symbol_declaration,
.node_creation,
// .node_creation_detailed,
.main_node,
.container_members,
.block,
.assign,
.suffix,
.precedence,
.@"switch",
.pointer_like_type_expression,
.switch_case,
.consume_token,
});
};
// TODO: pack it to be more efficient
pub const Node = struct {
left: Node.Index,
right: Node.Index,
token: Token.Index,
id: Id,
// TODO: this is dangerous
pub const StackList = BoundedArray(Node.Index, 512);
pub const Index = PinnedArray(Node).Index;
pub const Range = struct {
start: u32,
end: u32,
};
pub const Id = enum {
main,
identifier,
number,
@"return",
function_declaration_no_arguments,
container_declaration,
string_literal,
constant_symbol_declaration,
variable_symbol_declaration,
assign,
@"comptime",
node_list,
@"while",
function_prototype,
function_definition,
keyword_noreturn,
keyword_true,
number_literal,
@"unreachable",
field_access,
comptime_block,
block,
unsigned_integer_type,
signed_integer_type,
slice_type,
array_type,
argument_declaration,
comptime_argument_declaration,
intrinsic,
ssize_type,
usize_type,
void_type,
call,
pointer_type,
dot_literal,
address_of,
pointer_dereference,
keyword_false,
compare_equal,
compare_not_equal,
compare_less,
compare_greater,
compare_less_equal,
compare_greater_equal,
@"if",
if_else,
@"switch",
switch_case,
enum_type,
enum_field,
extern_qualifier,
export_qualifier,
add,
sub,
mul,
div,
mod,
bit_and,
bit_xor,
expression_group,
bit_or,
shift_left,
shift_right,
add_assign,
sub_assign,
mul_assign,
div_assign,
mod_assign,
discarded_assign,
bool_type,
named_argument,
optional_type,
container_field,
struct_type,
container_literal,
container_field_initialization,
array_index_initialization,
boolean_not,
null_literal,
if_else_payload,
if_payload,
discard,
slice,
range,
negation,
one_complement,
anonymous_container_literal,
anonymous_array_literal,
array_literal,
indexed_access,
calling_convention,
assembly_register,
assembly_statement,
// assembly_block,
for_condition,
for_loop,
undefined,
zero_terminated,
null_terminated,
const_expression,
many_pointer_expression,
optional_unwrap,
anonymous_empty_literal,
empty_container_literal_guess,
break_expression,
continue_expression,
character_literal,
function_attribute_naked,
function_attribute_cc,
symbol_attribute_extern,
symbol_attribute_export,
symbol_attributes,
metadata,
test_declaration,
all_errors,
error_union,
catch_expression,
try_expression,
error_type,
error_field,
assembly_code_expression,
assembly_instruction,
assembly_code_block,
bool_and,
bool_or,
payload,
catch_payload,
bitfield_type,
comptime_expression,
self,
any,
for_expressions,
slice_metadata,
orelse_expression,
type,
or_assign,
wrapping_add,
saturated_add,
wrapping_sub,
saturated_sub,
wrapping_mul,
saturated_mul,
};
};
const Error = error{
unexpected_token,
not_implemented,
OutOfMemory,
};
const Analyzer = struct {
lexer: lexer.Result,
token_i: Token.Index,
token_buffer: *Token.Buffer,
nodes: *PinnedArray(Node),
node_lists: *PinnedArray([]const Node.Index),
source_file: []const u8,
allocator: Allocator,
my_allocator: *MyAllocator,
arena: *Arena,
suffix_depth: usize = 0,
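// Returns the current token index and consumes the token when it matches
// `expected_token_id`; otherwise it emits a panic-level diagnostic with the
// offending source chunk and fails with error.unexpected_token.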
fn expectToken(analyzer: *Analyzer, expected_token_id: Token.Id) !Token.Index {
const token_i = analyzer.token_i;
const token_id = analyzer.peekToken();
const is_expected_token = token_id == expected_token_id;
if (is_expected_token) {
analyzer.consumeToken();
const result = token_i;
return result;
} else {
const file_offset = analyzer.getTokenOffset(token_i);
const file_chunk = analyzer.source_file[file_offset..];
try write(.panic, "Unexpected token ");
try write(.panic, @tagName(token_id));
try write(.panic, " when expected ");
try write(.panic, @tagName(expected_token_id));
try write(.panic, "\n");
try write(.panic, "File chunk:\n\n```\n");
try write(.panic, file_chunk);
try write(.panic, "\n```\n");
// std.debug.print("Unexpected token {s} when expected {s}\n| |\n v \n```\n{s}\n```", .{ @tagName(token_id), @tagName(expected_token_id), file_chunk });
@breakpoint();
return error.unexpected_token;
}
}
fn getTokenOffset(analyzer: *Analyzer, token_index: Token.Index) u32 {
const token = analyzer.token_buffer.tokens.get(token_index);
return token.offset;
}
fn peekTokenAhead(analyzer: *Analyzer, ahead_offset: u32) Token.Id {
const index = @intFromEnum(analyzer.token_i) + ahead_offset;
const token = analyzer.token_buffer.tokens.get_unchecked(index);
return token.id;
}
fn peekToken(analyzer: *Analyzer) Token.Id {
const token = analyzer.peekTokenAhead(0);
return token;
}
fn hasTokens(analyzer: *Analyzer) bool {
const token_end = analyzer.getTokenEnd();
return @intFromEnum(analyzer.token_i) < token_end;
}
fn getTokenEnd(analyzer: *const Analyzer) u32 {
return @intFromEnum(analyzer.lexer.offset) + analyzer.lexer.count;
}
fn consumeToken(analyzer: *Analyzer) void {
analyzer.consumeTokens(1);
}
fn consumeTokens(analyzer: *Analyzer, token_count: u32) void {
assert((@intFromEnum(analyzer.token_i) + token_count) <= analyzer.getTokenEnd());
// log(.parser, .consume_token, "Consuming {} {s}: ", .{ token_count, if (token_count == 1) "token" else "tokens" });
// for (0..token_count) |i_usize| {
// const i: u32 = @intCast(i_usize);
// const token_id = analyzer.peekTokenAhead(i);
// _ = token_id; // autofix
// const token_index = @intFromEnum(analyzer.token_i) + i;
// const token_bytes = analyzer.bytes(token_index);
// _ = token_bytes; // autofix
// // log(.parser, .consume_token, "{s}, '{s}'", .{ @tagName(token_id), token_bytes });
// }
// log(.parser, .consume_token, "\n", .{});
analyzer.token_i = @enumFromInt(@intFromEnum(analyzer.token_i) + token_count);
}
fn bytes(analyzer: *const Analyzer, token_index: Token.Index) []const u8 {
const token = analyzer.token_buffer.tokens.get(token_index);
const slice = analyzer.source_file[token.offset..][0..token.length];
return slice;
}
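// Parses a symbol declaration. Judging from the tokens accepted below, the
// surface syntax is roughly:
//   (const|var) name [: type [: attribute, ...]] = initializer ;
// e.g. `const x: u32 : export = 0;`. The optional type and attribute list are
// folded into a single `metadata` node (left = type, right = attributes), and
// the trailing semicolon is skipped when the initializer is a function
// definition.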
fn symbolDeclaration(analyzer: *Analyzer) anyerror!Node.Index {
const first = analyzer.token_i;
const mutability_node_id: Node.Id = switch (analyzer.peekToken()) {
.fixed_keyword_var => .variable_symbol_declaration,
.fixed_keyword_const => .constant_symbol_declaration,
else => |t| @panic(@tagName(t)),
};
analyzer.consumeToken();
const declaration_name_token = try analyzer.expectToken(.identifier);
const declaration_name = analyzer.bytes(declaration_name_token);
_ = declaration_name; // autofix
// logln(.parser, .symbol_declaration, "Starting parsing declaration \"{s}\"", .{declaration_name});
// logln(.parser, .symbol_declaration, "Current token: {}", .{analyzer.peekToken()});
const metadata_node_index = switch (analyzer.peekToken()) {
.operator_colon => blk: {
const colon = try analyzer.expectToken(.operator_colon);
const type_node_index = if (analyzer.peekToken() != .operator_colon) try analyzer.typeExpression() else .null;
const attribute_node_index: Node.Index = if (analyzer.peekToken() == .operator_colon) b: {
analyzer.consumeToken();
var stack_list = Node.StackList{};
while (analyzer.peekToken() != .operator_assign) {
const identifier = try analyzer.expectToken(.identifier);
const identifier_name = analyzer.bytes(identifier);
const attribute_node = inline for (@typeInfo(Compilation.Debug.Declaration.Global.Attribute).Enum.fields) |enum_field| {
if (byte_equal(identifier_name, enum_field.name)) {
const attribute = @field(Compilation.Debug.Declaration.Global.Attribute, enum_field.name);
const attribute_node = switch (attribute) {
.@"export",
.@"extern",
=> try analyzer.addNode(.{
.id = @field(Node.Id, "symbol_attribute_" ++ @tagName(attribute)),
.token = identifier,
.left = .null,
.right = .null,
}),
};
break attribute_node;
}
} else @panic(identifier_name);
stack_list.appendAssumeCapacity(attribute_node);
switch (analyzer.peekToken()) {
.operator_assign => {},
.operator_comma => analyzer.consumeToken(),
else => |t| @panic(@tagName(t)),
}
}
break :b try analyzer.nodeList(&stack_list);
} else .null;
break :blk try analyzer.addNode(.{
.id = .metadata,
.token = colon,
.left = type_node_index,
.right = attribute_node_index,
});
},
else => Node.Index.null,
};
_ = try analyzer.expectToken(.operator_assign);
const init_node_index = try analyzer.expression();
const init_node = analyzer.nodes.get(init_node_index);
switch (init_node.id) {
.function_definition => {},
else => _ = try analyzer.expectToken(.operator_semicolon),
}
// TODO:
const declaration = Node{
.id = mutability_node_id,
.token = first,
.left = metadata_node_index,
.right = init_node_index,
};
// logln(.parser, .symbol_declaration, "Adding declaration \"{s}\" with init node of type: {s}", .{ declaration_name, @tagName(init_node.id) });
return try analyzer.addNode(declaration);
}
fn function(analyzer: *Analyzer) !Node.Index {
const token = analyzer.token_i;
assert(analyzer.peekToken() == .fixed_keyword_fn);
analyzer.consumeToken();
const function_prototype = try analyzer.functionPrototype();
const is_comptime = false;
_ = is_comptime;
return switch (analyzer.peekToken()) {
.operator_left_brace => try analyzer.addNode(.{
.id = .function_definition,
.token = token,
.left = function_prototype,
.right = try analyzer.block(),
}),
.operator_semicolon => function_prototype,
else => |t| @panic(@tagName(t)),
};
}
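// Parses a function prototype: optional attribute identifiers (`naked`,
// `cc(...)`) before the parameter list, then the parameters, then the return
// type expression. Note that the return type is appended as the final entry
// of the attribute node list stored in `right`.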
fn functionPrototype(analyzer: *Analyzer) !Node.Index {
const token = analyzer.token_i;
var attribute_and_return_type_node_list = Node.StackList{};
while (analyzer.peekToken() != .operator_left_parenthesis) {
const identifier = try analyzer.expectToken(.identifier);
const identifier_name = analyzer.bytes(identifier);
const attribute_node = inline for (@typeInfo(Compilation.Function.Attribute).Enum.fields) |enum_field| {
if (byte_equal(identifier_name, enum_field.name)) {
const attribute = @field(Compilation.Function.Attribute, enum_field.name);
const attribute_node = switch (attribute) {
.naked => try analyzer.addNode(.{
.id = @field(Node.Id, "function_attribute_" ++ @tagName(attribute)),
.token = identifier,
.left = .null,
.right = .null,
}),
.cc => try analyzer.addNode(.{
.id = .function_attribute_cc,
.token = identifier,
.left = b: {
_ = try analyzer.expectToken(.operator_left_parenthesis);
const cc = try analyzer.expression();
_ = try analyzer.expectToken(.operator_right_parenthesis);
break :b cc;
},
.right = .null,
}),
else => |t| @panic(@tagName(t)),
};
break attribute_node;
}
} else @panic(identifier_name);
attribute_and_return_type_node_list.appendAssumeCapacity(attribute_node);
if (analyzer.peekToken() == .operator_comma) analyzer.consumeToken();
}
assert(analyzer.peekToken() == .operator_left_parenthesis);
const arguments = try analyzer.argumentList(.operator_left_parenthesis, .operator_right_parenthesis);
const return_type = try analyzer.typeExpression();
attribute_and_return_type_node_list.appendAssumeCapacity(return_type);
const function_prototype = try analyzer.addNode(.{
.id = .function_prototype,
.token = token,
.left = arguments,
.right = try analyzer.nodeList(&attribute_and_return_type_node_list),
});
return function_prototype;
}
fn argumentList(analyzer: *Analyzer, maybe_start_token: ?Token.Id, end_token: Token.Id) !Node.Index {
if (maybe_start_token) |start_token| {
_ = try analyzer.expectToken(start_token);
}
var list = Node.StackList{};
while (analyzer.peekToken() != end_token) {
const identifier_token = analyzer.token_i;
const id: Node.Id = switch (analyzer.peekToken()) {
.operator_dollar => b: {
analyzer.consumeToken();
break :b .comptime_argument_declaration;
},
else => .argument_declaration,
};
switch (analyzer.peekToken()) {
.identifier, .discard => analyzer.consumeToken(),
else => |t| @panic(@tagName(t)),
}
_ = try analyzer.expectToken(.operator_colon);
const type_expression = try analyzer.typeExpression();
if (analyzer.peekToken() == .operator_comma) {
analyzer.consumeToken();
}
list.appendAssumeCapacity(try analyzer.addNode(.{
.id = id,
.token = identifier_token,
.left = type_expression,
.right = Node.Index.null,
}));
}
_ = try analyzer.expectToken(end_token);
if (list.len != 0) {
return try analyzer.nodeList(&list);
} else {
return Node.Index.null;
}
}
fn assignExpressionStatement(analyzer: *Analyzer) !Node.Index {
const result = try analyzer.assignExpression();
_ = try analyzer.expectToken(.operator_semicolon);
return result;
}
fn block(analyzer: *Analyzer) anyerror!Node.Index {
const left_brace = try analyzer.expectToken(.operator_left_brace);
var list = Node.StackList{};
while (analyzer.peekToken() != .operator_right_brace) {
const first_statement_token = analyzer.peekToken();
// logln(.parser, .block, "First statement token: {s}", .{@tagName(first_statement_token)});
const statement_index = switch (first_statement_token) {
.fixed_keyword_while => try analyzer.whileExpression(),
.fixed_keyword_switch => try analyzer.switchExpression(),
.fixed_keyword_if => try analyzer.ifExpression(),
.fixed_keyword_for => try analyzer.forExpression(),
.fixed_keyword_const,
.fixed_keyword_var,
=> try analyzer.symbolDeclaration(),
else => try analyzer.assignExpressionStatement(),
};
list.appendAssumeCapacity(statement_index);
}
_ = try analyzer.expectToken(.operator_right_brace);
return try analyzer.addNode(.{
.id = .block,
.token = left_brace,
.left = try analyzer.nodeList(&list),
.right = Node.Index.null,
});
}
fn whileExpression(analyzer: *Analyzer) anyerror!Node.Index {
const while_identifier_index = try analyzer.expectToken(.fixed_keyword_while);
_ = try analyzer.expectToken(.operator_left_parenthesis);
// TODO:
const while_condition = try analyzer.expression();
_ = try analyzer.expectToken(.operator_right_parenthesis);
const while_block = try analyzer.block();
if (analyzer.peekToken() == .fixed_keyword_else) {
analyzer.consumeToken();
unreachable;
}
return analyzer.addNode(.{
.id = .@"while",
.token = while_identifier_index,
.left = while_condition,
.right = while_block,
});
}
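// Parses `switch (expr) { case0, case1 => arm, else => arm, }`. A case list
// may contain `start...end` ranges (operator_triple_dot), `else` yields a
// .null case node, and every arm must be terminated by a comma, even when
// the arm is a block.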
fn switchExpression(analyzer: *Analyzer) anyerror!Node.Index {
// logln(.parser, .@"switch", "Parsing switch...", .{});
const switch_token = analyzer.token_i;
analyzer.consumeToken();
_ = try analyzer.expectToken(.operator_left_parenthesis);
const switch_expression = try analyzer.expression();
_ = try analyzer.expectToken(.operator_right_parenthesis);
// logln(.parser, .@"switch", "Parsed switch expression...", .{});
_ = try analyzer.expectToken(.operator_left_brace);
var list = Node.StackList{};
while (analyzer.peekToken() != .operator_right_brace) {
const case_token = analyzer.token_i;
// logln(.parser, .@"switch", "Parsing switch case...", .{});
const case_node = switch (analyzer.peekToken()) {
.fixed_keyword_else => blk: {
analyzer.consumeToken();
break :blk Node.Index.null;
},
else => blk: {
var array_list = Node.StackList{};
while (true) {
const token = analyzer.token_i;
const left = try analyzer.expression();
const switch_case_node = switch (analyzer.peekToken()) {
.operator_triple_dot => try analyzer.addNode(.{
.id = .range,
.token = b: {
analyzer.consumeToken();
break :b token;
},
.left = left,
.right = try analyzer.expression(),
}),
else => left,
};
array_list.appendAssumeCapacity(switch_case_node);
switch (analyzer.peekToken()) {
.operator_comma => analyzer.consumeToken(),
.operator_switch_case => break,
else => {},
}
}
break :blk switch (array_list.len) {
0 => unreachable,
1 => array_list.buffer[0],
else => try analyzer.nodeList(&array_list),
};
},
};
_ = try analyzer.expectToken(.operator_switch_case);
const is_left_brace = analyzer.peekToken() == .operator_left_brace;
const expr = switch (is_left_brace) {
true => try analyzer.block(),
false => try analyzer.assignExpression(),
};
// logln(.parser, .switch_case, "Comma token: \n```\n{s}\n```\n", .{analyzer.source_file[analyzer.tokens[analyzer.token_i].start..]});
_ = try analyzer.expectToken(.operator_comma);
const node = try analyzer.addNode(.{
.id = .switch_case,
.token = case_token,
.left = case_node,
.right = expr,
});
list.appendAssumeCapacity(node);
}
_ = try analyzer.expectToken(.operator_right_brace);
return try analyzer.addNode(.{
.id = .@"switch",
.token = switch_token,
.left = switch_expression,
.right = try analyzer.nodeList(&list),
});
}
fn parsePayload(analyzer: *Analyzer) !Node.Index {
_ = try analyzer.expectToken(.operator_bar);
const main_token = analyzer.token_i;
switch (analyzer.peekToken()) {
.identifier,
.discard,
=> analyzer.consumeToken(),
else => |t| @panic(@tagName(t)),
}
_ = try analyzer.expectToken(.operator_bar);
return try analyzer.addNode(.{
.id = .payload,
.token = main_token,
.left = .null,
.right = .null,
});
}
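// Parses `if (condition) expr [else expr]` with an optional `|payload|`
// capture after the condition. The plain `if` node is built first; an `else`
// branch wraps it in an `if_else` node, and a payload wraps the result once
// more in `if_payload` or `if_else_payload` with the capture on the right.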
fn ifExpression(analyzer: *Analyzer) anyerror!Node.Index {
const if_token = analyzer.token_i;
analyzer.consumeToken();
_ = try analyzer.expectToken(.operator_left_parenthesis);
const if_condition = try analyzer.expression();
_ = try analyzer.expectToken(.operator_right_parenthesis);
const payload = if (analyzer.peekToken() == .operator_bar) try analyzer.parsePayload() else Node.Index.null;
const if_taken_expression = try analyzer.expression();
const if_node = try analyzer.addNode(.{
.id = .@"if",
.token = if_token,
.left = if_condition,
.right = if_taken_expression,
});
const result = switch (analyzer.peekToken()) {
.fixed_keyword_else => blk: {
analyzer.consumeToken();
break :blk try analyzer.addNode(.{
.id = .if_else,
.token = if_token,
.left = if_node,
.right = try analyzer.expression(),
});
},
else => if_node,
};
if (payload == .null) {
return result;
} else {
return try analyzer.addNode(.{
.id = switch (result == if_node) {
true => .if_payload,
false => .if_else_payload,
},
.token = if_token,
.left = result,
.right = payload,
});
}
}
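// Parses `for (expression_or_range, ...) |capture, ...| body [else body]`.
// Ranges use `..` and may be open-ended; the number of captures must match
// the number of iterated expressions (checked below). The pair becomes a
// `for_condition` node and the two bodies a `for_expressions` node hanging
// off the `for_loop` node.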
fn forExpression(analyzer: *Analyzer) !Node.Index {
const token = try analyzer.expectToken(.fixed_keyword_for);
_ = try analyzer.expectToken(.operator_left_parenthesis);
var for_expression_list = Node.StackList{};
while (analyzer.peekToken() != .operator_right_parenthesis) {
const expression_token = analyzer.token_i;
const first = try analyzer.expression();
const node_index = switch (analyzer.peekToken()) {
.operator_double_dot => blk: {
analyzer.consumeToken();
break :blk try analyzer.addNode(.{
.id = .range,
.token = expression_token,
.left = first,
.right = switch (analyzer.peekToken()) {
.operator_right_parenthesis, .operator_comma => Node.Index.null,
else => try analyzer.expression(),
},
});
},
.operator_right_parenthesis,
.operator_comma,
=> first,
else => |t| @panic(@tagName(t)),
};
for_expression_list.appendAssumeCapacity(node_index);
switch (analyzer.peekToken()) {
.operator_comma => analyzer.consumeToken(),
.operator_right_parenthesis => {},
else => |t| @panic(@tagName(t)),
}
}
_ = try analyzer.expectToken(.operator_right_parenthesis);
_ = try analyzer.expectToken(.operator_bar);
var payload_nodes = Node.StackList{};
while (analyzer.peekToken() != .operator_bar) {
const payload_token = analyzer.token_i;
const id: Node.Id = switch (analyzer.peekToken()) {
.identifier => .identifier,
.discard => .discard,
else => |t| @panic(@tagName(t)),
};
analyzer.consumeToken();
switch (analyzer.peekToken()) {
.operator_bar => {},
.operator_comma => analyzer.consumeToken(),
else => |t| @panic(@tagName(t)),
}
payload_nodes.appendAssumeCapacity(try analyzer.addNode(.{
.id = id,
.token = payload_token,
.left = Node.Index.null,
.right = Node.Index.null,
}));
}
_ = try analyzer.expectToken(.operator_bar);
if (payload_nodes.len != for_expression_list.len) {
unreachable;
}
const for_condition_node = try analyzer.addNode(.{
.id = .for_condition,
.token = token,
.left = try analyzer.nodeList(&for_expression_list),
.right = try analyzer.nodeList(&payload_nodes),
});
const true_expression = switch (analyzer.peekToken()) {
.operator_left_brace => try analyzer.block(),
else => blk: {
const for_content_expression = try analyzer.expression();
_ = try analyzer.expectToken(.operator_semicolon);
break :blk for_content_expression;
},
};
const else_expression: Node.Index = if (analyzer.peekToken() == .fixed_keyword_else) b: {
analyzer.consumeToken();
const else_expression = if (analyzer.peekToken() == .operator_left_brace) try analyzer.block() else try analyzer.expression();
break :b else_expression;
} else .null;
const for_node = try analyzer.addNode(.{ .id = .for_loop, .token = token, .left = for_condition_node, .right = try analyzer.addNode(.{
.id = .for_expressions,
.token = .null,
.left = true_expression,
.right = else_expression,
}) });
return for_node;
}
fn continueExpression(analyzer: *Analyzer) !Node.Index {
const t = try analyzer.expectToken(.fixed_keyword_continue);
const node_index = try analyzer.addNode(.{
.id = .continue_expression,
.token = t,
.left = Node.Index.null,
.right = Node.Index.null,
});
return node_index;
}
fn breakExpression(analyzer: *Analyzer) !Node.Index {
const t = try analyzer.expectToken(.fixed_keyword_break);
const node_index = try analyzer.addNode(.{
.id = .break_expression,
.token = t,
.left = Node.Index.null,
.right = Node.Index.null,
});
return node_index;
}
fn assignExpression(analyzer: *Analyzer) !Node.Index {
const left = try analyzer.expression();
const expression_token = analyzer.token_i;
const expression_id: Node.Id = switch (analyzer.peekToken()) {
.operator_semicolon, .operator_comma, .operator_right_brace, .identifier => return left,
.operator_assign => .assign,
.operator_add_assign => .add_assign,
.operator_sub_assign => .sub_assign,
.operator_mul_assign => .mul_assign,
.operator_div_assign => .div_assign,
.operator_mod_assign => .mod_assign,
.operator_or_assign => .or_assign,
else => |t| @panic(@tagName(t)),
};
analyzer.consumeToken();
const right = try analyzer.expression();
const node = Node{
.id = expression_id,
.token = expression_token,
.left = left,
.right = right,
};
// logln(.parser, .assign, "assign:\nleft: {}.\nright: {}", .{ node.left, node.right });
return try analyzer.addNode(node);
}
fn parseAsmOperand(analyzer: *Analyzer) !Node.Index {
const token = analyzer.token_i;
const result = switch (analyzer.peekToken()) {
.identifier => try analyzer.addNode(.{
.id = .assembly_register,
.token = blk: {
analyzer.consumeToken();
break :blk token;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.number_literal => blk: {
analyzer.consumeToken();
break :blk analyzer.addNode(.{
.id = .number_literal,
.token = token,
.left = Node.Index.null,
.right = Node.Index.null,
});
},
.operator_left_brace => blk: {
analyzer.consumeToken();
const result = try analyzer.expression();
_ = try analyzer.expectToken(.operator_right_brace);
break :blk result;
},
else => |t| @panic(@tagName(t)),
};
return result;
}
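// Parses an intrinsic call. The intrinsic token's bytes are sliced from index
// 1, so the lexer appears to keep the leading sigil in the token text. The
// `asm` intrinsic is special-cased: instead of a regular argument list it
// takes a backtick-delimited block of `mnemonic operand, ...;` instructions,
// where operands are registers (identifiers), number literals, or `{expr}`
// code expressions.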
fn compilerIntrinsic(analyzer: *Analyzer) !Node.Index {
const intrinsic_token = try analyzer.expectToken(.intrinsic);
_ = try analyzer.expectToken(.operator_left_parenthesis);
const intrinsic_name = analyzer.bytes(intrinsic_token)[1..];
const intrinsic_id = inline for (@typeInfo(Compilation.IntrinsicId).Enum.fields) |enum_field| {
if (byte_equal(enum_field.name, intrinsic_name)) {
break @field(Compilation.IntrinsicId, enum_field.name);
}
} else @panic(intrinsic_name);
var list = Node.StackList{};
if (intrinsic_id == .@"asm") {
const backtick = try analyzer.expectToken(.operator_backtick);
var instruction_list = Node.StackList{};
while (analyzer.peekToken() != .operator_backtick) {
const instruction_token = analyzer.token_i;
const instruction_name = try analyzer.identifierNode();
var operand_list = Node.StackList{};
while (analyzer.peekToken() != .operator_semicolon) {
const node = switch (analyzer.peekToken()) {
.identifier => try analyzer.addNode(.{
.id = .assembly_register,
.token = b: {
const t = analyzer.token_i;
analyzer.consumeToken();
break :b t;
},
.left = .null,
.right = .null,
}),
.number_literal => try analyzer.addNode(.{
.id = .number_literal,
.token = b: {
const t = analyzer.token_i;
analyzer.consumeToken();
break :b t;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.operator_left_brace => b: {
const left_brace = try analyzer.expectToken(.operator_left_brace);
const code_expression = try analyzer.expression();
_ = try analyzer.expectToken(.operator_right_brace);
break :b try analyzer.addNode(.{
.id = .assembly_code_expression,
.token = left_brace,
.left = code_expression,
.right = .null,
});
},
else => |t| @panic(@tagName(t)),
};
switch (analyzer.peekToken()) {
.operator_comma => analyzer.consumeToken(),
.operator_semicolon => {},
else => |t| @panic(@tagName(t)),
}
operand_list.appendAssumeCapacity(node);
}
analyzer.consumeToken();
const instruction = try analyzer.addNode(.{
.id = .assembly_instruction,
.token = instruction_token,
.left = instruction_name,
.right = try analyzer.nodeList(&operand_list),
});
instruction_list.appendAssumeCapacity(instruction);
}
_ = try analyzer.expectToken(.operator_backtick);
_ = try analyzer.expectToken(.operator_right_parenthesis);
const assembly_block = try analyzer.addNode(.{
.id = .assembly_code_block,
.token = backtick,
.left = try analyzer.nodeList(&instruction_list),
.right = .null,
});
list.appendAssumeCapacity(assembly_block);
const intrinsic = try analyzer.addNode(.{
.id = .intrinsic,
.token = intrinsic_token,
.left = try analyzer.nodeList(&list),
.right = @enumFromInt(@intFromEnum(intrinsic_id)),
});
return intrinsic;
} else {
while (analyzer.peekToken() != .operator_right_parenthesis) {
const parameter = try analyzer.expression();
list.appendAssumeCapacity(parameter);
switch (analyzer.peekToken()) {
.operator_comma => analyzer.consumeToken(),
.operator_right_parenthesis => continue,
else => |t| @panic(@tagName(t)),
}
}
// Consume the right parenthesis
analyzer.consumeToken();
}
return try analyzer.addNode(.{
.id = .intrinsic,
.token = intrinsic_token,
.left = try analyzer.nodeList(&list),
.right = @enumFromInt(@intFromEnum(intrinsic_id)),
});
}
fn expression(analyzer: *Analyzer) anyerror!Node.Index {
return try analyzer.expressionPrecedence(0);
}
const PrecedenceOperator = enum {
compare_equal,
compare_not_equal,
compare_less,
compare_greater,
compare_less_equal,
compare_greater_equal,
add,
wrapping_add,
saturated_add,
sub,
wrapping_sub,
saturated_sub,
mul,
wrapping_mul,
saturated_mul,
div,
mod,
bit_and,
bit_xor,
bit_or,
bool_and,
bool_or,
shift_left,
shift_right,
@"catch",
@"orelse",
};
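// Binding powers for the precedence-climbing loop below; a larger number
// binds tighter. Multiplicative operators (70) > additive (60) > shifts (50)
// > bitwise and catch/orelse (40) > comparisons (30) > `and` (20) > `or` (10).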
const operator_precedence = std.EnumArray(PrecedenceOperator, i32).init(.{
.compare_equal = 30,
.compare_not_equal = 30,
.compare_less = 30,
.compare_greater = 30,
.compare_less_equal = 30,
.compare_greater_equal = 30,
.add = 60,
.wrapping_add = 60,
.saturated_add = 60,
.sub = 60,
.wrapping_sub = 60,
.saturated_sub = 60,
.mul = 70,
.wrapping_mul = 70,
.saturated_mul = 70,
.div = 70,
.mod = 70,
.bit_and = 40,
.bit_xor = 40,
.bit_or = 40,
.bool_or = 10,
.bool_and = 20,
.shift_left = 50,
.shift_right = 50,
.@"catch" = 40,
.@"orelse" = 40,
});
const operator_associativity = std.EnumArray(PrecedenceOperator, Associativity).init(.{
.compare_equal = .none,
.compare_not_equal = .none,
.compare_less = .none,
.compare_greater = .none,
.compare_less_equal = .none,
.compare_greater_equal = .none,
.add = .left,
.wrapping_add = .left,
.saturated_add = .left,
.sub = .left,
.wrapping_sub = .left,
.saturated_sub = .left,
.bit_and = .left,
.bit_xor = .left,
.bit_or = .left,
.bool_and = .left,
.bool_or = .left,
.mul = .left,
.wrapping_mul = .left,
.saturated_mul = .left,
.div = .left,
.mod = .left,
.shift_left = .left,
.shift_right = .left,
.@"catch" = .left,
.@"orelse" = .left,
});
const operator_node_id = std.EnumArray(PrecedenceOperator, Node.Id).init(.{
.compare_equal = .compare_equal,
.compare_not_equal = .compare_not_equal,
.compare_greater = .compare_greater,
.compare_less = .compare_less,
.compare_greater_equal = .compare_greater_equal,
.compare_less_equal = .compare_less_equal,
.add = .add,
.wrapping_add = .wrapping_add,
.saturated_add = .saturated_add,
.sub = .sub,
.wrapping_sub = .wrapping_sub,
.saturated_sub = .saturated_sub,
.bit_and = .bit_and,
.bit_xor = .bit_xor,
.bit_or = .bit_or,
.bool_and = .bool_and,
.bool_or = .bool_or,
.mul = .mul,
.wrapping_mul = .wrapping_mul,
.saturated_mul = .saturated_mul,
.div = .div,
.mod = .mod,
.shift_left = .shift_left,
.shift_right = .shift_right,
.@"catch" = .catch_expression,
.@"orelse" = .orelse_expression,
});
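// Classic precedence climbing: parse a prefix expression, then keep folding
// binary operators whose precedence is at least `minimum_precedence`,
// recursing with `precedence + 1` for the right operand to get left
// associativity. For example, `a + b * c` folds `b * c` inside the recursive
// call because mul (70) >= add (60) + 1, producing add(a, mul(b, c)).
// Non-associative operators (the comparisons) record their precedence in
// `banned_precedence`, so chaining such as `a < b < c` hits the
// `unreachable` below instead of silently associating.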
fn expressionPrecedence(analyzer: *Analyzer, minimum_precedence: i32) !Node.Index {
assert(minimum_precedence >= 0);
var result = try analyzer.prefixExpression();
// if (result != .null) {
// const prefix_node = analyzer.nodes.get(result);
// logln(.parser, .precedence, "Prefix: {s}", .{@tagName(prefix_node.id)});
// }
var banned_precedence: i32 = -1;
while (analyzer.hasTokens()) {
const token = analyzer.peekToken();
// logln("Looping in expression precedence with token {}", .{token});
const operator: PrecedenceOperator = switch (token) {
.operator_semicolon,
.operator_right_parenthesis,
.operator_right_brace,
.operator_right_bracket,
.operator_comma,
.operator_colon,
.operator_assign,
.operator_add_assign,
.operator_sub_assign,
.operator_mul_assign,
.operator_div_assign,
.operator_mod_assign,
.operator_or_assign,
.operator_dot,
.operator_double_dot,
.operator_triple_dot,
.operator_switch_case,
.fixed_keyword_const,
.fixed_keyword_var,
.fixed_keyword_return,
.fixed_keyword_if,
.fixed_keyword_else,
.identifier,
.discard,
.fixed_keyword_test,
.fixed_keyword_break,
.fixed_keyword_while,
=> break,
.operator_compare_equal => .compare_equal,
.operator_compare_not_equal => .compare_not_equal,
.operator_compare_less => .compare_less,
.operator_compare_greater => .compare_greater,
.operator_compare_less_equal => .compare_less_equal,
.operator_compare_greater_equal => .compare_greater_equal,
.operator_add => .add,
.operator_wrapping_add => .wrapping_add,
.operator_saturated_add => .saturated_add,
.operator_minus => .sub,
.operator_wrapping_sub => .wrapping_sub,
.operator_saturated_sub => .saturated_sub,
.operator_asterisk => .mul,
.operator_wrapping_mul => .wrapping_mul,
.operator_saturated_mul => .saturated_mul,
.operator_div => .div,
.operator_mod => .mod,
.operator_ampersand => .bit_and,
.operator_bar => .bit_or,
.operator_xor => .bit_xor,
.fixed_keyword_and => .bool_and,
.fixed_keyword_or => .bool_or,
.operator_shift_left => .shift_left,
.operator_shift_right => .shift_right,
.fixed_keyword_catch => .@"catch",
.fixed_keyword_orelse => .@"orelse",
else => |t| @panic(@tagName(t)),
};
// logln(.parser, .precedence, "Precedence operator: {s}", .{@tagName(operator)});
const precedence = operator_precedence.get(operator);
if (precedence < minimum_precedence) {
// logln(.parser, .precedence, "Breaking for minimum_precedence", .{});
break;
}
if (precedence == banned_precedence) {
unreachable;
}
const operator_token = analyzer.token_i;
analyzer.consumeToken();
const right = if (token == .fixed_keyword_catch and analyzer.peekToken() == .operator_bar) b: {
const payload = try analyzer.parsePayload();
const r_node = try analyzer.expressionPrecedence(precedence + 1);
break :b try analyzer.addNode(.{
.id = .catch_payload,
.token = operator_token,
.left = payload,
.right = r_node,
});
} else try analyzer.expressionPrecedence(precedence + 1);
const node_id = operator_node_id.get(operator);
result = try analyzer.addNode(.{
.id = node_id,
.token = operator_token,
.left = result,
.right = right,
});
const associativity = operator_associativity.get(operator);
if (associativity == .none) {
banned_precedence = precedence;
}
}
return result;
}
fn prefixExpression(analyzer: *Analyzer) !Node.Index {
const token = analyzer.token_i;
// logln("Prefix...", .{});
const node_id: Node.Id = switch (analyzer.peekToken()) {
.operator_bang => .boolean_not,
.operator_minus => .negation,
.operator_tilde => .one_complement,
.fixed_keyword_try => .try_expression,
else => return try analyzer.primaryExpression(),
};
return try analyzer.addNode(.{
.id = node_id,
.token = blk: {
analyzer.consumeToken();
break :blk token;
},
.left = try analyzer.prefixExpression(),
.right = Node.Index.null,
});
}
fn primaryExpression(analyzer: *Analyzer) !Node.Index {
const token = analyzer.token_i;
const result = switch (analyzer.peekToken()) {
.identifier => switch (analyzer.peekTokenAhead(1)) {
// TODO: tags
// .operator_colon => unreachable,
else => try analyzer.curlySuffixExpression(),
},
.string_literal,
.character_literal,
.number_literal,
.intrinsic,
.fixed_keyword_true,
.fixed_keyword_false,
.fixed_keyword_unreachable,
.fixed_keyword_null,
.fixed_keyword_switch,
.operator_dot,
.operator_left_parenthesis,
.keyword_signed_integer,
.keyword_unsigned_integer,
.fixed_keyword_ssize,
.fixed_keyword_usize,
.fixed_keyword_enum,
.fixed_keyword_struct,
.discard,
.fixed_keyword_undefined,
.operator_left_bracket,
.fixed_keyword_const,
.fixed_keyword_var,
.fixed_keyword_error,
=> try analyzer.curlySuffixExpression(),
.fixed_keyword_fn => try analyzer.function(),
.fixed_keyword_return => try analyzer.addNode(.{
.id = .@"return",
.token = blk: {
analyzer.consumeToken();
break :blk token;
},
.left = switch (analyzer.peekToken()) {
.operator_comma,
.operator_semicolon,
.operator_compare_equal,
=> Node.Index.null,
else => try analyzer.expression(),
},
.right = Node.Index.null,
}),
.fixed_keyword_break => try analyzer.breakExpression(),
.fixed_keyword_continue => try analyzer.continueExpression(),
// todo:?
.operator_left_brace => try analyzer.block(),
.fixed_keyword_if => try analyzer.ifExpression(),
.fixed_keyword_bitfield => try analyzer.processContainerType(.fixed_keyword_bitfield),
.operator_dollar => blk: {
analyzer.consumeToken();
const t = try analyzer.typeExpression();
break :blk try analyzer.addNode(.{
.id = .comptime_expression,
.token = token,
.left = t,
.right = .null,
});
},
else => |id| @panic(@tagName(id)),
};
return result;
}
fn curlySuffixExpression(analyzer: *Analyzer) !Node.Index {
const left = try analyzer.typeExpression();
return switch (analyzer.peekToken()) {
.operator_left_brace => try analyzer.containerLiteral(left),
else => left,
};
}
fn noReturn(analyzer: *Analyzer) !Node.Index {
const token_i = analyzer.token_i;
assert(analyzer.peekToken() == .fixed_keyword_noreturn);
analyzer.consumeToken();
return try analyzer.addNode(.{
.id = .keyword_noreturn,
.token = token_i,
.left = Node.Index.null,
.right = Node.Index.null,
});
}
fn boolLiteral(analyzer: *Analyzer) !Node.Index {
return try analyzer.addNode(.{
.id = switch (analyzer.peekToken()) {
.fixed_keyword_true => .keyword_true,
.fixed_keyword_false => .keyword_false,
else => unreachable,
},
.token = blk: {
const token_i = analyzer.token_i;
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
});
}
const PointerOrArrayTypeExpectedExpression = enum {
single_pointer_type,
many_pointer_type,
array_or_slice_type,
};
fn parseTermination(analyzer: *Analyzer) !Node.Index {
_ = try analyzer.expectToken(.operator_colon);
const token_i = analyzer.token_i;
const token = analyzer.peekToken();
const termination_id: Node.Id = switch (token) {
.fixed_keyword_null => .null_terminated,
.number_literal => switch (std.zig.parseNumberLiteral(analyzer.bytes(token_i))) {
.int => |integer| switch (integer) {
0 => .zero_terminated,
else => @panic("Invalid number literal terminator"),
},
else => @panic("Invalid number literal terminator"),
},
else => |t| @panic(@tagName(t)),
};
const termination_node_index = try analyzer.addNode(.{
.id = termination_id,
.token = token_i,
.left = Node.Index.null,
.right = Node.Index.null,
});
analyzer.consumeToken();
return termination_node_index;
}
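// Parses the three pointer-like type prefixes accepted by this grammar:
//   &T               single-item pointer
//   [&]T / [&:s]T    many-item pointer, optionally sentinel-terminated
//   []T / [N]T       slice or array, optionally sentinel-terminated
// plus an optional `const` qualifier for the pointer and slice forms. All
// modifiers are collected into a node list with the element type last.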
fn pointerOrArrayTypeExpression(analyzer: *Analyzer, expected: PointerOrArrayTypeExpectedExpression) !Node.Index {
const first = analyzer.token_i;
var list = Node.StackList{};
const expression_type: Node.Id = switch (expected) {
.single_pointer_type => blk: {
analyzer.consumeToken();
break :blk .pointer_type;
},
.many_pointer_type => blk: {
list.appendAssumeCapacity(try analyzer.addNode(.{
.id = .many_pointer_expression,
.token = analyzer.token_i,
.left = Node.Index.null,
.right = Node.Index.null,
}));
_ = try analyzer.expectToken(.operator_left_bracket);
_ = try analyzer.expectToken(.operator_ampersand);
switch (analyzer.peekToken()) {
.operator_right_bracket => {},
.operator_colon => list.appendAssumeCapacity(try analyzer.parseTermination()),
else => |t| @panic(@tagName(t)),
}
_ = try analyzer.expectToken(.operator_right_bracket);
break :blk .pointer_type;
},
.array_or_slice_type => blk: {
_ = try analyzer.expectToken(.operator_left_bracket);
switch (analyzer.peekToken()) {
.operator_right_bracket => {
analyzer.consumeToken();
break :blk .slice_type;
},
.operator_colon => {
list.appendAssumeCapacity(try analyzer.parseTermination());
_ = try analyzer.expectToken(.operator_right_bracket);
break :blk .slice_type;
},
else => {
const length_expression = try analyzer.expression();
list.appendAssumeCapacity(length_expression);
switch (analyzer.peekToken()) {
.operator_right_bracket => {},
.operator_colon => list.appendAssumeCapacity(try analyzer.parseTermination()),
else => |t| @panic(@tagName(t)),
}
_ = try analyzer.expectToken(.operator_right_bracket);
break :blk .array_type;
},
}
},
};
if (expression_type != .array_type) {
const const_node = switch (analyzer.peekToken()) {
.fixed_keyword_const => try analyzer.addNode(.{
.id = .const_expression,
.token = analyzer.token_i,
.left = Node.Index.null,
.right = Node.Index.null,
}),
else => Node.Index.null,
};
analyzer.consumeTokens(@intFromBool(analyzer.peekToken() == .fixed_keyword_const));
if (const_node != .null) {
list.appendAssumeCapacity(const_node);
}
} else {
assert(list.len > 0);
}
const type_expression = try analyzer.typeExpression();
assert(type_expression != .null);
list.appendAssumeCapacity(type_expression);
const node_list = try analyzer.nodeList(&list);
const node = Node{
.id = expression_type,
.token = first,
.left = node_list,
.right = Node.Index.null,
};
const node_index = try analyzer.addNode(node);
switch (analyzer.peekToken()) {
.operator_comma,
.operator_right_parenthesis,
.operator_left_brace,
.operator_assign,
.operator_semicolon,
=> {},
else => |t| @panic(@tagName(t)),
}
return node_index;
}
fn typeExpression(analyzer: *Analyzer) anyerror!Node.Index {
const first = analyzer.token_i;
return switch (analyzer.peekToken()) {
.operator_optional => blk: {
analyzer.consumeToken();
break :blk try analyzer.addNode(.{
.id = .optional_type,
.token = first,
.left = try analyzer.typeExpression(),
.right = Node.Index.null,
});
},
.operator_ampersand => try analyzer.pointerOrArrayTypeExpression(.single_pointer_type),
.operator_left_bracket => switch (analyzer.peekTokenAhead(1)) {
.operator_ampersand => try analyzer.pointerOrArrayTypeExpression(.many_pointer_type),
.operator_asterisk => @panic("Meant to use ampersand?"),
else => try analyzer.pointerOrArrayTypeExpression(.array_or_slice_type),
},
else => try analyzer.errorUnionExpression(),
};
}
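// Parses an optional error-union type: `*!T` pairs the anonymous "all errors"
// set with T, while `E!T` pairs an explicit error set expression with T. In
// both cases the resulting `error_union` node keeps the error set on the
// left and the payload type on the right.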
fn errorUnionExpression(analyzer: *Analyzer) !Node.Index {
const initial = analyzer.token_i;
if (analyzer.peekToken() == .operator_asterisk and analyzer.peekTokenAhead(1) == .operator_bang) {
const asterisk = try analyzer.expectToken(.operator_asterisk);
analyzer.consumeToken();
// if (analyzer.peekToken() == .operator_left_bracket) @breakpoint();
const type_node = try analyzer.typeExpression();
const all_errors_node = try analyzer.addNode(.{
.id = .all_errors,
.token = asterisk,
.left = .null,
.right = .null,
});
const error_union = try analyzer.addNode(.{
.id = .error_union,
.token = asterisk,
// All errors
.left = all_errors_node,
.right = type_node,
});
return error_union;
} else {
const suffix_expression = try analyzer.suffixExpression();
return switch (analyzer.peekToken()) {
.operator_bang => try analyzer.addNode(.{
.id = .error_union,
.token = blk: {
analyzer.consumeToken();
break :blk initial;
},
.left = suffix_expression,
.right = try analyzer.typeExpression(),
}),
else => suffix_expression,
};
}
}
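// Parses a primary type expression followed by any number of suffixes:
// postfix operators handled by `suffixOperator` (indexing, slicing, field
// access, and what appear to be `.&`, `.@` and `.?` for address-of,
// dereference and optional unwrap) as well as call syntax
// `callee(argument, name = argument, ...)`.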
fn suffixExpression(analyzer: *Analyzer) !Node.Index {
analyzer.suffix_depth += 1;
defer analyzer.suffix_depth -= 1;
var result = try analyzer.primaryTypeExpression();
while (true) {
const suffix_operator = try analyzer.suffixOperator(result);
if (suffix_operator != .null) {
result = suffix_operator;
} else {
if (analyzer.peekToken() == .operator_left_parenthesis) {
const left_parenthesis = analyzer.token_i;
analyzer.consumeToken();
var expression_list = Node.StackList{};
// logln(.parser, .suffix, "[DEPTH={}] Initializating suffix call-like expression", .{analyzer.suffix_depth});
while (analyzer.peekToken() != .operator_right_parenthesis) {
const current_token = analyzer.token_i;
// logln(.parser, .suffix, "[DEPTH={}] First token: {s}", .{ analyzer.suffix_depth, @tagName(analyzer.tokens[current_token].id) });
var parameter = try analyzer.expression();
// const parameter_node = analyzer.nodes.items[parameter.unwrap()];
// logln(.parser, .suffix, "[DEPTH={}] Parameter node: {s}", .{ analyzer.suffix_depth, @tagName(parameter_node.id) });
if (analyzer.peekToken() == .operator_assign) {
analyzer.consumeToken();
parameter = try analyzer.addNode(.{
.id = .named_argument,
.token = current_token,
.left = parameter,
.right = try analyzer.expression(),
});
}
expression_list.appendAssumeCapacity(parameter);
switch (analyzer.peekToken()) {
.operator_right_parenthesis => {},
.operator_comma => analyzer.consumeToken(),
.operator_colon, .operator_right_brace, .operator_right_bracket => unreachable,
.operator_dot => @panic("Unexpected period"), //panic("[DEPTH={}] Unexpected period", .{analyzer.suffix_depth}),
else => |t| @panic(@tagName(t)),
}
}
// logln(.parser, .suffix, "[DEPTH={}] Ending suffix call-like expression", .{analyzer.suffix_depth});
// logln(.parser, .suffix, "Callee node: {s}", .{@tagName(analyzer.nodes.get(result).id)});
_ = try analyzer.expectToken(.operator_right_parenthesis);
// const is_comma = analyzer.tokens[analyzer.token_i].id == .comma;
result = try analyzer.addNode(.{
.id = .call,
.token = left_parenthesis,
.left = result,
.right = try analyzer.nodeList(&expression_list),
});
} else {
return result;
}
}
}
unreachable;
}
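// Parses a brace-delimited literal for `type_node` (anonymous when it is
// .null). Each element is classified as either a field-name initializer
// (`.name = expr`) or a positional value; the two styles must not be mixed
// within one literal, and an empty literal picks its flavor from the type
// node (container guess, array, or fully anonymous).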
fn containerLiteral(analyzer: *Analyzer, type_node: Node.Index) anyerror!Node.Index {
const token = try analyzer.expectToken(.operator_left_brace);
var list = Node.StackList{};
const InitializationType = enum {
anonymous,
array_indices,
container_field_names,
empty_literal,
empty_container_literal_guess,
empty_array_literal,
};
var current_initialization: ?InitializationType = null;
while (analyzer.peekToken() != .operator_right_brace) {
const start_token = analyzer.token_i;
const iteration_initialization_type: InitializationType = switch (analyzer.peekToken()) {
.operator_dot => switch (analyzer.peekTokenAhead(1)) {
.identifier => switch (analyzer.peekTokenAhead(2)) {
.operator_assign => blk: {
analyzer.consumeTokens(3);
const field_expression_initializer = try analyzer.expression();
const field_initialization = try analyzer.addNode(.{
.id = .container_field_initialization,
.token = start_token,
.left = field_expression_initializer,
.right = Node.Index.null,
});
list.appendAssumeCapacity(field_initialization);
switch (analyzer.peekToken()) {
.operator_comma => analyzer.consumeToken(),
else => {},
}
break :blk .container_field_names;
},
else => |t| @panic(@tagName(t)),
},
else => blk: {
list.appendAssumeCapacity(try analyzer.anonymousExpression());
_ = try analyzer.expectToken(.operator_comma);
break :blk .anonymous;
},
},
.string_literal,
.identifier,
.number_literal,
.intrinsic,
.fixed_keyword_if,
=> blk: {
const field_expression_initializer = try analyzer.expression();
switch (analyzer.peekToken()) {
.operator_comma => analyzer.consumeToken(),
else => {},
}
list.appendAssumeCapacity(field_expression_initializer);
break :blk .anonymous;
},
else => |t| @panic(@tagName(t)),
};
if (current_initialization) |ci| {
if (ci != iteration_initialization_type) {
unreachable;
}
}
current_initialization = iteration_initialization_type;
}
_ = try analyzer.expectToken(.operator_right_brace);
const initialization: InitializationType = current_initialization orelse switch (type_node) {
.null => .empty_literal,
else => switch (analyzer.nodes.get(type_node).id) {
.identifier, .call => .empty_container_literal_guess,
.array_type => .empty_array_literal,
else => |t| @panic(@tagName(t)),
},
};
return try analyzer.addNode(.{
.id = switch (type_node) {
.null => switch (initialization) {
.container_field_names => .anonymous_container_literal,
.empty_literal => .anonymous_empty_literal,
.anonymous => .anonymous_array_literal,
else => |t| @panic(@tagName(t)),
},
else => switch (initialization) {
.container_field_names => .container_literal,
.empty_container_literal_guess => .empty_container_literal_guess,
.anonymous => .array_literal,
.empty_array_literal => .array_literal,
else => |t| @panic(@tagName(t)),
},
},
.token = token,
.left = type_node,
.right = try analyzer.nodeList(&list),
});
}
fn discardNode(analyzer: *Analyzer) !Node.Index {
const token = analyzer.token_i;
assert(analyzer.peekToken() == .discard);
analyzer.consumeToken();
return try analyzer.addNode(.{
.id = .discard,
.token = token,
.left = Node.Index.null,
.right = Node.Index.null,
});
}
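// Parses a struct/enum/bitfield container body, including an optional
// parenthesized parameter list after the keyword. A null `maybe_token_id`
// means the top-level file scope: no keyword or braces are expected and the
// whole file is parsed as an implicit struct (see `analyze` at the bottom).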
fn processContainerType(analyzer: *Analyzer, maybe_token_id: ?Token.Id) !Node.Index {
const token_i = if (maybe_token_id) |tid| try analyzer.expectToken(tid) else analyzer.token_i;
assert(@intFromEnum(analyzer.token_i) < analyzer.token_buffer.tokens.length);
const token_id = maybe_token_id orelse .fixed_keyword_struct;
const container_type: Compilation.ContainerType = switch (token_id) {
.fixed_keyword_struct => .@"struct",
.fixed_keyword_enum => .@"enum",
.fixed_keyword_bitfield => .bitfield,
else => unreachable,
};
const node_id: Node.Id = switch (token_id) {
.fixed_keyword_struct => .struct_type,
.fixed_keyword_enum => .enum_type,
.fixed_keyword_bitfield => .bitfield_type,
else => unreachable,
};
const parameters_node = if (analyzer.hasTokens() and analyzer.peekToken() == .operator_left_parenthesis) b: {
analyzer.consumeToken();
var list = Node.StackList{};
while (analyzer.peekToken() != .operator_right_parenthesis) {
const parameter_node = try analyzer.expression();
list.appendAssumeCapacity(parameter_node);
switch (analyzer.peekToken()) {
.operator_comma => analyzer.consumeToken(),
else => {},
}
}
analyzer.consumeToken();
break :b try analyzer.nodeList(&list);
} else Node.Index.null;
if (maybe_token_id) |_| _ = try analyzer.expectToken(.operator_left_brace);
var list = Node.StackList{};
while (analyzer.hasTokens() and analyzer.peekToken() != .operator_right_brace) {
const first = analyzer.token_i;
// logln(.parser, .container_members, "First token for container member: {s}", .{@tagName(analyzer.peekToken())});
const member_node_index: Node.Index = switch (analyzer.peekToken()) {
.fixed_keyword_comptime => switch (analyzer.peekTokenAhead(1)) {
.operator_left_brace => b: {
analyzer.consumeToken();
const comptime_block = try analyzer.block();
break :b try analyzer.addNode(.{
.id = .@"comptime",
.token = first,
.left = comptime_block,
.right = Node.Index.null,
});
},
else => |t| @panic(@tagName(t)),
},
.identifier,
.discard,
.string_literal,
=> b: {
analyzer.consumeToken();
switch (container_type) {
.@"struct",
.bitfield,
=> {
_ = try analyzer.expectToken(.operator_colon);
const field_type = try analyzer.typeExpression();
const field_default_node = if (analyzer.peekToken() == .operator_assign) f: {
analyzer.consumeToken();
const default_index = try analyzer.expression();
const default_node = analyzer.nodes.get(default_index);
assert(default_node.id != .node_list);
break :f default_index;
} else Node.Index.null;
_ = try analyzer.expectToken(.operator_comma);
const field_node = try analyzer.addNode(.{
.id = .container_field,
.token = first,
.left = field_type,
.right = field_default_node,
});
break :b field_node;
},
.@"enum" => {
const value_associated = switch (analyzer.peekToken()) {
.operator_comma => Node.Index.null,
else => value: {
analyzer.consumeToken();
break :value try analyzer.expression();
},
};
_ = try analyzer.expectToken(.operator_comma);
const enum_field_node = try analyzer.addNode(.{
.id = .enum_field,
.token = first,
.left = value_associated,
.right = Node.Index.null,
});
break :b enum_field_node;
},
}
},
.fixed_keyword_const, .fixed_keyword_var => try analyzer.symbolDeclaration(),
.fixed_keyword_test => try analyzer.testDeclaration(),
else => |t| @panic(@tagName(t)),
};
const member_node = analyzer.nodes.get(member_node_index);
// logln(.parser, .container_members, "Container member {s}", .{@tagName(member_node.id)});
assert(member_node.id != .identifier);
list.appendAssumeCapacity(member_node_index);
}
if (maybe_token_id) |_| _ = try analyzer.expectToken(.operator_right_brace);
// for (node_list.slice(), 0..) |member_node_index, index| {
// _ = index; // autofix
// const member_node = analyzer.nodes.get(member_node_index);
// if (member_node.id == .identifier) {
// const token_offset = analyzer.getTokenOffset(member_node.token);
// _ = token_offset; // autofix
// // std.debug.print("Node index #{} (list index {}):\n```\n{s}\n```\n", .{ Node.unwrap(member_node_index), index, analyzer.source_file[token_offset..] });
// // std.debug.print("ID: {s}\n", .{analyzer.bytes(member_node.token)});
// unreachable;
// }
// }
return try analyzer.addNode(.{
.id = node_id,
.token = token_i,
.left = try analyzer.nodeList(&list),
.right = parameters_node,
});
}
fn testDeclaration(analyzer: *Analyzer) !Node.Index {
const test_token = try analyzer.expectToken(.fixed_keyword_test);
const name_node: Node.Index = if (analyzer.peekToken() == .string_literal) try analyzer.addNode(.{
.id = .string_literal,
.token = b: {
const index = analyzer.token_i;
analyzer.consumeToken();
break :b index;
},
.left = .null,
.right = .null,
}) else .null;
const test_block = try analyzer.block();
return try analyzer.addNode(.{
.token = test_token,
.id = .test_declaration,
.left = test_block,
.right = name_node,
});
}
fn primaryTypeExpression(analyzer: *Analyzer) anyerror!Node.Index {
const token_i = analyzer.token_i;
const token = analyzer.peekToken();
return try switch (token) {
.fixed_keyword_type => try analyzer.addNode(.{
.id = .type,
.token = b: {
analyzer.consumeToken();
break :b token_i;
},
.left = .null,
.right = .null,
}),
.fixed_keyword_any => try analyzer.addNode(.{
.id = .any,
.token = b: {
analyzer.consumeToken();
break :b token_i;
},
.left = .null,
.right = .null,
}),
.fixed_keyword_Self => try analyzer.addNode(.{
.id = .self,
.token = b: {
analyzer.consumeToken();
break :b token_i;
},
.left = .null,
.right = .null,
}),
.fixed_keyword_fn => blk: {
analyzer.consumeToken();
break :blk analyzer.functionPrototype();
},
.string_literal => blk: {
analyzer.consumeToken();
break :blk analyzer.addNode(.{
.id = .string_literal,
.token = token_i,
.left = Node.Index.null,
.right = Node.Index.null,
});
},
.character_literal => blk: {
analyzer.consumeToken();
break :blk analyzer.addNode(.{
.id = .character_literal,
.token = token_i,
.left = Node.Index.null,
.right = Node.Index.null,
});
},
.number_literal => blk: {
analyzer.consumeToken();
break :blk analyzer.addNode(.{
.id = .number_literal,
.token = token_i,
.left = Node.Index.null,
.right = Node.Index.null,
});
},
.identifier => analyzer.identifierNode(),
.discard => try analyzer.discardNode(),
.fixed_keyword_noreturn => analyzer.noReturn(),
.fixed_keyword_true, .fixed_keyword_false => analyzer.boolLiteral(),
.fixed_keyword_undefined => analyzer.addNode(.{
.id = .undefined,
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.fixed_keyword_null => analyzer.addNode(.{
.id = .null_literal,
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.fixed_keyword_unreachable => analyzer.addNode(.{
.id = .@"unreachable",
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.intrinsic => analyzer.compilerIntrinsic(),
.fixed_keyword_bool => analyzer.addNode(.{
.id = .bool_type,
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.keyword_unsigned_integer, .keyword_signed_integer => |signedness| analyzer.addNode(.{
.id = switch (signedness) {
.keyword_unsigned_integer => .unsigned_integer_type,
.keyword_signed_integer => .signed_integer_type,
else => unreachable,
},
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = @enumFromInt(@as(u32, try std.fmt.parseInt(u16, b: {
const slice = analyzer.bytes(token_i)[1..];
if (slice.len == 0) unreachable;
break :b slice;
}, 10))),
.right = Node.Index.null,
}),
.fixed_keyword_usize, .fixed_keyword_ssize => |size_type| analyzer.addNode(.{
.id = switch (size_type) {
.fixed_keyword_usize => .usize_type,
.fixed_keyword_ssize => .ssize_type,
else => unreachable,
},
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.fixed_keyword_void => analyzer.addNode(.{
.id = .void_type,
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.fixed_keyword_switch => try analyzer.switchExpression(),
.operator_dot => try analyzer.anonymousExpression(),
.fixed_keyword_enum, .fixed_keyword_struct => try analyzer.processContainerType(token),
.operator_left_parenthesis => blk: {
analyzer.consumeToken();
const expr = try analyzer.expression();
_ = try analyzer.expectToken(.operator_right_parenthesis);
break :blk expr;
},
.fixed_keyword_error => blk: {
analyzer.consumeToken();
const backing_type: Node.Index = if (analyzer.peekToken() == .operator_left_parenthesis) b: {
analyzer.consumeToken();
const type_node = try analyzer.typeExpression();
_ = try analyzer.expectToken(.operator_right_parenthesis);
break :b type_node;
} else Node.Index.null;
_ = try analyzer.expectToken(.operator_left_brace);
var list = Node.StackList{};
while (analyzer.peekToken() != .operator_right_brace) {
const tok_i = analyzer.token_i;
const t_id = analyzer.peekToken();
const identifier = switch (t_id) {
.identifier => try analyzer.identifierNode(),
else => |t| @panic(@tagName(t)),
};
const value_associated = switch (analyzer.peekToken()) {
.operator_comma => Node.Index.null,
else => value: {
analyzer.consumeToken();
break :value try analyzer.expression();
},
};
_ = try analyzer.expectToken(.operator_comma);
const error_field_node = try analyzer.addNode(.{
.id = .error_field,
.token = tok_i,
.left = identifier,
.right = value_associated,
});
list.appendAssumeCapacity(error_field_node);
}
analyzer.consumeToken();
break :blk try analyzer.addNode(.{
.id = .error_type,
.token = token_i,
.left = try analyzer.nodeList(&list),
.right = backing_type,
});
},
.operator_ampersand => try analyzer.pointerOrArrayTypeExpression(.single_pointer_type),
else => |t| switch (t) {
.identifier => @panic(analyzer.bytes(token_i)),
else => @panic(@tagName(t)),
},
};
}
fn anonymousExpression(analyzer: *Analyzer) !Node.Index {
const token_i = analyzer.token_i;
_ = try analyzer.expectToken(.operator_dot);
return switch (analyzer.peekToken()) {
.identifier => try analyzer.addNode(.{
.id = .dot_literal,
.token = blk: {
analyzer.consumeToken();
break :blk token_i;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
.operator_left_brace => try analyzer.containerLiteral(Node.Index.null),
else => |t| @panic(@tagName(t)),
};
}
// TODO:
fn suffixOperator(analyzer: *Analyzer, left: Node.Index) !Node.Index {
const token = analyzer.token_i;
const result: Node.Index = switch (analyzer.peekToken()) {
.operator_left_bracket => blk: {
analyzer.consumeToken();
const index_expression = try analyzer.expression();
if (analyzer.peekToken() == .operator_double_dot) {
analyzer.consumeToken();
const range_end_expression = switch (analyzer.peekToken()) {
.operator_right_bracket => Node.Index.null,
else => try analyzer.expression(),
};
const slice_termination: Node.Index = if (analyzer.peekToken() == .operator_colon) b: {
analyzer.consumeToken();
const result = try analyzer.expression();
break :b result;
} else .null;
const slice_metadata = try analyzer.addNode(.{
.id = .slice_metadata,
.token = token,
.left = try analyzer.addNode(.{
.id = .range,
.token = token,
.left = index_expression,
.right = range_end_expression,
}),
.right = slice_termination,
});
_ = try analyzer.expectToken(.operator_right_bracket);
const slice = try analyzer.addNode(.{
.id = .slice,
.token = token,
.left = left,
.right = slice_metadata,
});
break :blk slice;
} else {
_ = try analyzer.expectToken(.operator_right_bracket);
break :blk try analyzer.addNode(.{
.id = .indexed_access,
.token = token,
.left = left,
.right = index_expression,
});
}
},
.operator_dot => switch (analyzer.peekTokenAhead(1)) {
.identifier => try analyzer.addNode(.{
.id = .field_access,
.token = blk: {
analyzer.consumeToken();
break :blk token;
},
.left = left,
.right = try analyzer.addNode(.{
.id = .identifier,
.token = blk: {
const t = analyzer.token_i;
analyzer.consumeToken();
break :blk t;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
}),
.string_literal => try analyzer.addNode(.{
.id = .field_access,
.token = blk: {
analyzer.consumeToken();
break :blk token;
},
.left = left,
.right = try analyzer.addNode(.{
.id = .string_literal,
.token = blk: {
const t = analyzer.token_i;
analyzer.consumeToken();
break :blk t;
},
.left = Node.Index.null,
.right = Node.Index.null,
}),
}),
.operator_ampersand => try analyzer.addNode(.{
.id = .address_of,
.token = blk: {
analyzer.consumeTokens(2);
break :blk token;
},
.left = left,
.right = Node.Index.null,
}),
.operator_at => try analyzer.addNode(.{
.id = .pointer_dereference,
.token = blk: {
analyzer.consumeTokens(2);
break :blk token;
},
.left = left,
.right = Node.Index.null,
}),
.operator_optional => try analyzer.addNode(.{
.id = .optional_unwrap,
.token = blk: {
analyzer.consumeToken();
break :blk token;
},
.left = left,
.right = blk: {
const t = analyzer.token_i;
analyzer.consumeToken();
break :blk @enumFromInt(@intFromEnum(t));
},
}),
else => |t| @panic(@tagName(t)),
},
else => Node.Index.null,
};
return result;
}
fn addNode(analyzer: *Analyzer, node: Node) !Node.Index {
const node_pointer = analyzer.nodes.append(node);
const node_index = analyzer.nodes.get_index(node_pointer);
// logln(.parser, .node_creation, "Adding node #{} {s} to file #{} (left: {}, right: {})", .{ Node.unwrap(node_index), @tagName(node.id), File.unwrap(analyzer.file_index), switch (node.left) {
// .null => 0xffff_ffff,
// else => Node.unwrap(node.left),
// }, switch (node.right) {
// .null => 0xffff_ffff,
// else => Node.unwrap(node.right),
// }});
// if (Logger.bitset.contains(.node_creation_detailed)) {
// const chunk_start = analyzer.lexer.offsets.items[node.token];
// const chunk_end = analyzer.lexer.offsets.items[node.token + 1];
// const chunk_from_start = analyzer.source_file[chunk_start..];
// const end = @min(200, chunk_end - chunk_start);
// const chunk = chunk_from_start[0..end];
// logln(.parser, .node_creation, "[SOURCE]: ```\n{s}\n```\n", .{chunk});
// }
// if (node.id == .identifier) {
// logln("Node identifier: {s}", .{analyzer.bytes(node.token)});
// }
return node_index;
}
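// Copies a stack-allocated scratch list into the arena and registers it in
// `node_lists`; the resulting `node_list` node smuggles the list's index in
// its `left` field, reusing Node.Index as a plain integer.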
fn nodeList(analyzer: *Analyzer, stack_list: *Node.StackList) !Node.Index {
const heap_list = try analyzer.arena.new_array(Node.Index, stack_list.len);
@memcpy(heap_list, stack_list.slice());
const index = analyzer.node_lists.length;
_ = analyzer.node_lists.append(heap_list);
return try analyzer.addNode(.{
.id = .node_list,
.token = @enumFromInt(0),
.left = @enumFromInt(index),
.right = Node.Index.null,
});
}
fn identifierNode(analyzer: *Analyzer) !Node.Index {
const identifier_token = analyzer.token_i;
const t = analyzer.peekToken();
assert(t == .identifier);
analyzer.consumeToken();
return try analyzer.addNode(.{
.id = .identifier,
.token = identifier_token,
.left = Node.Index.null,
.right = Node.Index.null,
});
}
};
// The top-level scope has no explicit container keyword or braces: the whole file is parsed as an implicit struct.
pub fn analyze(allocator: Allocator, my_allocator: *MyAllocator, arena: *Arena, lexer_result: lexer.Result, source_file: []const u8, token_buffer: *Token.Buffer, node_list: *PinnedArray(Node), node_lists: *PinnedArray([]const Node.Index)) !Result {
const start = std.time.Instant.now() catch unreachable;
var analyzer = Analyzer{
.lexer = lexer_result,
.token_buffer = token_buffer,
.source_file = source_file,
// .file_index = file_index,
.token_i = lexer_result.offset,
.allocator = allocator,
.my_allocator = my_allocator,
.nodes = node_list,
.node_lists = node_lists,
.arena = arena,
};
const main_node_index = try analyzer.processContainerType(null);
const end = std.time.Instant.now() catch unreachable;
return .{
.main_node_index = main_node_index,
.time = end.since(start),
};
}
pub const SymbolDeclaration = struct {
type_node: Node.Index,
initialization_node: Node.Index,
mutability_token: Token.Index,
};
const Associativity = enum {
none,
left,
};