323 lines
12 KiB
C++
323 lines
12 KiB
C++
|
/*
|
||
|
* Mr. 4th Dimention - Allen Webster
|
||
|
*
|
||
|
* 03.10.2019
|
||
|
*
|
||
|
* Parser that extracts an API from C++ source code.
|
||
|
*
|
||
|
*/
|
||
|
|
||
|
// TOP
|
||
|
|
||
|
/*
function:
api ( <identifier> ) function <identifier> {*} <identifier> ( <param_list> )

param_list:
void |
<identifier> {*} <identifier> {, <identifier> {*} <identifier>}

anything_else:
***

api_source:
{function|anything_else} EOF
*/
|
||
|
|
||
|
// Reports the iterator's current token, i.e. the result of token_it_read.
// This function itself never calls token_it_inc.
function Token*
api_parse__token_pos(Token_Iterator *it){
    Token *current = token_it_read(it);
    return(current);
}
|
||
|
|
||
|
// Tries to consume one token whose sub_kind equals the requested one.
// Returns true only when the current token is non-null, has the requested
// sub_kind, and token_it_inc reports success. On a sub_kind mismatch (or a
// null token) token_it_inc is never called.
function b32
api_parse__match(Token_Iterator *it, Token_Cpp_Kind sub_kind){
    Token *current = token_it_read(it);
    if (current == 0 || current->sub_kind != sub_kind){
        return(false);
    }
    if (!token_it_inc(it)){
        return(false);
    }
    return(true);
}
|
||
|
|
||
|
// Tries to consume one identifier or keyword token and report its text.
//  it     - token iterator to read from and advance.
//  source - the text the tokens were lexed from; the lexeme is a substring of it.
//  lexeme - out: receives the token's text. Written only when the function
//           returns true.
// Returns true when the current token is an identifier/keyword and
// token_it_inc succeeds; otherwise returns false and leaves *lexeme untouched.
function b32
api_parse__match_identifier(Token_Iterator *it, String_Const_u8 source, String_Const_u8 *lexeme){
    b32 match = false;
    Token *token = token_it_read(it);
    // Guard against a null token the same way api_parse__match does, so an
    // iterator with no current token is a failed match rather than a crash.
    if (token != 0 &&
        (token->kind == TokenBaseKind_Identifier ||
         token->kind == TokenBaseKind_Keyword)){
        if (token_it_inc(it)){
            *lexeme = string_substring(source, Ii64(token));
            match = true;
        }
    }
    return(match);
}
|
||
|
|
||
|
// Tries to consume one identifier or keyword token whose text equals the
// given null-terminated string.
//  it     - token iterator to read from and advance.
//  source - the text the tokens were lexed from.
//  lexeme - the exact spelling the token must have (e.g. "api", "void").
// Returns true when the current token is an identifier/keyword with that
// spelling and token_it_inc succeeds. On a kind or spelling mismatch
// token_it_inc is never called.
function b32
api_parse__match_identifier(Token_Iterator *it, String_Const_u8 source, char *lexeme){
    b32 match = false;
    Token *token = token_it_read(it);
    // Guard against a null token the same way api_parse__match does, so an
    // iterator with no current token is a failed match rather than a crash.
    if (token != 0 &&
        (token->kind == TokenBaseKind_Identifier ||
         token->kind == TokenBaseKind_Keyword) &&
        string_match(SCu8(lexeme), string_substring(source, Ii64(token)))){
        if (token_it_inc(it)){
            match = true;
        }
    }
    return(match);
}
|
||
|
|
||
|
// Builds the spelling of a pointer type: the base type name followed by
// star_counter '*' characters. When star_counter is not positive the input
// string is returned unchanged and nothing is allocated. Otherwise the new
// string is allocated from arena with one extra byte holding a 0 terminator
// that is not counted in the returned size.
function String_Const_u8
api_parse__type_name_with_stars(Arena *arena, String_Const_u8 type, i32 star_counter){
    if (star_counter <= 0){
        return(type);
    }
    i32 total_size = (i32)(type.size) + star_counter;
    u8 *buffer = push_array(arena, u8, total_size + 1);
    u8 *stars = buffer + type.size;
    block_copy(buffer, type.str, type.size);
    block_fill_u8(stars, star_counter, (u8)'*');
    buffer[total_size] = 0;
    return(SCu8(buffer, total_size));
}
|
||
|
|
||
|
// Appends one parameter to the end of list.
// The stored type name is the base type with star_counter '*' characters
// appended (see api_parse__type_name_with_stars); the API_Param node is
// allocated from arena and list->count is incremented.
function void
api_parse_add_param(Arena *arena, API_Param_List *list, String_Const_u8 type, i32 star_counter, String_Const_u8 name){
    String_Const_u8 full_type = api_parse__type_name_with_stars(arena, type, star_counter);
    API_Param *node = push_array(arena, API_Param, 1);
    node->type_name = full_type;
    node->name = name;
    sll_queue_push(list->first, list->last, node);
    list->count += 1;
}
|
||
|
|
||
|
// Records one parsed function in the API named api_name.
// The API definition is obtained through api_get_api, the return type is
// spelled with star_counter trailing '*' characters, a call is created with
// api_call_with_location, and param_list is attached to that call.
function void
api_parse_add_function(Arena *arena, API_Definition_List *list,
                       String_Const_u8 api_name, String_Const_u8 func_name,
                       String_Const_u8 type, i32 star_counter, API_Param_List param_list,
                       String_Const_u8 location){
    API_Definition *definition = api_get_api(arena, list, api_name);
    String_Const_u8 return_type = api_parse__type_name_with_stars(arena, type, star_counter);
    API_Call *new_call = api_call_with_location(arena, definition, func_name, return_type, location);
    api_set_param_list(new_call, param_list);
}
|
||
|
|
||
|
// Records one parsed struct/union in the API named api_name by forwarding
// everything to api_type_structure_with_location on the definition returned
// by api_get_api.
function void
api_parse_add_structure(Arena *arena, API_Definition_List *list,
                        String_Const_u8 api_name, API_Type_Structure_Kind kind,
                        String_Const_u8 name, List_String_Const_u8 member_list,
                        String_Const_u8 definition, String_Const_u8 location){
    api_type_structure_with_location(arena, api_get_api(arena, list, api_name),
                                     kind, name, member_list, definition, location);
}
|
||
|
|
||
|
// Formats a "<source_name>:<line>:<column>:" string for the byte at pos.
// Line and column both start at 1. They are computed by scanning source from
// its first byte up to (not including) pos: each '\n' starts a new line and
// resets the column, every other byte advances the column by one.
// When pos does not point inside source the result reports line 1, column 1.
function String_Const_u8
api_parse_location(Arena *arena, String_Const_u8 source_name, String_Const_u8 source, u8 *pos){
    i32 line = 1;
    i32 column = 1;
    u8 *begin = source.str;
    u8 *end = begin + source.size;
    if (begin <= pos && pos < end){
        for (u8 *cursor = begin; cursor != pos; cursor += 1){
            if (*cursor == '\n'){
                line += 1;
                column = 1;
            }
            else{
                column += 1;
            }
        }
    }
    return(push_u8_stringf(arena, "%.*s:%d:%d:", string_expand(source_name), line, column));
}
|
||
|
|
||
|
// Parses the part of an API function declaration that follows the
// "function" keyword:
//     <identifier> {*} <identifier> ( <param_list> )
// and, on success, records the function in the API named api_name.
//  arena       - allocator for parameter nodes, type strings and the location.
//  source_name - name used in the recorded "<name>:<line>:<col>:" location.
//  source      - the text the tokens were lexed from.
//  token_it    - iterator positioned just after "function"; it is advanced
//                past every token that was matched, even when parsing fails.
//  list        - API definition list that receives the function.
// Returns true when the whole declaration matched and was recorded.
// NOTE: a parameter list that starts with the identifier "void" is treated as
// the empty list and must be followed directly by ')', so a first parameter
// spelled "void *p" does not parse.
function b32
api_parse_source__function(Arena *arena, String_Const_u8 source_name, String_Const_u8 source, Token_Iterator *token_it, String_Const_u8 api_name, API_Definition_List *list){
    b32 result = false;
    String_Const_u8 ret_type = {};
    i32 ret_type_star_counter = 0;
    String_Const_u8 func_name = {};
    API_Param_List param_list = {};
    if (api_parse__match_identifier(token_it, source, &ret_type)){
        // Count the pointer stars that follow the return type.
        for (;api_parse__match(token_it, TokenCppKind_Star);){
            ret_type_star_counter += 1;
        }
        if (api_parse__match_identifier(token_it, source, &func_name)){
            if (api_parse__match(token_it, TokenCppKind_ParenOp)){
                b32 param_list_success = false;
                if (api_parse__match_identifier(token_it, source, "void")){
                    param_list_success = true;
                }
                else{
                    // One iteration per "<type> {*} <name>" parameter.
                    for (;;){
                        String_Const_u8 type = {};
                        i32 star_counter = 0;
                        String_Const_u8 name = {};
                        if (api_parse__match_identifier(token_it, source, &type)){
                            for (;api_parse__match(token_it, TokenCppKind_Star);){
                                star_counter += 1;
                            }
                            if (api_parse__match_identifier(token_it, source, &name)){
                                param_list_success = true;
                            }
                            else{
                                break;
                            }
                        }
                        else{
                            break;
                        }
                        if (param_list_success){
                            api_parse_add_param(arena, &param_list, type, star_counter, name);
                        }
                        if (api_parse__match(token_it, TokenCppKind_Comma)){
                            // A comma promises another parameter; the list is
                            // only valid again once that parameter parses.
                            param_list_success = false;
                        }
                        else{
                            break;
                        }
                    }
                }
                if (param_list_success){
                    if (api_parse__match(token_it, TokenCppKind_ParenCl)){
                        result = true;
                    }
                }
            }
        }
    }
    if (result){
        // The recorded location is the position of the function's name.
        String_Const_u8 location = api_parse_location(arena, source_name, source, func_name.str);
        api_parse_add_function(arena, list, api_name, func_name, ret_type, ret_type_star_counter, param_list, location);
    }
    return(result);
}
|
||
|
|
||
|
// Rebuilds source text from the tokens in [token, token_end): the text of
// every token that is neither a comment nor whitespace is collected in order
// and the pieces are flattened into a single string allocated from arena.
function String_Const_u8
api_parse__restringize_token_range(Arena *arena, String_Const_u8 source, Token *token, Token *token_end){
    List_String_Const_u8 pieces = {};
    for (Token *cursor = token; cursor < token_end; cursor += 1){
        b32 is_comment = (cursor->kind == TokenBaseKind_Comment);
        b32 is_whitespace = (cursor->kind == TokenBaseKind_Whitespace);
        // TODO(allen): if there is a newline, emit it, all other whitespace is managed automatically.
        if (!is_comment && !is_whitespace){
            string_list_push(arena, &pieces, string_substring(source, Ii64(cursor)));
        }
    }
    return(string_list_flatten(arena, pieces));
}
|
||
|
|
||
|
// Parses the part of an API struct/union declaration that follows the
// "struct"/"union" keyword and, on success, records it in the API named
// api_name. Two forms are accepted:
//     <identifier> ;
//     <identifier> { ... } ;
//  arena       - allocator for the member list and the location string.
//  source_name - name used in the recorded "<name>:<line>:<col>:" location.
//  source      - the text the tokens were lexed from.
//  kind        - whether a struct or a union is being recorded.
//  token_it    - iterator positioned just after the keyword; it is advanced
//                past every token that was consumed, even when parsing fails.
//  list        - API definition list that receives the structure.
// Returns true when the declaration matched and was recorded.
// Inside the braces, every identifier/keyword immediately followed by ';' is
// recorded as a member name; all other tokens are skipped. The first '}'
// encountered ends the body.
function b32
api_parse_source__structure(Arena *arena, String_Const_u8 source_name, String_Const_u8 source, API_Type_Structure_Kind kind, Token_Iterator *token_it, String_Const_u8 api_name, API_Definition_List *list){
    b32 result = false;
    String_Const_u8 name = {};
    List_String_Const_u8 member_list = {};
    Token *token = api_parse__token_pos(token_it);
    (void)token;
    if (api_parse__match_identifier(token_it, source, &name)){
        if (api_parse__match(token_it, TokenCppKind_Semicolon)){
            result = true;
        }
        else if (api_parse__match(token_it, TokenCppKind_BraceOp)){
            b32 member_list_success = false;
            for (;;){
                String_Const_u8 member_name = {};
                if (api_parse__match(token_it, TokenCppKind_BraceCl)){
                    member_list_success = true;
                    break;
                }
                else if (api_parse__match_identifier(token_it, source, &member_name)){
                    if (api_parse__match(token_it, TokenCppKind_Semicolon)){
                        string_list_push(arena, &member_list, member_name);
                    }
                }
                else{
                    if (!token_it_inc(token_it)){
                        break;
                    }
                }
            }
            if (member_list_success){
                // The closing brace was already consumed by the loop above,
                // so only the terminating ';' is left to match. Requiring a
                // second '}' here would reject every ordinary
                // "struct X { ... };" definition.
                if (api_parse__match(token_it, TokenCppKind_Semicolon)){
                    result = true;
                }
            }
        }
    }
    if (result){
        Token *token_end = api_parse__token_pos(token_it);
        (void)token_end;
        // TODO(allen):
        String_Const_u8 definition = {};
        // The recorded location is the position of the structure's name.
        String_Const_u8 location = api_parse_location(arena, source_name, source, name.str);
        api_parse_add_structure(arena, list, api_name, kind, name, member_list, definition, location);
    }
    return(result);
}
|
||
|
|
||
|
// Parses a structure declaration as a struct: forwards to
// api_parse_source__structure with APITypeStructureKind_Struct and returns
// its result.
function b32
api_parse_source__struct(Arena *arena, String_Const_u8 source_name, String_Const_u8 source, Token_Iterator *token_it, String_Const_u8 api_name, API_Definition_List *list){
    b32 parsed = api_parse_source__structure(arena, source_name, source,
                                             APITypeStructureKind_Struct,
                                             token_it, api_name, list);
    return(parsed);
}
|
||
|
|
||
|
// Parses a structure declaration as a union: forwards to
// api_parse_source__structure with APITypeStructureKind_Union and returns
// its result.
function b32
api_parse_source__union(Arena *arena, String_Const_u8 source_name, String_Const_u8 source, Token_Iterator *token_it, String_Const_u8 api_name, API_Definition_List *list){
    b32 parsed = api_parse_source__structure(arena, source_name, source,
                                             APITypeStructureKind_Union,
                                             token_it, api_name, list);
    return(parsed);
}
|
||
|
|
||
|
// Lexes source as C++ and scans the tokens for API declarations of the form
//     api ( <identifier> ) function ...
//     api ( <identifier> ) struct ...
//     api ( <identifier> ) union ...
// Every declaration that parses is added to list under the API named by the
// identifier in parentheses. Tokens that do not start such a declaration are
// skipped one at a time. Scanning stops at the EOF token, when there is no
// current token, or when the iterator cannot advance.
//  arena       - allocator for the token list and everything recorded.
//  source_name - name used in recorded locations.
//  source      - the text to parse.
//  list        - API definition list that receives the results.
function void
api_parse_source_add_to_list(Arena *arena, String_Const_u8 source_name, String_Const_u8 source, API_Definition_List *list){
    Token_List token_list = lex_full_input_cpp(arena, source);
    Token_Iterator token_it = token_iterator(token_iterator(0, &token_list));

    for (;;){
        Token *token = token_it_read(&token_it);
        // A null token is handled like EOF so an iterator with no current
        // token ends the scan instead of being dereferenced.
        if (token == 0 || token->sub_kind == TokenCppKind_EOF){
            break;
        }

        if (api_parse__match_identifier(&token_it, source, "api")){
            String_Const_u8 api_name = {};
            // Short-circuit evaluation keeps the original left-to-right
            // matching: each step runs only if the previous one matched.
            if (api_parse__match(&token_it, TokenCppKind_ParenOp) &&
                api_parse__match_identifier(&token_it, source, &api_name) &&
                api_parse__match(&token_it, TokenCppKind_ParenCl)){
                if (api_parse__match_identifier(&token_it, source, "function")){
                    api_parse_source__function(arena, source_name, source, &token_it, api_name, list);
                }
                else if (api_parse__match_identifier(&token_it, source, "struct")){
                    api_parse_source__struct(arena, source_name, source, &token_it, api_name, list);
                }
                else if (api_parse__match_identifier(&token_it, source, "union")){
                    api_parse_source__union(arena, source_name, source, &token_it, api_name, list);
                }
            }
        }
        else{
            if (!token_it_inc(&token_it)){
                break;
            }
        }
    }
}
|
||
|
|
||
|
// Parses source and returns a fresh API definition list holding every API
// declaration found in it. Starts from an empty list and fills it with
// api_parse_source_add_to_list.
function API_Definition_List
api_parse_source(Arena *arena, String_Const_u8 source_name, String_Const_u8 source){
    API_Definition_List result = {};
    api_parse_source_add_to_list(arena, source_name, source, &result);
    return(result);
}
|
||
|
|
||
|
// BOTTOM
|
||
|
|