2016-11-02 03:27:51 +00:00
/*
* Mr . 4 th Dimention - Allen Webster
*
* 01.11 .2016
*
* meta - compilation core system
*
*/
// TOP
2017-01-23 06:19:43 +00:00
# if !defined(META_PARSER_CPP)
# define META_PARSER_CPP
2016-11-02 03:27:51 +00:00
typedef struct Parse_Context {
Cpp_Token * token_s ;
Cpp_Token * token_e ;
Cpp_Token * token ;
char * data ;
} Parse_Context ;
typedef struct Argument {
String param_string ;
String param_name ;
} Argument ;
typedef struct Argument_Breakdown {
int32_t count ;
Argument * args ;
} Argument_Breakdown ;
typedef struct Documentation {
int32_t param_count ;
String * param_name ;
String * param_docs ;
String return_doc ;
String main_doc ;
int32_t see_also_count ;
String * see_also ;
} Documentation ;
typedef enum Item_Type {
Item_Null ,
Item_Function ,
Item_CppName ,
Item_Macro ,
Item_Typedef ,
Item_Struct ,
Item_Union ,
Item_Enum ,
Item_Type_Count ,
# define Item_Type_User0 Item_Type_Count
} Item_Type ;
typedef struct Item_Node {
int32_t t ;
String cpp_name ;
String name ;
String ret ;
String args ;
String body ;
String marker ;
String value ;
String type ;
String type_postfix ;
String doc_string ;
Argument_Breakdown breakdown ;
Documentation doc ;
Item_Node * first_child ;
Item_Node * next_sibling ;
} Item_Node ;
typedef struct Item_Set {
Item_Node * items ;
int32_t count ;
} Item_Set ;
typedef struct Parse {
String code ;
Cpp_Token_Array tokens ;
int32_t item_count ;
} Parse ;
typedef struct Meta_Unit {
Item_Set set ;
Parse * parse ;
int32_t count ;
} Meta_Unit ;
typedef struct Meta_Keywords {
String key ;
Item_Type type ;
} Meta_Keywords ;
typedef struct Used_Links {
String * strs ;
int32_t count , max ;
} Used_Links ;
static Item_Node null_item_node = { 0 } ;
static String
str_start_end ( char * data , int32_t start , int32_t end ) {
return ( make_string ( data + start , end - start ) ) ;
}
static String
get_lexeme ( Cpp_Token token , char * code ) {
String str = make_string ( code + token . start , token . size ) ;
return ( str ) ;
}
static Parse_Context
setup_parse_context ( char * data , Cpp_Token_Array array ) {
Parse_Context context ;
context . token_s = array . tokens ;
context . token_e = array . tokens + array . count ;
context . token = context . token_s ;
context . data = data ;
return ( context ) ;
}
static Parse_Context
setup_parse_context ( Parse parse ) {
Parse_Context context ;
context . token_s = parse . tokens . tokens ;
context . token_e = parse . tokens . tokens + parse . tokens . count ;
context . token = context . token_s ;
context . data = parse . code . str ;
return ( context ) ;
}
static Cpp_Token *
get_token ( Parse_Context * context ) {
Cpp_Token * result = context - > token ;
if ( result > = context - > token_e ) {
result = 0 ;
}
return ( result ) ;
}
static Cpp_Token *
get_next_token ( Parse_Context * context ) {
Cpp_Token * result = context - > token + 1 ;
context - > token = result ;
if ( result > = context - > token_e ) {
result = 0 ;
context - > token = context - > token_e ;
}
return ( result ) ;
}
static Cpp_Token *
get_prev_token ( Parse_Context * context ) {
Cpp_Token * result = context - > token - 1 ;
if ( result < context - > token_s ) {
result = 0 ;
}
else {
context - > token = result ;
}
return ( result ) ;
}
static Cpp_Token *
can_back_step ( Parse_Context * context ) {
Cpp_Token * result = context - > token - 1 ;
if ( result < context - > token_s ) {
result = 0 ;
}
return ( result ) ;
}
static Cpp_Token *
set_token ( Parse_Context * context , Cpp_Token * token ) {
Cpp_Token * result = 0 ;
if ( token > = context - > token_s & & token < context - > token_e ) {
context - > token = token ;
result = token ;
}
return ( result ) ;
}
static String
str_alloc ( Partition * part , int32_t cap ) {
return ( make_string_cap ( push_array ( part , char , cap ) , 0 , cap ) ) ;
}
static Item_Set
allocate_item_set ( Partition * part , int32_t count ) {
Item_Set item_set = { 0 } ;
if ( count > 0 ) {
item_set . items = push_array ( part , Item_Node , count ) ;
item_set . count = count ;
memset ( item_set . items , 0 , sizeof ( Item_Node ) * count ) ;
}
return ( item_set ) ;
}
static String
file_dump ( char * filename ) {
String result = { 0 } ;
FILE * file = fopen ( filename , " rb " ) ;
if ( file ) {
fseek ( file , 0 , SEEK_END ) ;
result . size = ftell ( file ) ;
fseek ( file , 0 , SEEK_SET ) ;
result . memory_size = result . size + 1 ;
result . str = ( char * ) malloc ( result . memory_size ) ;
fread ( result . str , 1 , result . size , file ) ;
result . str [ result . size ] = 0 ;
fclose ( file ) ;
}
return ( result ) ;
}
static Parse
meta_lex ( char * filename ) {
Parse result = { 0 } ;
result . code = file_dump ( filename ) ;
2017-01-23 06:19:43 +00:00
if ( result . code . str ! = 0 ) {
result . tokens = cpp_make_token_array ( 1024 ) ;
cpp_lex_file ( result . code . str , result . code . size , & result . tokens ) ;
}
2016-11-02 03:27:51 +00:00
return ( result ) ;
}
static String
get_first_line ( String source ) {
String line = { 0 } ;
int32_t pos = find_s_char ( source , 0 , ' \n ' ) ;
line = substr ( source , 0 , pos ) ;
return ( line ) ;
}
static String
get_next_line ( String source , String line ) {
String next = { 0 } ;
int32_t pos = ( int32_t ) ( line . str - source . str ) + line . size ;
int32_t start = 0 ;
if ( pos < source . size ) {
2017-01-23 06:19:43 +00:00
Assert ( source . str [ pos ] = = ' \n ' ) ;
2016-11-02 03:27:51 +00:00
start = pos + 1 ;
if ( start < source . size ) {
pos = find_s_char ( source , start , ' \n ' ) ;
next = substr ( source , start , pos - start ) ;
}
}
return ( next ) ;
}
static int32_t
is_comment ( String str ) {
int32_t result = 0 ;
if ( str . size > = 2 ) {
if ( str . str [ 0 ] = = ' / ' & &
str . str [ 1 ] = = ' / ' ) {
result = 1 ;
}
}
return ( result ) ;
}
typedef enum Doc_Note_Type {
DOC_PARAM ,
DOC_RETURN ,
DOC ,
DOC_SEE ,
DOC_HIDE ,
HIDE_MEMBERS ,
} Doc_Note_Type ;
static String
2017-03-17 04:48:27 +00:00
defined_doc_notes [ ] = {
2016-11-02 03:27:51 +00:00
make_lit_string ( " DOC_PARAM " ) ,
make_lit_string ( " DOC_RETURN " ) ,
make_lit_string ( " DOC " ) ,
make_lit_string ( " DOC_SEE " ) ,
make_lit_string ( " DOC_HIDE " ) ,
make_lit_string ( " HIDE_MEMBERS " ) ,
} ;
static int32_t
check_and_fix_docs ( String * doc_string ) {
int32_t result = false ;
if ( doc_string - > size > 4 ) {
if ( doc_string - > str [ 0 ] = = ' / ' ) {
if ( doc_string - > str [ 1 ] = = ' * ' ) {
if ( doc_string - > str [ doc_string - > size - 2 ] = = ' * ' ) {
if ( doc_string - > str [ doc_string - > size - 1 ] = = ' / ' ) {
result = true ;
doc_string - > str + = 2 ;
doc_string - > size - = 4 ;
}
}
}
}
}
return ( result ) ;
}
static int32_t
get_doc_string_from_prev ( Parse_Context * context , String * doc_string ) {
int32_t result = false ;
if ( can_back_step ( context ) ) {
Cpp_Token * prev_token = get_token ( context ) - 1 ;
if ( prev_token - > type = = CPP_TOKEN_COMMENT ) {
* doc_string = get_lexeme ( * prev_token , context - > data ) ;
if ( check_and_fix_docs ( doc_string ) ) {
result = true ;
}
else {
* doc_string = null_string ;
}
}
}
return ( result ) ;
}
static String
doc_parse_note ( String source , int32_t * pos ) {
String result = { 0 } ;
int32_t p = * pos ;
int32_t start = p ;
for ( ; p < source . size ; + + p ) {
if ( source . str [ p ] = = ' ( ' ) {
break ;
}
}
if ( p ! = source . size ) {
result = make_string ( source . str + start , p - start ) ;
result = skip_chop_whitespace ( result ) ;
}
* pos = p ;
return ( result ) ;
}
static String
doc_parse_note_string ( String source , int32_t * pos ) {
String result = { 0 } ;
2017-01-23 06:19:43 +00:00
Assert ( source . str [ * pos ] = = ' ( ' ) ;
2016-11-02 03:27:51 +00:00
int32_t p = * pos + 1 ;
int32_t start = p ;
int32_t nest_level = 0 ;
for ( ; p < source . size ; + + p ) {
if ( source . str [ p ] = = ' ) ' ) {
if ( nest_level = = 0 ) {
break ;
}
else {
- - nest_level ;
}
}
else if ( source . str [ p ] = = ' ( ' ) {
+ + nest_level ;
}
}
if ( p ! = source . size ) {
result = make_string ( source . str + start , p - start ) ;
result = skip_chop_whitespace ( result ) ;
+ + p ;
}
* pos = p ;
return ( result ) ;
}
static String
doc_parse_parameter ( String source , int32_t * pos ) {
String result = { 0 } ;
int32_t p = * pos ;
int32_t start = p ;
for ( ; p < source . size ; + + p ) {
if ( source . str [ p ] = = ' , ' ) {
break ;
}
}
if ( p ! = source . size ) {
result = make_string ( source . str + start , p - start ) ;
result = skip_chop_whitespace ( result ) ;
+ + p ;
}
* pos = p ;
return ( result ) ;
}
static String
doc_parse_last_parameter ( String source , int32_t * pos ) {
String result = { 0 } ;
int32_t p = * pos ;
int32_t start = p ;
for ( ; p < source . size ; + + p ) {
if ( source . str [ p ] = = ' ) ' ) {
break ;
}
}
if ( p = = source . size ) {
result = make_string ( source . str + start , p - start ) ;
result = skip_chop_whitespace ( result ) ;
}
* pos = p ;
return ( result ) ;
}
static void
perform_doc_parse ( Partition * part , String doc_string , Documentation * doc ) {
int32_t keep_parsing = true ;
int32_t pos = 0 ;
int32_t param_count = 0 ;
int32_t see_count = 0 ;
do {
String doc_note = doc_parse_note ( doc_string , & pos ) ;
if ( doc_note . size = = 0 ) {
keep_parsing = false ;
}
else {
int32_t doc_note_type ;
2017-03-17 04:48:27 +00:00
if ( string_set_match ( defined_doc_notes , ArrayCount ( defined_doc_notes ) , doc_note , & doc_note_type ) ) {
2016-11-02 03:27:51 +00:00
doc_parse_note_string ( doc_string , & pos ) ;
switch ( doc_note_type ) {
case DOC_PARAM : + + param_count ; break ;
case DOC_SEE : + + see_count ; break ;
}
}
}
} while ( keep_parsing ) ;
if ( param_count + see_count > 0 ) {
int32_t memory_size = sizeof ( String ) * ( 2 * param_count + see_count ) ;
doc - > param_name = push_array ( part , String , memory_size ) ;
doc - > param_docs = doc - > param_name + param_count ;
doc - > see_also = doc - > param_docs + param_count ;
doc - > param_count = param_count ;
doc - > see_also_count = see_count ;
}
int32_t param_index = 0 ;
int32_t see_index = 0 ;
keep_parsing = true ;
pos = 0 ;
do {
String doc_note = doc_parse_note ( doc_string , & pos ) ;
if ( doc_note . size = = 0 ) {
keep_parsing = false ;
}
else {
int32_t doc_note_type ;
2017-03-17 04:48:27 +00:00
if ( string_set_match ( defined_doc_notes , ArrayCount ( defined_doc_notes ) , doc_note , & doc_note_type ) ) {
2016-11-02 03:27:51 +00:00
String doc_note_string = doc_parse_note_string ( doc_string , & pos ) ;
switch ( doc_note_type ) {
case DOC_PARAM :
{
2017-01-23 06:19:43 +00:00
Assert ( param_index < param_count ) ;
2016-11-02 03:27:51 +00:00
int32_t param_pos = 0 ;
String param_name = doc_parse_parameter ( doc_note_string , & param_pos ) ;
String param_docs = doc_parse_last_parameter ( doc_note_string , & param_pos ) ;
doc - > param_name [ param_index ] = param_name ;
doc - > param_docs [ param_index ] = param_docs ;
+ + param_index ;
} break ;
case DOC_RETURN :
{
doc - > return_doc = doc_note_string ;
} break ;
case DOC :
{
doc - > main_doc = doc_note_string ;
} break ;
case DOC_SEE :
{
2017-01-23 06:19:43 +00:00
Assert ( see_index < see_count ) ;
2016-11-02 03:27:51 +00:00
doc - > see_also [ see_index + + ] = doc_note_string ;
} break ;
}
}
else {
fprintf ( stderr , " warning: invalid doc note %.*s \n " , doc_note . size , doc_note . str ) ;
}
}
} while ( keep_parsing ) ;
}
static int32_t
struct_parse ( Partition * part , int32_t is_struct ,
Parse_Context * context , Item_Node * top_member ) ;
static int32_t
struct_parse_member ( Partition * part , Parse_Context * context , Item_Node * member ) {
int32_t result = false ;
Cpp_Token * token = get_token ( context ) ;
String doc_string = { 0 } ;
get_doc_string_from_prev ( context , & doc_string ) ;
Cpp_Token * start_token = token ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_SEMICOLON ) {
break ;
}
}
if ( token ) {
String name = { 0 } ;
Cpp_Token * token_j = 0 ;
int32_t nest_level = 0 ;
for ( ; ( token_j = get_token ( context ) ) > start_token ; get_prev_token ( context ) ) {
if ( token_j - > type = = CPP_TOKEN_BRACKET_CLOSE ) {
+ + nest_level ;
}
else if ( token_j - > type = = CPP_TOKEN_BRACKET_OPEN ) {
- - nest_level ;
if ( nest_level < 0 ) {
break ;
}
}
if ( nest_level = = 0 ) {
if ( token_j - > type = = CPP_TOKEN_IDENTIFIER ) {
break ;
}
}
}
name = skip_chop_whitespace ( get_lexeme ( * token_j , context - > data ) ) ;
String type = skip_chop_whitespace ( str_start_end ( context - > data , start_token - > start , token_j - > start ) ) ;
String type_postfix = skip_chop_whitespace ( str_start_end ( context - > data , token_j - > start + token_j - > size , token - > start ) ) ;
set_token ( context , token + 1 ) ;
result = true ;
member - > name = name ;
member - > type = type ;
member - > type_postfix = type_postfix ;
member - > doc_string = doc_string ;
member - > first_child = 0 ;
member - > next_sibling = 0 ;
}
return ( result ) ;
}
static Item_Node *
struct_parse_next_member ( Partition * part , Parse_Context * context ) {
Item_Node * result = 0 ;
Cpp_Token * token = 0 ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_IDENTIFIER | |
( token - > flags & CPP_TFLAG_IS_KEYWORD ) ) {
String lexeme = get_lexeme ( * token , context - > data ) ;
if ( match_ss ( lexeme , make_lit_string ( " STRUCT " ) ) ) {
Item_Node * member = push_struct ( part , Item_Node ) ;
if ( struct_parse ( part , true , context , member ) ) {
result = member ;
break ;
}
else {
2017-01-23 06:19:43 +00:00
Assert ( ! " unhandled error " ) ;
2016-11-02 03:27:51 +00:00
}
}
else if ( match_ss ( lexeme , make_lit_string ( " UNION " ) ) ) {
Item_Node * member = push_struct ( part , Item_Node ) ;
if ( struct_parse ( part , false , context , member ) ) {
result = member ;
break ;
}
else {
2017-01-23 06:19:43 +00:00
Assert ( ! " unhandled error " ) ;
2016-11-02 03:27:51 +00:00
}
}
else {
Item_Node * member = push_struct ( part , Item_Node ) ;
if ( struct_parse_member ( part , context , member ) ) {
result = member ;
break ;
}
else {
2017-01-23 06:19:43 +00:00
Assert ( ! " unhandled error " ) ;
2016-11-02 03:27:51 +00:00
}
}
}
else if ( token - > type = = CPP_TOKEN_BRACE_CLOSE ) {
break ;
}
}
return ( result ) ;
}
static int32_t
struct_parse ( Partition * part , int32_t is_struct , Parse_Context * context , Item_Node * top_member ) {
int32_t result = false ;
Cpp_Token * start_token = get_token ( context ) ;
Cpp_Token * token = 0 ;
String doc_string = { 0 } ;
get_doc_string_from_prev ( context , & doc_string ) ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_BRACE_OPEN ) {
break ;
}
}
if ( token ) {
Cpp_Token * token_j = token ;
for ( ; ( token_j = get_token ( context ) ) > start_token ; get_prev_token ( context ) ) {
if ( token_j - > type = = CPP_TOKEN_IDENTIFIER ) {
break ;
}
}
String name = { 0 } ;
if ( token_j ! = start_token ) {
name = skip_chop_whitespace ( get_lexeme ( * token_j , context - > data ) ) ;
}
String type = { 0 } ;
if ( is_struct ) {
type = make_lit_string ( " struct " ) ;
}
else {
type = make_lit_string ( " union " ) ;
}
set_token ( context , token + 1 ) ;
Item_Node * new_member = struct_parse_next_member ( part , context ) ;
if ( new_member ) {
top_member - > first_child = new_member ;
Item_Node * head_member = new_member ;
for ( ; ; ) {
new_member = struct_parse_next_member ( part , context ) ;
if ( new_member ) {
head_member - > next_sibling = new_member ;
head_member = new_member ;
}
else {
break ;
}
}
}
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_SEMICOLON ) {
break ;
}
}
+ + token ;
if ( is_struct ) {
top_member - > t = Item_Struct ;
}
else {
top_member - > t = Item_Union ;
}
top_member - > name = name ;
top_member - > type = type ;
top_member - > doc_string = doc_string ;
top_member - > next_sibling = 0 ;
result = true ;
}
return ( result ) ;
}
static int32_t
typedef_parse ( Parse_Context * context , Item_Node * item ) {
int32_t result = false ;
Cpp_Token * token = get_token ( context ) ;
String doc_string = { 0 } ;
get_doc_string_from_prev ( context , & doc_string ) ;
Cpp_Token * start_token = token ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_SEMICOLON ) {
break ;
}
}
if ( token ) {
Cpp_Token * token_j = token ;
for ( ; ( token_j = get_token ( context ) ) > start_token ; get_prev_token ( context ) ) {
if ( token_j - > type = = CPP_TOKEN_IDENTIFIER ) {
break ;
}
}
String name = get_lexeme ( * token_j , context - > data ) ;
String type = skip_chop_whitespace ( str_start_end ( context - > data , start_token - > start + start_token - > size , token_j - > start ) ) ;
item - > t = Item_Typedef ;
item - > type = type ;
item - > name = name ;
item - > doc_string = doc_string ;
result = true ;
}
set_token ( context , token ) ;
return ( result ) ;
}
static int32_t
enum_parse ( Partition * part , Parse_Context * context , Item_Node * item ) {
int32_t result = false ;
2017-03-17 04:48:27 +00:00
String parent_doc_string = { 0 } ;
get_doc_string_from_prev ( context , & parent_doc_string ) ;
2016-11-02 03:27:51 +00:00
2017-03-17 04:48:27 +00:00
Cpp_Token * parent_start_token = get_token ( context ) ;
2016-11-02 03:27:51 +00:00
Cpp_Token * token = 0 ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_BRACE_OPEN ) {
break ;
}
}
if ( token ) {
2017-03-17 04:48:27 +00:00
String parent_name = { 0 } ;
2016-11-02 03:27:51 +00:00
Cpp_Token * token_j = 0 ;
for ( ; ( token_j = get_token ( context ) ) ! = 0 ; get_prev_token ( context ) ) {
if ( token_j - > type = = CPP_TOKEN_IDENTIFIER ) {
break ;
}
}
2017-03-17 04:48:27 +00:00
parent_name = get_lexeme ( * token_j , context - > data ) ;
2016-11-02 03:27:51 +00:00
set_token ( context , token ) ;
2017-03-17 04:48:27 +00:00
for ( ; ( token = get_token ( context ) ) > parent_start_token ; get_next_token ( context ) ) {
2016-11-02 03:27:51 +00:00
if ( token - > type = = CPP_TOKEN_BRACE_OPEN ) {
break ;
}
}
if ( token ) {
Item_Node * first_member = 0 ;
Item_Node * head_member = 0 ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_BRACE_CLOSE ) {
break ;
}
else if ( token - > type = = CPP_TOKEN_IDENTIFIER ) {
String doc_string = { 0 } ;
String name = { 0 } ;
String value = { 0 } ;
get_doc_string_from_prev ( context , & doc_string ) ;
name = get_lexeme ( * token , context - > data ) ;
token = get_next_token ( context ) ;
if ( token ) {
if ( token - > type = = CPP_TOKEN_EQ ) {
Cpp_Token * start_token = token ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_COMMA | |
token - > type = = CPP_TOKEN_BRACE_CLOSE ) {
break ;
}
}
value = skip_chop_whitespace ( str_start_end ( context - > data , start_token - > start + start_token - > size , token - > start ) ) ;
get_prev_token ( context ) ;
}
else {
get_prev_token ( context ) ;
}
}
Item_Node * new_member = push_struct ( part , Item_Node ) ;
if ( first_member = = 0 ) {
first_member = new_member ;
}
if ( head_member ) {
head_member - > next_sibling = new_member ;
}
head_member = new_member ;
new_member - > name = name ;
new_member - > value = value ;
new_member - > doc_string = doc_string ;
new_member - > next_sibling = 0 ;
}
}
if ( ( token = get_token ( context ) ) ! = 0 ) {
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_BRACE_CLOSE ) {
break ;
}
}
get_next_token ( context ) ;
item - > t = Item_Enum ;
2017-03-17 04:48:27 +00:00
item - > name = parent_name ;
item - > doc_string = parent_doc_string ;
2016-11-02 03:27:51 +00:00
item - > first_child = first_member ;
result = true ;
}
}
}
return ( result ) ;
}
static Argument_Breakdown
allocate_argument_breakdown ( Partition * part , int32_t count ) {
Argument_Breakdown breakdown = { 0 } ;
if ( count > 0 ) {
breakdown . count = count ;
breakdown . args = push_array ( part , Argument , count ) ;
memset ( breakdown . args , 0 , sizeof ( Argument ) * count ) ;
}
return ( breakdown ) ;
}
/*
Parse arguments by giving pointers to the tokens :
foo ( a , . . . , z )
^ ^
*/
static Argument_Breakdown
parameter_parse ( Partition * part , char * data , Cpp_Token * args_start_token , Cpp_Token * args_end_token ) {
int32_t arg_index = 0 ;
Cpp_Token * arg_token = args_start_token + 1 ;
2017-03-19 23:05:05 +00:00
uint32_t param_string_start = arg_token - > start ;
2016-11-02 03:27:51 +00:00
int32_t arg_count = 1 ;
arg_token = args_start_token ;
for ( ; arg_token < args_end_token ; + + arg_token ) {
if ( arg_token - > type = = CPP_TOKEN_COMMA ) {
+ + arg_count ;
}
}
Argument_Breakdown breakdown = allocate_argument_breakdown ( part , arg_count ) ;
arg_token = args_start_token + 1 ;
for ( ; arg_token < = args_end_token ; + + arg_token ) {
if ( arg_token - > type = = CPP_TOKEN_COMMA | |
arg_token - > type = = CPP_TOKEN_PARENTHESE_CLOSE ) {
int32_t size = arg_token - > start - param_string_start ;
String param_string = make_string ( data + param_string_start , size ) ;
param_string = chop_whitespace ( param_string ) ;
breakdown . args [ arg_index ] . param_string = param_string ;
for ( Cpp_Token * param_name_token = arg_token - 1 ;
param_name_token - > start > param_string_start ;
- - param_name_token ) {
if ( param_name_token - > type = = CPP_TOKEN_IDENTIFIER ) {
2017-03-17 17:45:41 +00:00
int32_t name_start = param_name_token - > start ;
int32_t name_size = param_name_token - > size ;
breakdown . args [ arg_index ] . param_name = make_string ( data + name_start , name_size ) ;
2016-11-02 03:27:51 +00:00
break ;
}
}
+ + arg_index ;
if ( arg_token + 1 < = args_end_token ) {
param_string_start = arg_token [ 1 ] . start ;
}
}
}
return ( breakdown ) ;
}
/*
Moves the context in the following way :
~ ~ ~ ~ ~ ~ ~ name ( ~ ~ ~ ~ ~ ~ ~
^ - > ^
*/
static int32_t
function_parse_goto_name ( Parse_Context * context ) {
int32_t result = false ;
Cpp_Token * token = 0 ;
{
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_PARENTHESE_OPEN ) {
break ;
}
}
if ( get_token ( context ) ) {
do {
token = get_prev_token ( context ) ;
} while ( token - > type = = CPP_TOKEN_COMMENT ) ;
if ( token - > type = = CPP_TOKEN_IDENTIFIER ) {
result = true ;
}
}
}
return ( result ) ;
}
/*
Moves the context in the following way :
~ ~ ~ ~ ~ ~ ~ name ( ~ ~ ~ ~ ~ ~ ~ /* XXX //
^ - - - - - - - - - - - - - - - > ^
*/
static int32_t
function_get_doc ( Parse_Context * context , char * data , String * doc_string ) {
int32_t result = false ;
Cpp_Token * token = get_token ( context ) ;
String lexeme = { 0 } ;
if ( function_parse_goto_name ( context ) ) {
if ( token - > type = = CPP_TOKEN_IDENTIFIER ) {
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_COMMENT ) {
lexeme = get_lexeme ( * token , data ) ;
if ( check_and_fix_docs ( & lexeme ) ) {
* doc_string = lexeme ;
result = true ;
break ;
}
}
else if ( token - > type = = CPP_TOKEN_BRACE_OPEN ) {
break ;
}
}
}
}
return ( result ) ;
}
static int32_t
cpp_name_parse ( Parse_Context * context , String * name ) {
int32_t result = false ;
Cpp_Token * token = 0 ;
Cpp_Token * token_start = get_token ( context ) ;
token = get_next_token ( context ) ;
if ( token & & token - > type = = CPP_TOKEN_PARENTHESE_OPEN ) {
token = get_next_token ( context ) ;
if ( token & & token - > type = = CPP_TOKEN_IDENTIFIER ) {
token = get_next_token ( context ) ;
if ( token & & token - > type = = CPP_TOKEN_PARENTHESE_CLOSE ) {
* name = get_lexeme ( * ( token - 1 ) , context - > data ) ;
result = true ;
}
}
}
if ( ! result ) {
set_token ( context , token_start ) ;
}
return ( result ) ;
}
/*
Moves the context in the following way :
RETTY ~ name ( ~ ~ ~ ~ ~ ~ ~ )
^ - - - - - - - - - - - - - - - > ^
*/
static int32_t
function_sig_parse ( Partition * part , Parse_Context * context , Item_Node * item , String cpp_name ) {
int32_t result = false ;
Cpp_Token * token = 0 ;
Cpp_Token * args_start_token = 0 ;
Cpp_Token * ret_token = get_token ( context ) ;
if ( function_parse_goto_name ( context ) ) {
token = get_token ( context ) ;
args_start_token = token + 1 ;
item - > name = get_lexeme ( * token , context - > data ) ;
item - > ret = chop_whitespace ( str_start_end ( context - > data , ret_token - > start , token - > start ) ) ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_PARENTHESE_CLOSE ) {
break ;
}
}
if ( token ) {
item - > args = str_start_end ( context - > data , args_start_token - > start , token - > start + token - > size ) ;
item - > t = Item_Function ;
item - > cpp_name = cpp_name ;
item - > breakdown = parameter_parse ( part , context - > data , args_start_token , token ) ;
Assert ( get_token ( context ) - > type = = CPP_TOKEN_PARENTHESE_CLOSE ) ;
result = true ;
}
}
return ( result ) ;
}
/*
Moves the context in the following way :
MARKER ~ ~ ~ name ( ~ ~ ~ ~ ~ ~ ~ )
^ - - - - - - - - - - - - - - - - - - - > ^
*/
static int32_t
function_parse ( Partition * part , Parse_Context * context , Item_Node * item , String cpp_name ) {
int32_t result = false ;
String doc_string = { 0 } ;
Cpp_Token * token = get_token ( context ) ;
item - > marker = get_lexeme ( * token , context - > data ) ;
if ( function_get_doc ( context , context - > data , & doc_string ) ) {
item - > doc_string = doc_string ;
}
set_token ( context , token ) ;
if ( get_next_token ( context ) ) {
if ( function_sig_parse ( part , context , item , cpp_name ) ) {
Assert ( get_token ( context ) - > type = = CPP_TOKEN_PARENTHESE_CLOSE ) ;
result = true ;
}
}
return ( result ) ;
}
/*
Moves the context in the following way :
/* ~~~ // #define
^ - - - - > ^
*/
static int32_t
macro_parse_check ( Parse_Context * context ) {
int32_t result = false ;
Cpp_Token * token = 0 ;
if ( ( token = get_next_token ( context ) ) ! = 0 ) {
if ( token - > type = = CPP_TOKEN_COMMENT ) {
if ( ( token = get_next_token ( context ) ) ! = 0 ) {
if ( token - > type = = CPP_PP_DEFINE ) {
result = true ;
}
}
}
}
return ( result ) ;
}
/*
Moves the context in the following way :
/* ~~~ // #define ~~~~~~~~~~~~~~~~~ NOT_IN_MACRO_BODY
^ - - - - - - - - - - - - - - - - - - - - - - - - - - - - > ^
*/
static int32_t
macro_parse ( Partition * part , Parse_Context * context , Item_Node * item ) {
int32_t result = false ;
Cpp_Token * token = 0 ;
Cpp_Token * doc_token = 0 ;
Cpp_Token * args_start_token = 0 ;
String doc_string = { 0 } ;
if ( macro_parse_check ( context ) ) {
token = get_token ( context ) ;
if ( can_back_step ( context ) ) {
doc_token = token - 1 ;
doc_string = get_lexeme ( * doc_token , context - > data ) ;
if ( check_and_fix_docs ( & doc_string ) ) {
item - > doc_string = doc_string ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_IDENTIFIER ) {
break ;
}
}
if ( get_token ( context ) & & ( token - > flags & CPP_TFLAG_PP_BODY ) ) {
item - > name = get_lexeme ( * token , context - > data ) ;
if ( ( token = get_next_token ( context ) ) ! = 0 ) {
args_start_token = token ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( token - > type = = CPP_TOKEN_PARENTHESE_CLOSE ) {
break ;
}
}
if ( token ) {
item - > args = str_start_end ( context - > data , args_start_token - > start , token - > start + token - > size ) ;
item - > breakdown = parameter_parse ( part , context - > data , args_start_token , token ) ;
if ( ( token = get_next_token ( context ) ) ! = 0 ) {
Cpp_Token * body_start = token ;
if ( body_start - > flags & CPP_TFLAG_PP_BODY ) {
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( ! ( token - > flags & CPP_TFLAG_PP_BODY ) ) {
break ;
}
}
token = get_prev_token ( context ) ;
item - > body = str_start_end ( context - > data , body_start - > start , token - > start + token - > size ) ;
}
}
item - > t = Item_Macro ;
result = true ;
}
}
}
}
}
}
return ( result ) ;
}
static Meta_Unit
2017-03-17 17:45:41 +00:00
compile_meta_unit ( Partition * part , char * code_directory , char * * files , Meta_Keywords * meta_keywords , int32_t key_count ) {
2016-11-02 03:27:51 +00:00
Meta_Unit unit = { 0 } ;
int32_t file_count = 0 ;
for ( char * * file_ptr = files ; * file_ptr ; + + file_ptr , + + file_count ) ;
unit . count = file_count ;
unit . parse = push_array ( part , Parse , file_count ) ;
2017-01-23 06:19:43 +00:00
b32 all_files_lexed = true ;
2016-11-02 03:27:51 +00:00
int32_t i = 0 ;
for ( char * * file_ptr = files ; * file_ptr ; + + file_ptr , + + i ) {
char str_space [ 512 ] ;
String name = make_fixed_width_string ( str_space ) ;
append_sc ( & name , code_directory ) ;
2016-11-06 02:31:45 +00:00
# ifdef _WIN32
2016-11-02 03:27:51 +00:00
append_sc ( & name , " \\ " ) ;
2016-11-06 02:31:45 +00:00
# else
append_sc ( & name , " / " ) ;
# endif
2016-11-02 03:27:51 +00:00
append_sc ( & name , * file_ptr ) ;
terminate_with_null ( & name ) ;
unit . parse [ i ] = meta_lex ( name . str ) ;
2017-01-23 06:19:43 +00:00
if ( unit . parse [ i ] . code . str = = 0 ) {
all_files_lexed = false ;
break ;
}
2016-11-02 03:27:51 +00:00
}
2017-01-23 06:19:43 +00:00
if ( all_files_lexed ) {
// TODO(allen): This stage counts nested structs and unions which is not correct. Luckily it only means we over allocate by a few items, but fixing it to be exactly correct would be nice.
for ( int32_t J = 0 ; J < unit . count ; + + J ) {
Cpp_Token * token = 0 ;
Parse_Context context_ = setup_parse_context ( unit . parse [ J ] ) ;
Parse_Context * context = & context_ ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( ! ( token - > flags & CPP_TFLAG_PP_BODY ) ) {
2016-11-02 03:27:51 +00:00
2017-01-23 06:19:43 +00:00
String lexeme = get_lexeme ( * token , context - > data ) ;
int32_t match_index = 0 ;
2017-03-17 17:45:41 +00:00
if ( string_set_match_table ( meta_keywords , sizeof ( * meta_keywords ) , key_count , lexeme , & match_index ) ) {
Item_Type type = meta_keywords [ match_index ] . type ;
2017-01-23 06:19:43 +00:00
if ( type > Item_Null & & type < Item_Type_Count ) {
+ + unit . set . count ;
}
else {
// TODO(allen): Warning
}
2016-11-02 03:27:51 +00:00
}
}
}
}
2017-01-23 06:19:43 +00:00
if ( unit . set . count > 0 ) {
unit . set = allocate_item_set ( part , unit . set . count ) ;
}
int32_t index = 0 ;
2016-11-02 03:27:51 +00:00
2017-01-23 06:19:43 +00:00
for ( int32_t J = 0 ; J < unit . count ; + + J ) {
Cpp_Token * token = 0 ;
Parse_Context context_ = setup_parse_context ( unit . parse [ J ] ) ;
Parse_Context * context = & context_ ;
String cpp_name = { 0 } ;
int32_t has_cpp_name = 0 ;
for ( ; ( token = get_token ( context ) ) ! = 0 ; get_next_token ( context ) ) {
if ( ! ( token - > flags & CPP_TFLAG_PP_BODY ) ) {
2016-11-02 03:27:51 +00:00
2017-01-23 06:19:43 +00:00
String lexeme = get_lexeme ( * token , context - > data ) ;
int32_t match_index = 0 ;
2017-03-17 17:45:41 +00:00
if ( string_set_match_table ( meta_keywords , sizeof ( * meta_keywords ) , key_count , lexeme , & match_index ) ) {
Item_Type type = meta_keywords [ match_index ] . type ;
2016-11-02 03:27:51 +00:00
2017-01-23 06:19:43 +00:00
switch ( type ) {
case Item_Function :
{
if ( function_parse ( part , context , unit . set . items + index , cpp_name ) ) {
Assert ( unit . set . items [ index ] . t = = Item_Function ) ;
+ + index ;
}
else {
fprintf ( stderr , " warning: invalid function signature \n " ) ;
}
} break ;
case Item_CppName :
{
if ( cpp_name_parse ( context , & cpp_name ) ) {
has_cpp_name = 1 ;
}
else {
// TODO(allen): warning message
}
} break ;
case Item_Macro :
{
if ( macro_parse ( part , context , unit . set . items + index ) ) {
Assert ( unit . set . items [ index ] . t = = Item_Macro ) ;
+ + index ;
}
else {
// TODO(allen): warning message
}
} break ;
case Item_Typedef : //typedef
{
if ( typedef_parse ( context , unit . set . items + index ) ) {
Assert ( unit . set . items [ index ] . t = = Item_Typedef ) ;
+ + index ;
}
else {
// TODO(allen): warning message
}
} break ;
case Item_Struct : case Item_Union : //struct/union
{
if ( struct_parse ( part , ( type = = Item_Struct ) , context , unit . set . items + index ) ) {
Assert ( unit . set . items [ index ] . t = = Item_Struct | |
unit . set . items [ index ] . t = = Item_Union ) ;
+ + index ;
}
else {
// TODO(allen): warning message
}
} break ;
case Item_Enum : //ENUM
{
if ( enum_parse ( part , context , unit . set . items + index ) ) {
Assert ( unit . set . items [ index ] . t = = Item_Enum ) ;
+ + index ;
}
else {
// TODO(allen): warning message
}
} break ;
}
2016-11-02 03:27:51 +00:00
}
}
2017-01-23 06:19:43 +00:00
if ( has_cpp_name ) {
has_cpp_name = 0 ;
}
else {
cpp_name = null_string ;
}
unit . parse [ J ] . item_count = index ;
2016-11-02 03:27:51 +00:00
}
2017-01-23 06:19:43 +00:00
// NOTE(allen): This is necessary for now because
// the original count is slightly overestimated thanks
// to nested structs and unions.
unit . set . count = index ;
2016-11-02 03:27:51 +00:00
}
2017-01-23 06:19:43 +00:00
}
else {
unit . parse = 0 ;
unit . count = 0 ;
2016-11-02 03:27:51 +00:00
}
return ( unit ) ;
}
2016-11-03 04:57:26 +00:00
static Meta_Unit
2017-03-17 17:45:41 +00:00
compile_meta_unit ( Partition * part , char * code_directory , char * file , Meta_Keywords * meta_keywords , int32_t key_count ) {
2016-11-03 04:57:26 +00:00
char * file_array [ 2 ] = { file , 0 } ;
2017-03-17 17:45:41 +00:00
Meta_Unit unit = compile_meta_unit ( part , code_directory , file_array , meta_keywords , key_count ) ;
2016-11-03 04:57:26 +00:00
return ( unit ) ;
}
2016-11-02 03:27:51 +00:00
# endif
// BOTTOM