tree-sitter-lang/grammar.g4
ProgramSnail d218e02a78 init
2023-07-16 20:54:43 +03:00

167 lines
5.2 KiB
ANTLR

grammar lang ;
// not always most recent grammar ??
// not checked
source_file: (statement)+ EOF ;
statement: import
| type_definition
| function_definition
| typeclass_definition
;
import: ('::' | 'import') (SIMPLE_NAME_IDENTIFIER | '_') ('=' SIMPLE_NAME_IDENTIFIER)?
(':' (SIMPLE_TYPE_IDENTIFIER | SIMPLE_NAME_IDENTIFIER | TYPECLASS_IDENTIFIER | ('(' OPERATOR ')'))*)? ';'
;
constraint: '?' expression ;
type_definition: (DEFINITION_INFO)? (ANNOTATION_INFO)* ('^')?
SIMPLE_TYPE_IDENTIFIER ((ARGUMENT_TYPE_IDENTIFIER)* '=' (variant_type | typle_type))?
(('{' function_definietion '}')|';')
;
function_definition: (definietion_info)? (ANNOTATION_INFO)* (constraint ';')*
(('%' | 'let') | ('$' | 'var'))? SIMPLE_NAME_IDENTIFIER
((ANNOTATION_IDENTIFIER)? ARGUMENT_NAME_IDENTIFIER)*
(':' ((ANNOTATION_IDENTIFIER)? ('->' | 'in') | ('<-' | 'out') | ('<>' | 'ref'))? type)+)?
(('=' ((super_expression ';') | block)) | ';')
;
typeclass_definition: (DEFINITION_INFO)? (ANNOTATION_INFO)*
TYPECLASS_IDENTIFIER (seq(':', (TYPECLASS_IDENTIFIER)*))?
(('{' (function_definition)* '}') | ';')
;
case: (':=' | '=:') expression (('??' | 'if') expression)? (('->' | 'do') expression)? ;
match: expression (case)+ ;
condition: choice('??' | 'if') expression choice('->' |'do') expression
(('!!' | 'elif') expression ('->' | 'do') expression)*
(('!!->' | 'else') _expression)?
;
loop: ('@' | 'for') (expression | (expression ':' expression))?,
('->' | 'do') expression
;
comma_expression: /* prec left ?? */ super_expression ',' super_expression ;
operator_expression: /* prec left ?? */
| /* prec 4 */ expression OPERATOR expression
| /* prec 3 */ expression OPERATOR_TAIL1 expression
| /* prec 2 */ expression OPERATOR_TAIL2 expression
| /* prec 1 */ expression OPERATOR_TAIL3 expression
;
block: '{' (super_expression ';')* '}' ;
array: '[[' (scoped_expression)+ ']]' ;
name_definition: (('%' | 'let') | ('$' | 'var')) (SIMPLE_NAME_IDENTIFIER | PLACEHOLDER) ;
access: scoped_expression '[' super_expression ']' ;
reference: /* prec -1 ?? */ (('<>' | 'ref') | ('<-' | 'in')) scoped_expression ;
return: ('return' | 'bring') expression ;
loop_control: 'break'
| 'continue'
;
name_expression:
((type '.' SIMPLE_NAME_IDENTIFIER)
| (scoped_expression '.' SIMPLE_NAME_IDENTIFIER)
| name_identifier
| ('(' OPERATOR ')'))
((ANNOTATION_IDENTIFIER)? scoped_expression)*
;
constructor: type (ANNOTATION_IDENTIFIER)? scoped_expression)+ ;
lambda: '\\' ((ANNOTATION_IDENTIFIER)? ARGUMENT_NAME_IDENTIFIER)+ '->' expression ;
super_expression: match
| condition
| loop
| comma_expression
| expression
;
expression: name_expression
| operator_expression
| return
| lambda
| constructor
| block
| not_name_scoped_expression
;
scoped_expression: name_identifier
| not_name_scoped_expression
;
not_name_scoped_expression: PLACEHOLDER
| name_definition
| access
| loop_control
| array
| literal
| '(' super_expression ')'
| reference
;
variant_type: ('|')? tuple_type ('|' tuple_type)+ ;
tuple_type: ('&')? annotated_type ('&' _annotated_type)* ;
annotated_type: (ANNOTATION_IDENTIFIER)? type ;
type: ('^')? type_identifier ('?')? ('[' (type)+ ']')? ;
name_identifier: (ARGUMENT_NAME_IDENTIFIER | SIMPLE_NAME_IDENTIFIER) ;
type_identifier: (ARGUMENT_TYPE_IDENTIFIER | SIMPLE_TYPE_IDENTIFIER) ;
literal: FLOAT_NUMBER_LITERAL
| NUMBER_LITERAL
| STRING_LITERAL
| CHAR_LITERAL
| BOOL_LITERAL
| UNIT_LITERAL
| NULL_LITERAL
DEFINITION_INFO : : ': ' ([^\n]*)+ ;
ANNOTATION_INFO : ANNOTATION_IDENTIFIER [^\n]* ;
LINE_COMMENT : '//' [^\n]* -> skip ;
BLOCK_COMMENT : '\*' ([^*] |('\*' [^/]))* '*/' -> skip ;
PLACEHOLDER : '_' ;
SIMPLE_NAME_IDENTIFIER : ([a-z_][a-z0-9_]* '.')* [a-z_][a-z0-9_]* ;
SIMPLE_TYPE_IDENTIFIER : ([a-z_][a-z0-9_]* '.')* [A-Z][a-zA-Z0-9]* ;
TYPECLASS_IDENTIFIER : ([a-z_][a-z0-9_]* '.' )* '#' [A-Z][a-zA-Z0-9]* ;
ARGUMENT_NAME_IDENTIFIER : '\'' [a-z_][a-z0-9_]* ;
ARGUMENT_TYPE_IDENTIFIER : '\'' [A-Z][a-zA-Z0-9]* ;
ANNOTATION_IDENTIFIER : '@' [a-z_][a-z0-9_]* ;
OPERATOR : ([+\-*/%^!?|&,<>=]+)|\.+ ;
OPERATOR_TAIL1 : [+\-*/%^!?|&,<>=]+\. ;
OPERATOR_TAIL2 : [+\-*/%^!?|&,<>=]+\.\. ;
OPERATOR_TAIL3 : [+\-*/%^!?|&,<>=]+\.\.\. ;
FLOAT_NUMBER_LITERAL : [0-9]+ '.' [0-9]+ ;
NUMBER_LITERAL : [0-9]+ ;
STRING_LITERAL : \"([^\\\"]|(\\.))*\" ;
CHAR_LITERAL : '\'' '\'' ([^\\\'] | ( '\\' [\u0000-\u00FF])) '\'' '\'' ;
BOOL_LITERAL : 'true' | 'false' ;
UNIT_LITERAL : '()' ;
NULL_LITERAL : 'null' ;
// IDENTIFIER: ([@'#]?[a-zA-Z0-9_]+)|([+\-*/%^!?|&,<>=]+\.?\.?\.?)|\.+