VirtoolsTranslation/NlpParser/Nlp.g4

grammar Nlp;

// ===== Parser =====

// Entry rule: one language header followed by any number of sections.
// The trailing EOF makes the parser account for the whole token stream;
// without it, parsing may stop at the first token that cannot continue the
// rule and leave the remainder of the input unreported.
document: LANG_HEADER section* EOF ;

// A section: its head token, then any mix of sub-sections and entries.
section
    : SECTION_HEAD (subSection | entry)*
    ;

// A sub-section: its head token followed by zero or more entries.
subSection
    : SUB_SECTION_HEAD entry*
    ;

// One value inside a section or sub-section. Three shapes are accepted:
//   entryString         - a single quoted string
//   entryConcatedString - two or more quoted strings joined by LINE_CONCATOR
//   entryInteger        - an integer literal
// The `#` labels name the alternatives for the generated listener/visitor.
entry
    : ENTRY_STRING                                  # entryString
    | ENTRY_STRING (LINE_CONCATOR ENTRY_STRING)+    # entryConcatedString
    | ENTRY_INTEGER                                 # entryInteger
    ;

// ===== Lexer =====

// Header token: the literal `Language:` immediately followed by one or more
// ASCII letters.
LANG_HEADER
    : 'Language:' [A-Za-z]+
    ;

// A section head is a name wrapped in square brackets; a sub-section head is
// a name wrapped in angle brackets.
SECTION_HEAD
    : '[' NAME_SECTION ']'
    ;
SUB_SECTION_HEAD
    : '<' NAME_SECTION '>'
    ;
// A name consists of one or more spaces, ASCII letters or digits.
fragment NAME_SECTION
    : [A-Za-z0-9 ]+
    ;

// A quoted string: an opening `"`, then any run of escape sequences or
// characters other than `"` (line breaks included), then a closing `"`.
ENTRY_STRING: '"' (ENTRY_STRING_ESC| ~'"' )* '"' ;
// Escape sequences recognised inside a string: a doubled quote (`""`), or a
// backslash followed by a backslash, `t` or `n`. They are matched as written;
// nothing in this grammar decodes them.
fragment ENTRY_STRING_ESC: '""' | '\\\\' | '\\t' | '\\n' ; 

// A positive decimal integer without a leading zero. The tail uses `*`, not
// `+`, so that single-digit values such as `7` are tokens too; with `+` the
// rule only matched numbers of two or more digits.
ENTRY_INTEGER: [1-9][0-9]* ;

// A single backslash; the `entry` rule uses it to join consecutive strings.
LINE_CONCATOR: '\\';
// Separators (space, comma, semicolon, CR and LF) are discarded.
// NOTE(review): tab is not in this set; confirm inputs never contain tabs.
SPLITTOR
    : [ \r\n,;]+ -> skip
    ;
LINE_COMMENT: '//' ~[\r\n]* -> skip ;       // discards `//` up to, but not including, the line break; SPLITTOR then skips the break itself.
// Block comment: `/*` through the nearest following `*/` (non-greedy match), discarded.
BLOCK_COMMENT: '/*' .*? '*/' -> skip ;
add parser 2023-06-28 22:56:18 +08:00			`grammar Nlp;`

fix parser error 2023-06-30 17:19:08 +08:00			`// ===== Parser =====`

add antlr4 listener 2023-06-29 21:46:58 +08:00			`document: LANG_HEADER (section)* ;`
add parser 2023-06-28 22:56:18 +08:00
add antlr4 listener 2023-06-29 21:46:58 +08:00			`section: SECTION_HEAD (subSection \| entry)* ;`
add parser 2023-06-28 22:56:18 +08:00
add antlr4 listener 2023-06-29 21:46:58 +08:00			`subSection: SUB_SECTION_HEAD (entry)* ;`
add parser 2023-06-28 22:56:18 +08:00
add antlr4 listener 2023-06-29 21:46:58 +08:00			`entry: ENTRY_STRING # entryString`
fix parser error 2023-06-30 17:19:08 +08:00			`\| ENTRY_STRING (LINE_CONCATOR ENTRY_STRING)+ # entryConcatedString`
add antlr4 listener 2023-06-29 21:46:58 +08:00			`\| ENTRY_INTEGER # entryInteger`
add parser 2023-06-28 22:56:18 +08:00			`;`

fix parser error 2023-06-30 17:19:08 +08:00			`// ===== Lexer =====`

add parser 2023-06-28 22:56:18 +08:00			`LANG_HEADER: 'Language:' [a-zA-Z]+ ;`

			`SECTION_HEAD: '[' NAME_SECTION ']' ;`
			`SUB_SECTION_HEAD: '<' NAME_SECTION '>' ;`
			`fragment NAME_SECTION: [ a-zA-Z0-9]+ ; // section name are consisted of space, char and number`

fix parser error 2023-06-30 17:19:08 +08:00			`ENTRY_STRING: '"' (ENTRY_STRING_ESC\| ~'"' )* '"' ;`
			`fragment ENTRY_STRING_ESC: '""' \| '\\\\' \| '\\t' \| '\\n' ;`
add parser 2023-06-28 22:56:18 +08:00
			`ENTRY_INTEGER: [1-9][0-9]+ ;`

fix parser error 2023-06-30 17:19:08 +08:00			`LINE_CONCATOR: '\\';`
add parser 2023-06-28 22:56:18 +08:00			`SPLITTOR: [ ,;\r\n]+ -> skip; // ignore all splittor and space`
			`LINE_COMMENT: '//' ~[\r\n]* -> skip ; // consume all non-line-breaker. because we need line breaker.`
			`BLOCK_COMMENT: '/' .? '*/' -> skip ;`