fix parser error

This commit is contained in:
yyc12345 2023-06-30 17:19:08 +08:00
parent 2525cf402d
commit b6558a718d
4 changed files with 125 additions and 145 deletions

View File

@ -1,5 +1,7 @@
grammar Nlp; grammar Nlp;
// ===== Parser =====
document: LANG_HEADER (section)* ; document: LANG_HEADER (section)* ;
section: SECTION_HEAD (subSection | entry)* ; section: SECTION_HEAD (subSection | entry)* ;
@ -7,22 +9,24 @@ section: SECTION_HEAD (subSection | entry)* ;
subSection: SUB_SECTION_HEAD (entry)* ; subSection: SUB_SECTION_HEAD (entry)* ;
entry: ENTRY_STRING # entryString entry: ENTRY_STRING # entryString
| ENTRY_STRING (LINE_CONCAT ENTRY_STRING)+ # entryConcatedString | ENTRY_STRING (LINE_CONCATOR ENTRY_STRING)+ # entryConcatedString
| ENTRY_INTEGER # entryInteger | ENTRY_INTEGER # entryInteger
; ;
// ===== Lexer =====
LANG_HEADER: 'Language:' [a-zA-Z]+ ; LANG_HEADER: 'Language:' [a-zA-Z]+ ;
SECTION_HEAD: '[' NAME_SECTION ']' ; SECTION_HEAD: '[' NAME_SECTION ']' ;
SUB_SECTION_HEAD: '<' NAME_SECTION '>' ; SUB_SECTION_HEAD: '<' NAME_SECTION '>' ;
fragment NAME_SECTION: [ a-zA-Z0-9]+ ; // section name are consisted of space, char and number fragment NAME_SECTION: [ a-zA-Z0-9]+ ; // section name are consisted of space, char and number
ENTRY_STRING: '"' (STRING_ESC|.)*? '"' ; ENTRY_STRING: '"' (ENTRY_STRING_ESC| ~'"' )* '"' ;
fragment STRING_ESC: '\\"' | '\\\\' ; fragment ENTRY_STRING_ESC: '""' | '\\\\' | '\\t' | '\\n' ;
ENTRY_INTEGER: [1-9][0-9]+ ; ENTRY_INTEGER: [1-9][0-9]+ ;
LINE_CONCATOR: '\\';
SPLITTOR: [ ,;\r\n]+ -> skip; // ignore all splittor and space SPLITTOR: [ ,;\r\n]+ -> skip; // ignore all splittor and space
LINE_CONCAT: '\\' ;
LINE_COMMENT: '//' ~[\r\n]* -> skip ; // consume all non-line-breaker. because we need line breaker. LINE_COMMENT: '//' ~[\r\n]* -> skip ; // consume all non-line-breaker. because we need line breaker.
BLOCK_COMMENT: '/*' .*? '*/' -> skip ; BLOCK_COMMENT: '/*' .*? '*/' -> skip ;

View File

@ -1,20 +1,41 @@
// import antlr stuff
import org.antlr.v4.runtime.*; import org.antlr.v4.runtime.*;
import org.antlr.v4.runtime.tree.*; import org.antlr.v4.runtime.tree.*;
// import container
import java.util.Stack; import java.util.Stack;
import java.util.stream.Collectors;
import java.util.List; import java.util.List;
import java.lang.StringBuilder; import java.lang.StringBuilder;
// import json
import com.google.gson.JsonArray;
import com.google.gson.JsonObject;
import com.google.gson.Gson;
import com.google.gson.GsonBuilder;
// import regex
import java.util.regex.Pattern;
import java.util.regex.Matcher;
public class NlpRunner { public class NlpRunner {
public static class ConvertToJson extends NlpBaseListener { public static class NlpJsonConverter extends NlpBaseListener {
public ConvertToJson() { public NlpJsonConverter() {
mIndent = 0; mGsonInstance = new GsonBuilder().setPrettyPrinting().create();
mRoot = new JsonObject();
mEntryIndex = 0; mSection = new JsonArray();
mEntryIndexStack = new Stack<Integer>(); mSectionStack = new Stack<JsonArray>();
mIsFirst = true; }
mIsFirstStack = new Stack<Boolean>(); /* JSON related stuff */
Gson mGsonInstance;
public void printJson() {
System.out.print(mGsonInstance.toJson(mRoot));;
} }
/* String related stuff */
private static final Pattern mRegStrCctor = Pattern.compile("\\\\[^\\r\\n]*[\\r\\n]+");
private static final Pattern mRegDoubleQuote = Pattern.compile("\\\"\\\"");
private static final Pattern mRegEscTab = Pattern.compile("\\t");
private static final Pattern mRegEscEol = Pattern.compile("\\r?\\n");
private String cutLangHead(String strl) { private String cutLangHead(String strl) {
return strl.substring("Language:".length()); return strl.substring("Language:".length());
} }
@ -24,129 +45,95 @@ public class NlpRunner {
private String cutString(String strl) { private String cutString(String strl) {
return strl.substring(1, strl.length() - 1); return strl.substring(1, strl.length() - 1);
} }
private String joinConcatedString(List<TerminalNode> ls) { private String regulateString(String strl) {
strl = mRegStrCctor.matcher(strl).replaceAll(Matcher.quoteReplacement("")); // remove string concator \\[^\r\n]*[\r\n]+
strl = mRegDoubleQuote.matcher(strl).replaceAll(Matcher.quoteReplacement("\""));// replace "" with "
strl = mRegEscTab.matcher(strl).replaceAll(Matcher.quoteReplacement("\\t")); // replace real \t to escape char
strl = mRegEscEol.matcher(strl).replaceAll(Matcher.quoteReplacement("\\n")); // replace all real \n to escape char
return strl;
}
private String processString(String strl) {
return regulateString(cutString(strl));
}
private String processConcatedString(List<String> ls) {
StringBuilder sb = new StringBuilder(); StringBuilder sb = new StringBuilder();
for (TerminalNode node : ls) { for (String node : ls) {
sb.append(cutString(node.getText())); sb.append(regulateString(cutString(node)));
} }
return sb.toString(); return sb.toString();
} }
int mEntryIndex; /* Section layout related stuff */
boolean mIsFirst;
Stack<Integer> mEntryIndexStack; JsonObject mRoot;
Stack<Boolean> mIsFirstStack; JsonArray mSection;
Stack<JsonArray> mSectionStack;
private void pushSection() { private void pushSection() {
mEntryIndexStack.push(mEntryIndex); mSectionStack.push(mSection);
mEntryIndex = 0; mSection = new JsonArray();
mIsFirstStack.push(mIsFirst);
mIsFirst = true;
} }
private void popSection() { private void popSection() {
mEntryIndex = mEntryIndexStack.pop(); mSection = mSectionStack.pop();
mIsFirst = mIsFirstStack.pop();
}
private void printComma() {
// only the first entry do not need comma
if (mIsFirst) {
mIsFirst = false;
} else {
System.out.print(',');
}
} }
int mIndent; /* Listener */
private void printIndent() {
for(int i = 0; i < mIndent; ++i) {
System.out.print('\t');
}
}
private void printEOL() {
System.out.print('\n');
}
private void printIndentLn(String strl) {
// call this when writting tail bracket
printEOL();
printIndent();
System.out.print(strl);
}
private void printIndentCommaLn(String strl) {
// call this when writting anything else.
printComma();
printEOL();
printIndent();
System.out.print(strl);
}
private void printStrEntry(String val) {
printIndentCommaLn(String.format("\"%s\": \"%s\"", mEntryIndex++, val));
}
private void printIntEntry(int val) {
printIndentCommaLn(String.format("\"%s\": %d", mEntryIndex++, val));
}
@Override @Override
public void enterDocument(NlpParser.DocumentContext ctx) { public void enterDocument(NlpParser.DocumentContext ctx) {
printIndentCommaLn("{"); // insert language prop
pushSection(); mRoot.addProperty("language", cutLangHead(ctx.LANG_HEADER().getText()));
++mIndent;
printIndentCommaLn(String.format("\"Language\": \"%s\"", cutLangHead(ctx.LANG_HEADER().getText())));
printIndentCommaLn("\"document\": {");
pushSection();
++mIndent;
} }
@Override @Override
public void exitDocument(NlpParser.DocumentContext ctx) { public void exitDocument(NlpParser.DocumentContext ctx) {
--mIndent; // insert document prop
popSection(); mRoot.add("entries", mSection);
printIndentLn("}");
--mIndent;
popSection();
printIndentLn("}");
} }
@Override @Override
public void enterSection(NlpParser.SectionContext ctx) { public void enterSection(NlpParser.SectionContext ctx) {
printIndentCommaLn(String.format("\"%s\": {", cutSectionHead(ctx.SECTION_HEAD().getText())));
pushSection(); pushSection();
++mIndent;
} }
@Override @Override
public void exitSection(NlpParser.SectionContext ctx) { public void exitSection(NlpParser.SectionContext ctx) {
--mIndent; // create new object
JsonObject objSection = new JsonObject();
objSection.addProperty("section", cutSectionHead(ctx.SECTION_HEAD().getText()));
objSection.add("entries", mSection);
// pop and insert
popSection(); popSection();
printIndentLn("}"); mSection.add(objSection);
} }
@Override @Override
public void enterSubSection(NlpParser.SubSectionContext ctx) { public void enterSubSection(NlpParser.SubSectionContext ctx) {
printIndentCommaLn(String.format("\"%s\": {", cutSectionHead(ctx.SUB_SECTION_HEAD().getText())));
pushSection(); pushSection();
++mIndent;
} }
@Override @Override
public void exitSubSection(NlpParser.SubSectionContext ctx) { public void exitSubSection(NlpParser.SubSectionContext ctx) {
--mIndent; // create new object
JsonObject objSubSection = new JsonObject();
objSubSection.addProperty("section", cutSectionHead(ctx.SUB_SECTION_HEAD().getText()));
objSubSection.add("entries", mSection);
// pop and insert
popSection(); popSection();
printIndentLn("}"); mSection.add(objSubSection);
} }
@Override @Override
public void enterEntryString(NlpParser.EntryStringContext ctx) { public void enterEntryString(NlpParser.EntryStringContext ctx) {
printStrEntry(cutString(ctx.ENTRY_STRING().getText())); mSection.add(processString(ctx.ENTRY_STRING().getText()));
} }
@Override @Override
public void enterEntryConcatedString(NlpParser.EntryConcatedStringContext ctx) { public void enterEntryConcatedString(NlpParser.EntryConcatedStringContext ctx) {
printStrEntry(joinConcatedString(ctx.ENTRY_STRING())); mSection.add(processConcatedString(
ctx.ENTRY_STRING().stream().map(value -> value.getText()).collect(Collectors.toList())
));
} }
@Override @Override
public void enterEntryInteger(NlpParser.EntryIntegerContext ctx) { public void enterEntryInteger(NlpParser.EntryIntegerContext ctx) {
printIntEntry(Integer.parseInt(ctx.ENTRY_INTEGER().getText())); mSection.add(Integer.parseInt(ctx.ENTRY_INTEGER().getText()));
} }
} }
@ -158,7 +145,9 @@ public class NlpRunner {
ParseTree tree = parser.document(); ParseTree tree = parser.document();
ParseTreeWalker walker = new ParseTreeWalker(); ParseTreeWalker walker = new ParseTreeWalker();
walker.walk(new ConvertToJson(), tree); NlpJsonConverter converter = new NlpJsonConverter();
walker.walk(converter, tree);
converter.printJson();
System.out.println(); System.out.println();
} }
} }

View File

@ -1,4 +1,4 @@
antlr4 Nlp.g4 antlr4 Nlp.g4
javac Nlp*.java javac Nlp*.java
;grun Nlp document -tree < testbench.txt ;grun Nlp document -tree < testbench.txt
java NlpRunner < ../NlpSrc/VT50.txt > result.txt java NlpRunner < ../NlpSrc/VT50.txt > result.json

View File

@ -1,71 +1,58 @@
Language:English Language:English
/* /*
----===[[[[ Virtools Language Pack File ]]]]===---- long comments
Rules:
First line must contain the string 'Language:' followed by the language name.
The file may be seen as sections, each section name is enclosed in brackets ([,])
Sections can have sub-sections, with names enclosed in brackets (<,>)
For every section or sub-section, you can have as many entries as you want,
which can be: - strings (optionaly enclosed in quotes)
- numbers
Separators for entries are ',',';' or LF (line feed)
Entries belong to the last section or sub-section specified, until
a new section is reached. The first entry of the section has an index of 0,
the next one, an index of 1, and so on.
Comments can be added using the standard ANSI C++ scheme.
Also, dont remove %s,%d and %f tags, those will be replaced at runtime by strings or numbers.
A string can take multiple lines, adding \ at the end of the line means that the entry
continues on the next line.
NOTE FOR TRANSLATORS: DO NOT CHANGE ENTRIES ORDER IN THIS FILE!!!
*/ */
[Version] // short comments
"Virtools Dev","Virtools Crea"
"Virtools Dev Evaluation","Virtools Crea Evaluation"
"Virtools Dev Education","Virtools Crea Education"
[Layout 0]
[Profiler] "entry 0"
"Profiler"
"Database","Framerate","Objects Drawn","Faces Drawn","Lines Drawn" <layout 0 0>
"Behavior Code Execution Details...","Collisions Management","Parametric Operations", "Virtools Dev1","Virtools Dev2"
"IK","Floors Management","Other Code" "Virtools Dev3"
"Virtools Dev1","Virtools Dev2",
"Virtools Dev3"
[Common] <layout 0 1>
"Virtools Dev"
"MultiSelection" [Layout 1]
// -- DONT CHANGE THIS <layout 1 0>
<layout 1 1>
<Registry> [String Escape]
"Software\\Virtools\\Global","Usage Count"
<Timebomb> <String Escape 0>
"Key1","Key2","Key3","SYSINFO.SysInfo32\\CLSID","\\csrsrv32.dll"
// -- ENDOF DONT CHANGE "foo bar"
"\\foo\tbar\n"
"foo barr "
"\\""foo""\t""bar"""
<Timebomb Messages> <String Escape 1>
"Your license has expired.\n\nYou must either stop evaluating Virtools or\nextend it by clicking the 'Extend' button and following the instructions.\n\nAlso, check out our web resources for more information:"
"- Main Web Site","- Virtools mailing list, additional resources, discussions and more."
"Customer Key:","Check Key:"
"HOWTO:\n\t- A new customer key will be generated.\n\t- Send it by e-mail to our support service at: support@Virtools.com\n"\
"\t You will receive back a valid check key according to your customer key.\n\t- Copy/Paste the key into corresponding field above.\n"\
"\t- Your license will be extended to as many days as specified in your agreement.\n\n"\
"WARNING: Once generated, the customer key is valid for 5 days only."
"foo"\ // short comments
"bar"
[3D Layout] "foo\ // short comments
"3D Layout" bar"
<Names> "foo"\ // short comments
"New 3D Frame","New 2D Frame","New Camera","New Light","New Curve","New Grid","New Material","New Texture","New Portal" "bar"\ // short comments
"bar"
<Actions>
"--- Out of range ---" "foo\ // short comments
"%s '%s' created." // on creation (ie. TargetLight 'light0000' created.) bar\ // short comments
bar"
<String Escape 2>
"foo""\\"\
"""bar"
"foo""\\\
""bar"