Transform a JSON grammar into a CodeMirror syntax-highlight parser
A simple and light-weight (~ 37kB minified, ~ 13kB zipped) CodeMirror add-on
to generate syntax-highlight parsers (codemirror modes) from a grammar specification in JSON format.
See also: ace-grammar, prism-grammar, syntaxhighlighter-grammar
Note: The invariant codebase for all the *-grammar add-ons resides in the editor-grammar repository (used as a git submodule).
###Contents
###Todo
Code Indentation is Codemirror default, see Modularity and Future Directions
- handle arbitrary, user-defined, code `(de-)indentation` in the `grammar` specification (e.g. via `indent action` tokens)
- handle arbitrary, user-defined, code `matching` (e.g. `brackets`, `tags`, etc.) in the `grammar` specification (e.g. via `match action` tokens)
- handle arbitrary, user-defined, `(operator) precedence` relations in the `grammar` specification (e.g. via `precedence action` tokens)
- handle arbitrary, user-defined, `local/global/scoped` relations in the `grammar` specification (e.g. via `scope action` tokens)
- and so on..
- enable grammar add-on to pre-compile a grammar specification directly into mode source code, so it can be used without the add-on as standalone mode [TODO, maybe]
###Features
- A `Grammar` can extend other `Grammars` (so arbitrary `variations` and `dialects` can be handled more easily)
- `Grammar` includes: `Style Model`, `Lex Model` and `Syntax Model` (optional), plus a couple of settings (see examples)
- `Grammar` specification can be minimal, defaults will be used (see example grammars)
- `Grammar.Syntax Model` can enable highlight in a more context-specific way, plus detect possible syntax errors and display appropriate error messages (see below)
- `Grammar.Syntax Model` can contain recursive references (see `/test/grammar-js-recursion.html`)
- `Grammar.Syntax Model` can be (fully) specified using `PEG`-like notation or `BNF`-like notation (NEW feature)
- `Grammar` can define action tokens to perform complex context-specific parsing functionality, including associated tag matching and duplicate identifiers (see for example the `xml.grammar` example) (NEW feature)
- Generated highlight modes can support toggle comments and keyword autocompletion functionality if defined in the grammar
- Generated highlight modes can support lint-like syntax-annotation functionality generated from the grammar
- Generated highlight modes can support custom, user-defined, code folding functionality from the grammar `fold` model (NEW feature)
- Generated parsers are optimized for speed and size
- Can generate a syntax-highlight parser from a grammar interactively and on-the-fly ( see example, http://foo123.github.io/examples/codemirror-grammar )
- see also Modularity and Future Directions
###How to use:
See working examples under /test folder.
An example for XML:
// 1. A partial XML grammar, written as a plain JSON-style object literal
var xml_grammar = {

    // Strings in the grammar that start with this prefix are regular expressions
    "RegExpID": "RE::",

    "Extra": {
        "fold": "xml"
        //"electricChars" : "<"
    },

    // Style model: associates each token name with a style name
    "Style": {
        "comment": "comment",
        "declaration": "tag",
        "doctype": "meta",
        "meta": "meta",
        "cdata": "atom",
        "tag": "tag",
        "attribute": "attribute",
        "string": "string",
        "atom": "atom",
        "number": "number",
        "error": "error"
    },

    // Lexical model: the tokens, followed by action and error tokens
    "Lex": {
        "comment:comment": ["<!--", "-->"],
        "declaration:block": ["<?xml", "?>"],
        "doctype:block": ["RE::/<!doctype\\b/i", ">"],
        "meta:block": ["RE::/<\\?[_a-zA-Z][\\w\\._\\-]*/", "?>"],
        "cdata:block": ["<![CDATA[", "]]>"],
        "open_tag": "RE::/<([_a-zA-Z][_a-zA-Z0-9\\-]*)/",
        "close_tag": "RE::/<\\/([_a-zA-Z][_a-zA-Z0-9\\-]*)>/",
        "attribute": "RE::/[_a-zA-Z][_a-zA-Z0-9\\-]*/",
        "string:line-block": [["\""], ["'"]],
        "number": ["RE::/[0-9]\\d*/", "RE::/#[0-9a-fA-F]+/"],
        "atom": ["RE::/&#x[a-fA-F\\d]+;/", "RE::/&#[\\d]+;/", "RE::/&[a-zA-Z][a-zA-Z0-9]*;/"],
        "text": "RE::/[^<&]+/",

        // action tokens
        "tag_ctx:action": {"context": true},
        "\\tag_ctx:action": {"context": false},
        "unique_id:action": {
            "unique": ["xml", "$1"],
            "msg": "Duplicate id value \"$0\""
        },
        "unique_att:action": {
            "unique": ["tag", "$0"],
            "msg": "Duplicate attribute \"$0\"",
            "in-context": true
        },
        "tag_opened:action": {"push": "<$1>", "ci": true},
        "tag_closed:action": {
            "pop": "<$1>",
            "ci": true,
            "msg": "Tags \"$0\" and \"$1\" do not match"
        },
        "tag_autoclosed:action": {"pop": null},
        "out_of_place:error": "\"$2$3\" can only be at the beginning of XML document"
    },

    // Syntax model (optional): rules composed from the tokens and actions above
    "Syntax": {
        "tag_att": "'id'.attribute unique_att '=' string unique_id | attribute unique_att '=' (string | number)",
        "start_tag": "open_tag.tag tag_ctx tag_opened tag_att* ('>'.tag | '/>'.tag tag_autoclosed) \\tag_ctx",
        "end_tag": "close_tag.tag tag_closed",
        "xml": "(^^1 declaration? doctype?) (declaration.error out_of_place | doctype.error out_of_place | comment | meta | cdata | start_tag | end_tag | atom | text)*"
    },

    // Which rules to parse, and in what order
    "Parser": [["xml"]]
};
// 2. Build a CodeMirror syntax-highlight mode from the grammar
var xml_mode = CodeMirrorGrammar.getMode(xml_grammar);

// 3. Register the generated mode with CodeMirror under the name "xml"
CodeMirror.defineMode("xml", xml_mode);

// Turn on the user-defined code folding from the specification (new feature)
xml_mode.supportCodeFolding = true;
CodeMirror.registerHelper("fold", xml_mode.foldType, xml_mode.folder);

// Turn on lint-like syntax validation generated from the grammar
xml_mode.supportGrammarAnnotations = true;
CodeMirror.registerHelper("lint", "xml", xml_mode.validator);

// Turn on user-defined autocompletion (if defined) and expose it as a
// named command, which the editor's key map below binds to Ctrl-Space
xml_mode.supportAutoCompletion = true;
CodeMirror.commands.my_autocompletion = function (cm) {
    CodeMirror.showHint(cm, xml_mode.autocompleter, {
        prefixMatch: true,
        caseInsensitiveMatch: false
    });
};
// Setting the options on the autocompleter itself also works
// (takes priority if set)
xml_mode.autocompleter.options = {
    prefixMatch: true,
    caseInsensitiveMatch: false
};

// Create the editor on the textarea with id "code", using the "xml" mode
var editor = CodeMirror.fromTextArea(document.getElementById("code"), {
    mode: "xml",
    lineNumbers: true,
    indentUnit: 4,
    indentWithTabs: false,
    lint: true, // enable lint validation
    extraKeys: {
        "Ctrl-Space": "my_autocompletion",
        "Ctrl-L": "toggleComment"
    },
    foldGutter: true,
    gutters: [
        "CodeMirror-lint-markers",
        "CodeMirror-linenumbers",
        "CodeMirror-foldgutter"
    ]
});
Result:
###Other Examples: