diff --git a/doc/site/style.css b/doc/site/style.css index 16034342..79640676 100644 --- a/doc/site/style.css +++ b/doc/site/style.css @@ -387,8 +387,8 @@ UL.menu-footer LI A:hover { } .nav-tabs > li > a, .nav-pills > li > a { - padding-right: 30px; - padding-left: 30px; + padding-right: 17px; + padding-left: 17px; border-right: 1px solid #bbb; border-radius: 0; margin: 0; @@ -403,8 +403,8 @@ UL.menu-footer LI A:hover { } .nav.nav-pills li:first-child > a { - padding-left: 29px; - padding-right: 29px; + padding-left: 28px; + padding-right: 28px; } .nav.nav-pills li:first-child > a > img { diff --git a/index.html b/index.html index 3a4fdd78..fcfc0077 100644 --- a/index.html +++ b/index.html @@ -47,6 +47,9 @@
  • How-To Guide
  • +
  • + Syntax Highlighters +
  • API Reference
  • @@ -342,64 +345,408 @@ editor.replace('bar'); //... } }); -

    Importing Themes and Languages

    -

    ACE supports the importing of .tmtheme and .tmlanguage files for use -in the editor. The task is accomplished by two simple node scripts.

    - -

    Importing Textmate/Sublime Themes

    -

    To import a .tmtheme file into ACE:

    -
      -
    1. Go to the tool folder, and run npm install to install required -dependencies.
    2. -
    3. Drop your .tmtheme file into the tmthemes folder.
    4. -
    5. Update the tmtheme.js file to include your new theme.
    6. -
    7. Run node tmtheme.js -
    8. -

    Your .tmtheme will be converted and placed into lib/ace/theme -alongside other themes. Note that there’s one more class we’ve added -that isn’t available in regular Textmate themes, and that’s for -.ace_indent-guide. This class adds indentation guides for your theme, -using a base64-encoded png. In general, the dark themes and light themes -each have their own strings, so you can just copy the class from an -equivalent theme.

    - -

    Importing Textmate/Sublime Languages

    - -

    If you’re interested in porting over an existing .tmlanguage file into -Ace’s mode syntax highlighting, there’s a tool to accomplish that, too.

    - -
      -
    1. Go to the tool folder. Run npm install to install required -dependencies.
    2. -
    3. Drop your .tmlanguage file into the tools folder.
    4. -
    5. Run node tmlanguage.js <path_to_tmlanguage_file>, such as -node tmlanguage.js MyGreatLanguage.tmlanguage.
    6. -

    Your .tmlanguage file will be converted to the best of the converter’s -ability. It is an understatement to say that the tool is imperfect. -Probably, this will never be able to be fully autogenerated. In -.tmlanguage files, for instance, one sees the use of -lookbehinds/negative lookbehinds, which JavaScript regexps simply do not -have. There’s a list of other non-determinable items, too:

    - -

    Two files are created and placed in lib/ace/mode: one for the language -mode, and one for the set of highlight rules. You will still need to add -the code into kitchen_sink.html and demo.js, as well as write any -tests for the highlighting.

    + +
    +

    Creating a Syntax Highlighter for Ace

    Creating a new syntax highlighter for Ace is extremly simple. You'll need to define two pieces of code: a new mode, and a new set of highlighting rules.

    +

    Where to Start

    +

    We recommend using the the Ace Mode Creator when defining your highlighter. This allows you to inspect your code's tokens, as well as providing a live preview of the syntax highlighter in action.

    +

    Defining a Mode

    +

    Every language needs a mode. A mode contains the paths to a language's syntax highlighting rules, indentation rules, and code folding rules. Without defining a mode, Ace won't know anything about the finer aspects of your language.

    +

    Here is the starter template we'll use to create a new mode:

    +
    define(function(require, exports, module) {
    +"use strict";
    +
    +var oop = require("../lib/oop");
    +// defines the parent mode
    +var TextMode = require("./text").Mode;
    +var Tokenizer = require("../tokenizer").Tokenizer;
    +var MatchingBraceOutdent = require("./matching_brace_outdent").MatchingBraceOutdent;
    +
    +// defines the language specific highlighters and folding rules
    +var MyNewHighlightRules = require("./mynew_highlight_rules").MyNewHighlightRules;
    +var MyNewFoldMode = require("./folding/mynew").MyNewFoldMode;
    +
    +var Mode = function() {
    +    // set everything up
    +    var highlighter = new MyNewHighlightRules();
    +    this.$outdent = new MatchingBraceOutdent();
    +    this.foldingRules = new MyNewFoldMode();
    +
    +    this.$tokenizer = new Tokenizer(highlighter.getRules());
    +};
    +oop.inherits(Mode, TextMode);
    +
    +(function() {
    +    // Extra logic goes here--we won't be covering all of this
    +
    +    /* These are all optional pieces of code!
    +    this.getNextLineIndent = function(state, line, tab) {
    +        var indent = this.$getIndent(line);
    +        return indent;
    +    };
    +
    +    this.checkOutdent = function(state, line, input) {
    +        return this.$outdent.checkOutdent(line, input);
    +    };
    +
    +    this.autoOutdent = function(state, doc, row) {
    +        this.$outdent.autoOutdent(doc, row);
    +    };
    +
    +    this.createWorker = function(session) {
    +        var worker = new WorkerClient(["ace"], "ace/mode/mynew_worker", "NewWorker");
    +        worker.attachToDocument(session.getDocument());
    +
    +        return worker;
    +    };
    +    */
    +}).call(Mode.prototype);
    +
    +exports.Mode = Mode;
    +});
    +

    What's going on here? First, you're defining the path to TextMode (more on this later). Then you're pointing the mode to your definitions for the highlighting rules, as well as your rules for code folding. Finally, you're setting everything up to find those rules, and exporting the Mode so that it can be consumed. That's it!

    +

    Regarding TextMode, you'll notice that it's only being used once: oop.inherits(Mode, TextMode);. If your new language depends on the rules of another language, you can choose to inherit the same rules, while expanding on it with your language's own requirements. For example, PHP inherits from HTML, since it can be embedded directly inside .html pages. You can either inherit from TextMode, or any other existing mode, if it already relates to your language.

    +

    All Ace modes can be found in the lib/ace/mode folder.

    +

    Defining Syntax Highlighting Rules

    +

    The Ace highlighter can be considered to be a state machine. Regular expressions define the tokens for the current state, as well as the transitions into another state. Let's define mynew_highlight_rules.js, which our mode above uses.

    +

    All syntax highlighters start off looking something like this:

    +
    define(function(require, exports, module) {
    +"use strict";
    +
    +var oop = require("../lib/oop");
    +var TextHighlightRules = require("./text_highlight_rules").TextHighlightRules;
    +
    +var MyNewHighlightRules = function() {
    +
    +    // regexp must not have capturing parentheses. Use (?:) instead.
    +    // regexps are ordered -> the first match is used
    +   this.$rules = {
    +        "start" : [
    +            {
    +                token: <token>, // String, Array, or Function: the CSS token to apply
    +                regex: <regex>, // String or RegExp: the regexp to match
    +                next:  <next>   // [Optional] String: next state to enter
    +            }
    +        ]
    +    };
    +};
    +
    +oop.inherits(MyNewHighlightRules, TextHighlightRules);
    +
    +exports.MyNewHighlightRules = MyNewHighlightRules;
    +
    +});
    +

    The token state machine operates on whatever is defined in this.$rules. The highlighter always begins at the start state, and progresses down the list, looking for a matching regex. When one is found, the resulting text is wrapped within a <span class="ace_<token>"> tag, where <token> is defined as the token property. Note that all tokens are preceded by the ace_ prefix when they're rendered on the page.

    +

    Once again, we're inheriting from TextHighlightRules here. We could choose to make this any other language set we want, if our new language requires previously defined syntaxes. For more information on extending languages, see "extending Highlighters" below.

    +

    Defining Tokens

    +

    The Ace highlighting system is heavily inspired by the TextMate language grammar. Most tokens will follow the conventions of TextMate when naming grammars. A thorough (albeit incomplete) list of tokens can be found on the Ace Wiki.

    +

    For the complete list of tokens, see tool/tmtheme.js. It is possible to add new token names, but the scope of that knowledge is outside of this document.

    +

    Multiple tokens can be applied to the same text by adding dots in the token, e.g. token: support.function wraps the text in a <span class="ace_support ace_function"> tag.

    +

    Defining Regular Expressions

    +

    Regular expressions can either be a RegExp or String definition

    +

    If you're using a regular expression, remember to start and end the line with the / character, like this:

    +
    {
    +    token : "constant.language.escape",
    +    regex : /\$[\w\d]+/
    +}
    +

    A caveat of using stringed regular expressions is that any \ character must be escaped. That means that even an innocuous regular expression like this:

    +
    regex: "function\s*\(\w+\)"
    +

    Must actually be written like this:

    +
    regex: "function\\s*\(\\w+\)"
    +

    Groupings

    +

    You can also include flat regexps--(var)--or have matching groups--((a+)(b+)). There is a strict requirement whereby matching groups must cover the entire matched string; thus, (hel)lo is invalid. If you want to create a non-matching group, simply start the group with the ?: predicate; thus, (hel)(?:lo) is okay. You can, of course, create longer non-matching groups. For example:

    +
    {
    +    token : "constant.language.boolean",
    +    regex : /(?:true|false)\b/
    +},
    +

    For flat regular expression matches, token can be a String, or a Function that takes a single argument (the match) and returns a string token. For example, using a function might look like this:

    +
    var colors = lang.arrayToMap(
    +    ("aqua|black|blue|fuchsia|gray|green|lime|maroon|navy|olive|orange|" +
    +    "purple|red|silver|teal|white|yellow").split("|")
    +);
    +
    +var fonts = lang.arrayToMap(
    +    ("arial|century|comic|courier|garamond|georgia|helvetica|impact|lucida|" +
    +    "symbol|system|tahoma|times|trebuchet|utopia|verdana|webdings|sans-serif|" +
    +    "serif|monospace").split("|")
    +);
    +
    +...
    +
    +{
    +    token: function(value) {
    +        if (colors.hasOwnProperty(value.toLowerCase())) {
    +            return "support.constant.color";
    +        }
    +        else if (fonts.hasOwnProperty(value.toLowerCase())) {
    +            return "support.constant.fonts";
    +        }
    +        else {
    +            return "text";
    +        }
    +    },
    +    regex: "\\-?[a-zA-Z_][a-zA-Z0-9_\\-]*"
    +}
    +

    If token is a function,it should take the same number of arguments as there are groups, and return an array of tokens.

    +

    For grouped regular expressions, token can be a String, in which case all matched groups are given that same token, like this:

    +
    {
    +    token: "identifier",
    +    regex: "(\\w+\\s*:)(\\w*)"
    +}
    +

    More commonly, though, token is an Array (of the same length as the number of groups), whereby matches are given the token of the same alignment as in the match. For a complicated regular expression, like defining a function, that might look something like this:

    +
    {
    +    token : ["storage.type", "text", "entity.name.function"],
    +    regex : "(function)(\\s+)([a-zA-Z_][a-zA-Z0-9_]*\\b)"
    +}
    +

    Defining States

    +

    The syntax highlighting state machine stays in the start state, until you define a next state for it to advance to. At that point, the tokenizer stays in that new state, until it advances to another state. Afterwards, you should return to the original start state.

    +

    Here's an example:

    +
    this.$rules = {
    +    "start" : [ {
    +        token : "text",
    +        merge : true,
    +        regex : "<\\!\\[CDATA\\[",
    +        next : "cdata"
    +    },
    +
    +    "cdata" : [ {
    +        token : "text",
    +        regex : "\\]\\]>",
    +        next : "start"
    +    }, {
    +        token : "text",
    +        merge : true,
    +        regex : "\\s+"
    +    }, {
    +        token : "text",
    +        merge : true,
    +        regex : ".+"
    +    } ]
    +};
    +

    In this extremly short sample, we're defining some highlighting rules for when Ace detectes a <![CDATA tag. When one is encountered, the tokenizer moves from start into the cdata state. It remains there, applying the text token to any string it encounters. Finally, when it hits a closing ]> symbol, it returns to the start state and continues to tokenize anything else.

    + +

    Using the TMLanguage Tool

    +

    There is a tool that +will take an existing tmlanguage file and do its best to convert it into Javascript for Ace to consume. Here's what you need to get started:

    +
      +
    1. In the Ace repository, navigate to the tools folder.
    2. +
    3. Run npm install to install required dependencies.
    4. +
    5. Run node tmlanguage.js <path_to_tmlanguage_file>; for example, node <path_to_tmlanguage_file> /Users/Elrond/elven.tmLanguage
    6. +
    +

    Two files are created and placed in lib/ace/mode: one for the language mode, and one for the set of highlight rules. You will still need to add the code into kitchen_sink.html and demo.js, as well as write any tests for the highlighting.

    +

    A Note on Accuracy

    +

    Your .tmlanguage file will then be converted to the best of the converter’s ability. It is an understatement to say that the tool is imperfect. Probably, language mode creation will never be able to be fully autogenerated. There's a list of non-determinable items; for example:

    + +

    However, the tool is an excellent way to get a quick start, if you already possess a tmlanguage file for you language.

    + +

    Extending Highlighters

    + +

    Suppose you're working on a LuaPage, PHP embedded in HTML, or a Django template. You'll need to create a syntax highlighter that takes all the rules from the original language (Lua, PHP, or Python) and extends it with some additional identifiers (<?lua, <?php, {%, for example). Ace allows you to easily extend a highlighter using a few helper functions.

    +

    Getting Existing Rules

    +

    To get the existing syntax highlighting rules for a particular language, use the getRules() function. For example:

    +
    var HtmlHighlightRules = require("./html_highlight_rules").HtmlHighlightRules;
    +
    +this.$rules = new HtmlHighlightRules().getRules();
    +
    +/*
    +    this.$rules == Same this.$rules as HTML highlighting
    +*/
    +

    Extending a Highlighter

    +

    The addRules method does one thing, and it does one thing well: it adds new rules to an existing rule set, and prefixes any state with a given tag. For example, let's say you've got two sets of rules, defined like this:

    +
    this.$rules = {
    +    "start": [ /* ... */ ]
    +};
    +
    +var newRules = {
    +    "start": [ /* ... */ ]
    +}
    +

    If you want to incorporate newRules into this.$rules, you'd do something like this:

    +
    this.addRules(newRules, "new-");
    +
    +/*
    +    this.$rules = {
    +        "start": [ ... ],
    +        "new-start": [ ... ]
    +    };
    +*/
    +

    Extending Two Highlighters

    +

    The last function available to you combines both of these concepts, and it's called embedRules. It takes three parameters:

    +
      +
    1. An existing rule set to embed with
    2. +
    3. A prefix to apply for each state in the existing rule set
    4. +
    5. A set of new states to add
    6. +
    +

    Like addRules, embedRules adds on to the existing this.$rules object.

    +

    To explain this visually, let's take a look at the syntax highlighter for Lua pages, which combines all of these concepts:

    +
    var HtmlHighlightRules = require("./html_highlight_rules").HtmlHighlightRules;
    +var LuaHighlightRules = require("./lua_highlight_rules").LuaHighlightRules;
    +
    +var LuaPageHighlightRules = function() {
    +    this.$rules = new HtmlHighlightRules().getRules();
    +
    +    for (var i in this.$rules) {
    +        this.$rules[i].unshift({
    +            token: "keyword",
    +            regex: "<\\%\\=?",
    +            next: "lua-start"
    +        }, {
    +            token: "keyword",
    +            regex: "<\\?lua\\=?",
    +            next: "lua-start"
    +        });
    +    }
    +    this.embedRules(LuaHighlightRules, "lua-", [
    +        {
    +            token: "keyword",
    +            regex: "\\%>",
    +            next: "start"
    +        },
    +        {
    +            token: "keyword",
    +            regex: "\\?>",
    +            next: "start"
    +        }
    +    ]);
    +};
    +

    Here, this.$rules starts off as a set of HTML highlighting rules. To this set, we add two new checks for <%= and <?lua=. We also delegate that if one of these rules are matched, we should move onto the lua-start state. Next, embedRules takes the already existing set of LuaHighlightRules and applies the lua- prefix to each state there. Finally, it adds two new checks for %> and ?>, allowing the state machine to return to start.

    + +

    Code Folding

    + +

    Adding new folding rules to your mode can be a little tricky. First, insert the following lines of code into your mode definition:

    +
    var MyFoldMode = require("./folding/newrules").FoldMode;
    +
    +...
    +var MyMode = function() {
    +
    +    ...
    +
    +    this.foldingRules = new MyFoldMode();
    +};
    +

    You'll be defining your code folding rules into the lib/ace/mode/folding folder. Here's a template that you can use to get started:

    +
    define(function(require, exports, module) {
    +"use strict";
    +
    +var oop = require("../../lib/oop");
    +var Range = require("../../range").Range;
    +var BaseFoldMode = require("./fold_mode").FoldMode;
    +
    +var FoldMode = exports.FoldMode = function() {};
    +oop.inherits(FoldMode, BaseFoldMode);
    +
    +(function() {
    +
    +    // regular expressions that identify starting and stopping points
    +    this.foldingStartMarker; 
    +    this.foldingStopMarker;
    +
    +    this.getFoldWidgetRange = function(session, foldStyle, row) {
    +        var line = session.getLine(row);
    +
    +        // test each line, and return a range of segments to collapse
    +    };
    +
    +}).call(FoldMode.prototype);
    +
    +});
    +

    Just like with TextMode for syntax highlighting, BaseFoldMode contains the starting point for code folding logic. foldingStartMarker defines your opening folding point, while foldingStopMarker defines the stopping point. For example, for a C-style folding system, these values might look like this:

    +
    this.foldingStartMarker = /(\{|\[)[^\}\]]*$|^\s*(\/\*)/;
    +this.foldingStopMarker = /^[^\[\{]*(\}|\])|^[\s\*]*(\*\/)/;
    +

    These regular expressions identify various symbols--{, [, //--to pay attention to. getFoldWidgetRange matches on these regular expressions, and when found, returns the range of relevant folding points. For more information on the Range object, see the Ace API documentation.

    +

    Again, for a C-style folding mechanism, a range to return for the starting fold might look like this:

    +
    var line = session.getLine(row);
    +var match = line.match(this.foldingStartMarker);
    +if (match) {
    +    var i = match.index;
    +
    +    if (match[1])
    +        return this.openingBracketBlock(session, match[1], row, i);
    +
    +    var range = session.getCommentFoldRange(row, i + match[0].length);
    +    range.end.column -= 2;
    +    return range;
    +}
    +

    Let's say we stumble across the code block hello_world() {. Our range object here becomes:

    +
    {
    +  startRow: 0,
    +  endRow: 0,
    +  startColumn: 0,
    +  endColumn: 13
    +}
    + +

    Testing Your Highlighter

    + +

    The best way to test your tokenizer is to see it live, right? To do that, you'll want to modify the live Ace demo to preview your changes. You can find this file in the root Ace directory with the name kitchen-sink.html.

    +

    The file that defines the behavior for this live demo is defined in demo/kitchen-sink/demo.js. You'll want to add lines to two separate objects:

    +
      +
    1. modesByName needs a new entry that defines all the rules regarding your new mode. Entries looks like propertyName: [dropdownName, arrayOfExtensions], where:

      +
        +
      • propertyName is the name of the new language you're highlighting
      • +
      • dropdownName is an arbitrary string that lists your language in the live demo's Mode dropdown menu
      • +
      • arrayOfExtensions is an array of strings (seperated by |) that defines valid extensions to use for the new language.
      • +
      +
    2. +
    3. docs also needs a new entry, which defines the location of your sample document showing all the power of your new language. Entries look like filenamePath: modeToUse, where:

      +
        +
      • filenamePath is the path to your example document. This should just be in docs/.
      • +
      • modeToUse is the same arbitrary string as dropdownName
      • +
      +
    4. +
    +

    Once you set this up, you should see be able to witness a live demonstration of your new highlighter.

    +

    Adding Automated Tests

    +

    It's also suggested that you go one step further and define some automated tests to test your syntax highlighter. A basic test looks something like this:

    +
    if (typeof process !== "undefined") {
    +    require("amd-loader");
    +}
    +
    +define(function(require, exports, module) {
    +"use strict";
    +
    +var MyNewLanguage = require("./mynewlanguage").Mode;
    +var assert = require("../test/assertions");
    +
    +module.exports = {
    +
    +    name: "MyNewLanguage Tokenizer",
    +
    +    setUp : function() {
    +        this.tokenizer = new MyNewLanguage().getTokenizer();
    +    },
    +
    +    "test: my random description" : function() {
    +        var line = "-12px";
    +        var tokens = this.tokenizer.getLineTokens(line, "ruleset").tokens;
    +
    +        assert.equal(2, tokens.length);
    +        assert.equal("constant.numeric", tokens[0].type);
    +    },
    +
    +    "test: tokenize more than one thing" : function() {
    +        var tokens = this.tokenizer.getLineTokens("{()}", "start").tokens;
    +
    +        assert.equal(3, tokens.length);
    +        assert.equal("paren.lparen", tokens[0].type);
    +        assert.equal("text", tokens[1].type);
    +        assert.equal("paren.rparen", tokens[2].type);
    +    },
    +};
    +
    +});
    +
    +if (typeof module !== "undefined" && module === require.main) {
    +    require("asyncjs").test.testcase(module.exports).exec()
    +}
    +

    All tests contain a string describing what the test is doing. Then, you define an arbitrary line that you want your tokenizer to check. It's recommended that you test both the number of tokens found, as well as the values of those tokens.

    +

    Any file ending with the _test.js suffix are automatically run by Ace's Travis CI server.

    + +