TiddlyWiki5/js/WikiTextParser.js

/*\
title: js/WikiTextParser.js

Parses a block of tiddlywiki-format wiki text into a parse tree object.

\*/
(function(){

/*jslint node: true */
"use strict";

var WikiTextRules = require("./WikiTextRules.js"),
	WikiTextParseTree = require("./WikiTextParseTree.js").WikiTextParseTree,
	utils = require("./Utils.js"),
	util = require("util");

/*
Creates a new instance of the wiki text parser with the specified options. The
options are a hashmap of mandatory members as follows:

	store: The store object to use to parse any cascaded content (eg transclusion)

Planned:

	enableRules: An array of names of wiki text rules to enable. If not specified, all rules are available
	extraRules: An array of additional rule handlers to add
	enableMacros: An array of names of macros to enable. If not specified, all macros are available
	extraMacros: An array of additional macro handlers to add
*/

var WikiTextParser = function(options) {
	// The store is kept so that cascaded content (eg transclusion) can be parsed
	this.store = options.store;
	this.autoLinkWikiWords = true;
	this.rules = WikiTextRules.rules;
	// Wrap each rule's match expression in its own capture group and join the groups as
	// alternatives; the position of the group that matched is later used to pick the rule
	var alternatives = this.rules.map(function(rule) {
		return "(" + rule.match + ")";
	});
	this.rulesRegExp = new RegExp(alternatives.join("|"),"mg");
};

/*
Parses the given wiki text and returns a WikiTextParseTree constructed from the resulting
child nodes, the dependencies accumulated during parsing, and the store
*/
WikiTextParser.prototype.parse = function(text) {
	// Reset the per-parse state
	this.output = null;
	this.dependencies = [];
	this.children = [];
	this.nextMatch = 0;
	this.source = text;
	// Wikify from the start of the source into the top level array of children
	this.subWikify(this.children);
	var parseTree = new WikiTextParseTree(this.children,this.dependencies,this.store);
	// Release the temporary references to the source text and the child nodes
	this.children = null;
	this.source = null;
	return parseTree;
};

/*
Records a dependency. Passing null replaces the dependency list with null, and while the
list is null any further dependencies are ignored. Otherwise the dependency is appended
to the list unless it is already present
*/
WikiTextParser.prototype.addDependency = function(dependency) {
	if(dependency === null) {
		this.dependencies = null;
		return;
	}
	var known = this.dependencies;
	if(!known) {
		return;
	}
	if(known.indexOf(dependency) === -1) {
		known.push(dependency);
	}
};

/*
Appends a text node to the array `place` containing the source text from startPos up to
(but not including) endPos. Nothing is appended unless startPos is less than endPos
*/
WikiTextParser.prototype.outputText = function(place,startPos,endPos) {
	if(!(startPos < endPos)) {
		return;
	}
	var textNode = {
		type: "text",
		value: this.source.substring(startPos,endPos)
	};
	place.push(textNode);
};

/*
Wikifies the source from the current position into the array `output`. When `terminator`
(the source string of a regular expression) is supplied, the work is delegated to
subWikifyTerm with a RegExp built from it; otherwise it is delegated to subWikifyUnterm
*/
WikiTextParser.prototype.subWikify = function(output,terminator) {
	// The terminated and unterminated cases are handled separately because doing so
	// speeds up wikification by about 30%
	if(!terminator) {
		this.subWikifyUnterm(output);
		return;
	}
	var terminatorRegExp = new RegExp("(" + terminator + ")","mg");
	this.subWikifyTerm(output,terminatorRegExp);
};

/*
Wikifies the source from the current position (this.nextMatch) to the end of the source,
pushing nodes into the array `output`. Text between rule matches is emitted via
outputText; each rule match is passed to the handler of the rule whose capture group
matched. On return this.output is restored to the value it had on entry
*/
WikiTextParser.prototype.subWikifyUnterm = function(output) {
	// Handlers may call subWikify again, so remember the caller's output array
	var savedOutput = this.output,
		found,
		groupIndex,
		sourceLength;
	this.output = output;
	// Start searching for rule matches at the current position
	this.rulesRegExp.lastIndex = this.nextMatch;
	for(found = this.rulesRegExp.exec(this.source); found; found = this.rulesRegExp.exec(this.source)) {
		// Emit the plain text lying between the previous position and this match
		if(found.index > this.nextMatch) {
			this.outputText(this.output,this.nextMatch,found.index);
		}
		// Publish the details of the match for the handler to read
		this.matchText = found[0];
		this.matchStart = found.index;
		this.matchLength = found[0].length;
		this.nextMatch = this.rulesRegExp.lastIndex;
		// Capture group N belongs to rule N-1; find the first group that captured something
		groupIndex = 1;
		while(groupIndex < found.length && !found[groupIndex]) {
			groupIndex++;
		}
		if(groupIndex < found.length) {
			this.rules[groupIndex - 1].handler(this);
			// Resume searching from wherever the handler left nextMatch
			this.rulesRegExp.lastIndex = this.nextMatch;
		}
	}
	// Emit whatever text remains after the final match
	sourceLength = this.source.length;
	if(this.nextMatch < sourceLength) {
		this.outputText(this.output,this.nextMatch,sourceLength);
		this.nextMatch = sourceLength;
	}
	// Hand the output pointer back to the caller
	this.output = savedOutput;
};

/*
Wikifies the source from the current position (this.nextMatch) into the array `output`
until the terminator is matched or the source is exhausted.

	output: The array that receives the parsed nodes
	terminatorRegExp: A global RegExp whose first capture group is the terminator text

Rules are only searched for in the text preceding the next terminator match. When the
terminator is reached, matchText, matchLength and matchStart describe the terminator and
nextMatch is positioned just after it. If the terminator is never found the remainder of
the source is emitted as text. In both cases this.output is restored before returning
*/
WikiTextParser.prototype.subWikifyTerm = function(output,terminatorRegExp) {
	// subWikify can be indirectly recursive, so we need to save the old output pointer
	var oldOutput = this.output,
		terminatorMatch,
		ruleMatch,
		t;
	this.output = output;
	// Get the first matches for the rule and terminator RegExps
	terminatorRegExp.lastIndex = this.nextMatch;
	terminatorMatch = terminatorRegExp.exec(this.source);
	this.rulesRegExp.lastIndex = this.nextMatch;
	// The rule search is restricted to the text before the terminator (substring is used
	// in place of the legacy substr; with a start of 0 the two are equivalent)
	ruleMatch = this.rulesRegExp.exec(terminatorMatch ? this.source.substring(0,terminatorMatch.index) : this.source);
	while(terminatorMatch || ruleMatch) {
		// Check for a terminator match before the next rule match
		if(terminatorMatch && (!ruleMatch || terminatorMatch.index <= ruleMatch.index)) {
			// Output any text before the match
			if(terminatorMatch.index > this.nextMatch) {
				this.outputText(this.output,this.nextMatch,terminatorMatch.index);
			}
			// Set the match parameters
			this.matchText = terminatorMatch[1];
			this.matchLength = terminatorMatch[1].length;
			this.matchStart = terminatorMatch.index;
			this.nextMatch = this.matchStart + this.matchLength;
			// Restore the output pointer
			this.output = oldOutput;
			return;
		}
		// It must be a rule match; output any text before the match
		if(ruleMatch.index > this.nextMatch) {
			this.outputText(this.output,this.nextMatch,ruleMatch.index);
		}
		// Set the match parameters
		this.matchStart = ruleMatch.index;
		this.matchLength = ruleMatch[0].length;
		this.matchText = ruleMatch[0];
		this.nextMatch = this.rulesRegExp.lastIndex;
		// Figure out which rule matched and call its handler (capture group t belongs to rule t-1)
		for(t=1; t<ruleMatch.length; t++) {
			if(ruleMatch[t]) {
				this.rules[t-1].handler(this);
				// Resume the rule search from wherever the handler left nextMatch
				this.rulesRegExp.lastIndex = this.nextMatch;
				break;
			}
		}
		// Get the next match
		terminatorRegExp.lastIndex = this.nextMatch;
		terminatorMatch = terminatorRegExp.exec(this.source);
		ruleMatch = this.rulesRegExp.exec(terminatorMatch ? this.source.substring(0,terminatorMatch.index) : this.source);
	}
	// Output any text after the last match
	if(this.nextMatch < this.source.length) {
		this.outputText(this.output,this.nextMatch,this.source.length);
		this.nextMatch = this.source.length;
	}
	// Restore the output pointer
	this.output = oldOutput;
};

// Expose the parser constructor as a property of this module's exports
exports.WikiTextParser = WikiTextParser;

})();
Experimental support for client-side builds These changes allow tiddlywiki.js to cook its own components into a skeletal new-school client-side TiddlyWiki. 2011-12-13 12:30:09 +00:00			`/*\`
			`title: js/WikiTextParser.js`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00
			`Parses a block of tiddlywiki-format wiki text into a parse tree object.`

Experimental support for client-side builds These changes allow tiddlywiki.js to cook its own components into a skeletal new-school client-side TiddlyWiki. 2011-12-13 12:30:09 +00:00			`\*/`
			`(function(){`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00
Lots of JSHint induced tweaks Still not spotless 2011-12-09 16:34:02 +00:00			`/*jslint node: true */`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`"use strict";`

Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`var WikiTextRules = require("./WikiTextRules.js"),`
			`WikiTextParseTree = require("./WikiTextParseTree.js").WikiTextParseTree,`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`utils = require("./Utils.js"),`
			`util = require("util");`

Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`/*`
			`Creates a new instance of the wiki text parser with the specified options. The`
			`options are a hashmap of mandatory members as follows:`

			`store: The store object to use to parse any cascaded content (eg transclusion)`

			`Planned:`

			`enableRules: An array of names of wiki text rules to enable. If not specified, all rules are available`
			`extraRules: An array of additional rule handlers to add`
			`enableMacros: An array of names of macros to enable. If not specified, all macros are available`
			`extraMacros: An array of additional macro handlers to add`
			`*/`

			`var WikiTextParser = function(options) {`
			`this.store = options.store;`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`this.autoLinkWikiWords = true;`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`this.rules = WikiTextRules.rules;`
			`var pattern = [];`
			`for(var n=0; n<this.rules.length; n++) {`
			`pattern.push("(" + this.rules[n].match + ")");`
			`}`
			`this.rulesRegExp = new RegExp(pattern.join("|"),"mg");`

			`};`

			`WikiTextParser.prototype.parse = function(text) {`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`this.source = text;`
			`this.nextMatch = 0;`
Major refactoring of how wiki text parsing and rendering is packaged 2011-12-11 18:28:09 +00:00			`this.children = [];`
Added tracking of dependencies between tiddlers 2012-01-06 19:41:42 +00:00			`this.dependencies = [];`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`this.output = null;`
Major refactoring of how wiki text parsing and rendering is packaged 2011-12-11 18:28:09 +00:00			`this.subWikify(this.children);`
Cleared some temporary variables after use To reduce memory consumption 2012-01-08 10:24:09 +00:00			`var tree = new WikiTextParseTree(this.children,this.dependencies,this.store);`
			`this.source = null;`
			`this.children = null;`
			`return tree;`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`};`

Take links into account when accumulating dependencies 2012-01-07 10:30:50 +00:00			`WikiTextParser.prototype.addDependency = function(dependency) {`
			`if(dependency === null) {`
			`this.dependencies = null;`
			`} else if(this.dependencies && this.dependencies.indexOf(dependency) === -1) {`
			`this.dependencies.push(dependency);`
			`}`
			`};`

Added basic support for HTML rendering 2011-12-05 18:21:52 +00:00			`WikiTextParser.prototype.outputText = function(place,startPos,endPos) {`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`if(startPos < endPos) {`
			`place.push({type: "text", value: this.source.substring(startPos,endPos)});`
			`}`
			`};`

Added basic support for HTML rendering 2011-12-05 18:21:52 +00:00			`WikiTextParser.prototype.subWikify = function(output,terminator) {`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`// Handle the terminated and unterminated cases separately, this speeds up wikifikation by about 30%`
			`if(terminator)`
			`this.subWikifyTerm(output,new RegExp("(" + terminator + ")","mg"));`
			`else`
			`this.subWikifyUnterm(output);`
			`};`

Added basic support for HTML rendering 2011-12-05 18:21:52 +00:00			`WikiTextParser.prototype.subWikifyUnterm = function(output) {`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`// subWikify can be indirectly recursive, so we need to save the old output pointer`
			`var oldOutput = this.output;`
			`this.output = output;`
			`// Get the first match`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`this.rulesRegExp.lastIndex = this.nextMatch;`
			`var ruleMatch = this.rulesRegExp.exec(this.source);`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`while(ruleMatch) {`
			`// Output any text before the match`
			`if(ruleMatch.index > this.nextMatch)`
			`this.outputText(this.output,this.nextMatch,ruleMatch.index);`
			`// Set the match parameters for the handler`
			`this.matchStart = ruleMatch.index;`
			`this.matchLength = ruleMatch[0].length;`
			`this.matchText = ruleMatch[0];`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`this.nextMatch = this.rulesRegExp.lastIndex;`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`// Figure out which rule matched and call its handler`
			`var t;`
			`for(t=1; t<ruleMatch.length; t++) {`
			`if(ruleMatch[t]) {`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`this.rules[t-1].handler(this);`
			`this.rulesRegExp.lastIndex = this.nextMatch;`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`break;`
			`}`
			`}`
			`// Get the next match`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`ruleMatch = this.rulesRegExp.exec(this.source);`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`}`
			`// Output any text after the last match`
			`if(this.nextMatch < this.source.length) {`
			`this.outputText(this.output,this.nextMatch,this.source.length);`
			`this.nextMatch = this.source.length;`
			`}`
			`// Restore the output pointer`
			`this.output = oldOutput;`
			`};`

Added basic support for HTML rendering 2011-12-05 18:21:52 +00:00			`WikiTextParser.prototype.subWikifyTerm = function(output,terminatorRegExp) {`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`// subWikify can be indirectly recursive, so we need to save the old output pointer`
			`var oldOutput = this.output;`
			`this.output = output;`
			`// Get the first matches for the rule and terminator RegExps`
			`terminatorRegExp.lastIndex = this.nextMatch;`
			`var terminatorMatch = terminatorRegExp.exec(this.source);`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`this.rulesRegExp.lastIndex = this.nextMatch;`
			`var ruleMatch = this.rulesRegExp.exec(terminatorMatch ? this.source.substr(0,terminatorMatch.index) : this.source);`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`while(terminatorMatch || ruleMatch) {`
			`// Check for a terminator match before the next rule match`
			`if(terminatorMatch && (!ruleMatch || terminatorMatch.index <= ruleMatch.index)) {`
			`// Output any text before the match`
			`if(terminatorMatch.index > this.nextMatch)`
			`this.outputText(this.output,this.nextMatch,terminatorMatch.index);`
			`// Set the match parameters`
			`this.matchText = terminatorMatch[1];`
			`this.matchLength = terminatorMatch[1].length;`
			`this.matchStart = terminatorMatch.index;`
			`this.nextMatch = this.matchStart + this.matchLength;`
			`// Restore the output pointer`
			`this.output = oldOutput;`
			`return;`
			`}`
			`// It must be a rule match; output any text before the match`
			`if(ruleMatch.index > this.nextMatch)`
			`this.outputText(this.output,this.nextMatch,ruleMatch.index);`
			`// Set the match parameters`
			`this.matchStart = ruleMatch.index;`
			`this.matchLength = ruleMatch[0].length;`
			`this.matchText = ruleMatch[0];`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`this.nextMatch = this.rulesRegExp.lastIndex;`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`// Figure out which rule matched and call its handler`
			`var t;`
			`for(t=1; t<ruleMatch.length; t++) {`
			`if(ruleMatch[t]) {`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`this.rules[t-1].handler(this);`
			`this.rulesRegExp.lastIndex = this.nextMatch;`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`break;`
			`}`
			`}`
			`// Get the next match`
			`terminatorRegExp.lastIndex = this.nextMatch;`
			`terminatorMatch = terminatorRegExp.exec(this.source);`
Refactoring the wikitext parser To match the structure of the JavaScript parser, and make it less complicated 2012-01-05 11:08:05 +00:00			`ruleMatch = this.rulesRegExp.exec(terminatorMatch ? this.source.substr(0,terminatorMatch.index) : this.source);`
Integrated the TiddlyWiki wikifier A large refactoring to tidy up the interface of the TiddlyWiki wikifier code, and package it as a wiki text parser. 2011-12-05 16:50:25 +00:00			`}`
			`// Output any text after the last match`
			`if(this.nextMatch < this.source.length) {`
			`this.outputText(this.output,this.nextMatch,this.source.length);`
			`this.nextMatch = this.source.length;`
			`}`
			`// Restore the output pointer`
			`this.output = oldOutput;`
			`};`

			`exports.WikiTextParser = WikiTextParser;`
Added a function wrapper around all source files to keep JSHint happy 2011-12-12 10:52:04 +00:00
			`})();`