TiddlyWiki5/js/FileRetriever.js

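/*
FileRetriever can asynchronously retrieve files from HTTP/HTTPS URLs or the local file system.
NOTE(review): this header used to state that the module incorporates throttling to avoid error
EMFILE "Too many open files", but no throttling is visible in this file -- confirm whether callers
are expected to limit the number of concurrent retrievals themselves.
*/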

/*jslint node: true */
"use strict";

var fs = require("fs"),
	path = require("path"),
	url = require("url"),
	util = require("util"),
	http = require("http"),
	https = require("https");

var FileRetriever = exports;

// Read a local file as UTF-8 text. The outcome is handed straight to the Node-style
// callback(err,text) by fs.readFile.
var fileRequest = function fileRequest(filepath,callback) {
	var encoding = "utf8";
	fs.readFile(filepath,encoding,callback);
};

// Retrieve the resource at an HTTP or HTTPS URL and pass its body, decoded as UTF-8 text, to
// callback(err,text).
//		fileurl: absolute URL; the "http:" protocol uses the http module, anything else uses https
//		callback: invoked at most once, as callback(err) on failure or callback(null,text) on success
// A response status other than 200 is reported as an Error("HTTP error") whose `code` property is
// the status code as a string.
var httpRequest = function(fileurl,callback) {
	var opts = url.parse(fileurl),
		httpLib = opts.protocol === "http:" ? http : https,
		finished = false,
		// Guard so that a late error (e.g. a socket reset after the body completed) can't trigger
		// a second invocation of the callback
		finish = function(err,text) {
			if(!finished) {
				finished = true;
				callback(err,text);
			}
		};
	// http.get() ends the request itself, so no explicit request.end() is needed
	var request = httpLib.get(opts,function(res) {
		if(res.statusCode !== 200) {
			var err = new Error("HTTP error");
			err.code = res.statusCode.toString();
			// Discard the unwanted body so that the underlying socket is released
			res.resume();
			finish(err);
		} else {
			var chunks = [];
			res.on("data", function(chunk) {
				chunks.push(chunk);
			});
			res.on("end", function() {
				// Decode once over the whole body: stringifying each chunk separately corrupts
				// multi-byte UTF-8 characters that straddle a chunk boundary
				finish(null,Buffer.concat(chunks).toString("utf8"));
			});
			res.on("error", finish);
		}
	});
	request.on("error", finish);
};

// Retrieve a file given a filepath specifier and a context path. If the filepath isn't an absolute
// filepath or an absolute URL, then it is interpreted relative to the context path, which can also be
// a filepath or a URL. If either of them starts with http:// or https:// the file is fetched over
// HTTP(S); otherwise it is read from the local file system, resolved against the directory of the
// context path. On completion, the callback function is called as callback(err,data). The
// data hashmap is as follows:
//		text: full text of file (only set when there was no error)
//		path: full path used to reach the file
//		basename: the basename of the file, without its extension
//		extname: the extension of the file, including the leading dot
FileRetriever.retrieveFile = function(filepath,contextPath,callback) {
	// Deliberately no "g" flag: a global regexp carries lastIndex over from one test() call to the
	// next, which made the second test fail whenever the first one had matched
	var httpRegExp = /^(https?:\/\/)/i,
		result = {},
		filepathIsHttp = httpRegExp.test(filepath),
		contextPathIsHttp = httpRegExp.test(contextPath),
		requester;
	if(contextPathIsHttp || filepathIsHttp) {
		// If we've got a full HTTP URI then we're good to go
		result.path = url.resolve(contextPath,filepath);
		var parsedPath = url.parse(result.path);
		result.extname = path.extname(parsedPath.pathname);
		// Derive the basename from the URL's pathname, mirroring the file system branch below
		result.basename = path.basename(parsedPath.pathname,result.extname);
		requester = httpRequest;
	} else {
		// It's a file requested in a file context
		result.path = path.resolve(path.dirname(contextPath),filepath);
		result.extname = path.extname(result.path);
		result.basename = path.basename(result.path,result.extname);
		requester = fileRequest;
	}
	requester(result.path,function(err,data) {
		if(!err) {
			result.text = data;
		}
		// The result is passed even on error so that the caller can see which path failed
		callback(err,result);
	});
};
Converted recipe handling to use async IO Part of the preparation for supporting reading recipes and ingredients over HTTP 2011-11-28 13:47:38 +00:00			`/*`
			`FileRetriever can asynchronously retrieve files from HTTP URLs or the local file system. It incorporates`
			`throttling so that we don't get error EMFILE "Too many open files".`
			`*/`

Lots of JSHint induced tweaks Still not spotless 2011-12-09 16:34:02 +00:00			`/jslint node: true /`
Minor refactoring, including switching to strict mode 2011-11-30 17:27:00 +00:00			`"use strict";`

Converted recipe handling to use async IO Part of the preparation for supporting reading recipes and ingredients over HTTP 2011-11-28 13:47:38 +00:00			`var fs = require("fs"),`
Further refactoring of the new async design 2011-11-28 15:15:35 +00:00			`path = require("path"),`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`url = require("url"),`
			`util = require("util"),`
			`http = require("http"),`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`https = require("https");`
Converted recipe handling to use async IO Part of the preparation for supporting reading recipes and ingredients over HTTP 2011-11-28 13:47:38 +00:00
			`var FileRetriever = exports;`

Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`var fileRequest = function fileRequest(filepath,callback) {`
			`fs.readFile(filepath,"utf8", callback);`
			`};`
Converted recipe handling to use async IO Part of the preparation for supporting reading recipes and ingredients over HTTP 2011-11-28 13:47:38 +00:00
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`var httpRequest = function(fileurl,callback) {`
			`var opts = url.parse(fileurl);`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`var httpLib = opts.protocol === "http:" ? http : https;`
			`var request = httpLib.get(opts,function(res) {`
			`if(res.statusCode != 200) {`
			`var err = new Error("HTTP error");`
			`err.code = res.statusCode.toString();`
			`callback(err);`
			`} else {`
			`var data = [];`
			`res.on("data", function(chunk) {`
Preparing to add support for JSON files loaded from TiddlySpace/TiddlyWeb 2011-11-30 16:06:34 +00:00			`data.push(chunk);`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`});`
			`res.on("end", function() {`
			`callback(null,data.join(""));`
			`});`
			`}`
			`});`
			`request.addListener("error", function(err) {`
Refactorings to keep JSHint happy 2011-12-01 10:19:21 +00:00			`callback(err);`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`});`
			`request.end();`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`};`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00
Converted recipe handling to use async IO Part of the preparation for supporting reading recipes and ingredients over HTTP 2011-11-28 13:47:38 +00:00			`// Retrieve a file given a filepath specifier and a context path. If the filepath isn't an absolute`
			`// filepath or an absolute URL, then it is interpreted relative to the context path, which can also be`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`// a filepath or a URL. On completion, the callback function is called as callback(err,data). The`
			`// data hashmap is as follows:`
			`// text: full text of file`
Refactored return value of retrieveFile() 2011-11-30 11:41:26 +00:00			`// path: full path used to reach the file`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`// basename: the basename of the file`
Refactored return value of retrieveFile() 2011-11-30 11:41:26 +00:00			`// extname: the extension of the file`
Converted recipe handling to use async IO Part of the preparation for supporting reading recipes and ingredients over HTTP 2011-11-28 13:47:38 +00:00			`FileRetriever.retrieveFile = function(filepath,contextPath,callback) {`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`var httpRegExp = /^(https?:\/\/)/gi,`
Refactored return value of retrieveFile() 2011-11-30 11:41:26 +00:00			`result = {},`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`filepathIsHttp = httpRegExp.test(filepath),`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`contextPathIsHttp = httpRegExp.test(contextPath),`
			`requester;`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`if(contextPathIsHttp \|\| filepathIsHttp) {`
			`// If we've got a full HTTP URI then we're good to go`
Refactored return value of retrieveFile() 2011-11-30 11:41:26 +00:00			`result.path = url.resolve(contextPath,filepath);`
			`var parsedPath = url.parse(result.path);`
			`result.extname = path.extname(parsedPath.pathname);`
			`result.basename = path.basename(parsedPath.extname);`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`requester = httpRequest;`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`} else {`
			`// It's a file requested in a file context`
Refactored return value of retrieveFile() 2011-11-30 11:41:26 +00:00			`result.path = path.resolve(path.dirname(contextPath),filepath);`
			`result.extname = path.extname(result.path);`
			`result.basename = path.basename(result.path,result.extname);`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`requester = fileRequest;`
Added support for retrieving ingredients over HTTP This makes it possible to directly reference recipes and tiddlers stored on GitHub, for example. 2011-11-29 18:27:03 +00:00			`}`
Major refactoring of async code The result is correct handling of tiddlers being overwritten within recipes. 2011-12-02 14:40:18 +00:00			`requester(result.path,function(err,data) {`
			`if(!err) {`
			`result.text = data;`
			`}`
			`callback(err,result);`
			`});`
Preparing to add support for JSON files loaded from TiddlySpace/TiddlyWeb 2011-11-30 16:06:34 +00:00			`};`