--- markup/html/scripting-parser/parser.html 2008/04/20 12:19:13 1.4
+++ markup/html/scripting-parser/parser.html 2008/04/27 10:34:18 1.10
@@ -1,14 +1,19 @@
-Demo of HTML5 Parsing Algorithm with Scripting Enabled
+Live Scripting HTML Parser
]+)>/, function (s, e) {
- if (p.insertionPoint < s.length) {
+ i.s = i.s.replace (/^<\/([^>]+)(?:>|$)/, function (s, e) {
+ // Abort when the insertion point lies inside the matched tag, or sits
+ // exactly at its end while the tag is still unterminated (its last
+ // character is not ">"), since more input may be inserted there.
+ // charAt is used because substring (start, end) swaps its arguments
+ // when start > end and would not return the last character.
+ if (p.insertionPoint < s.length ||
+ (p.insertionPoint <= s.length &&
+ s.charAt (s.length - 1) != '>')) {
token = {type: 'abort'};
return s;
}
@@ -98,8 +143,10 @@
return '';
});
if (token) return token;
- i.s = i.s.replace (/^<([^>]+)>/, function (s, e) {
- if (p.insertionPoint < s.length) {
+ i.s = i.s.replace (/^<([^>]+)(?:>|$)/, function (s, e) {
+ // Abort when the insertion point lies inside the matched tag, or sits
+ // exactly at its end while the tag is still unterminated (its last
+ // character is not ">"), since more input may be inserted there.
+ // charAt is used because substring (start, end) swaps its arguments
+ // when start > end and would not return the last character.
+ if (p.insertionPoint < s.length ||
+ (p.insertionPoint <= s.length &&
+ s.charAt (s.length - 1) != '>')) {
token = {type: 'abort'};
return s;
}
@@ -109,11 +156,22 @@
tagName = v.toLowerCase ();
return '';
});
- e = e.replace (/^\s*(\S+)\s*(?:=\s*"([^"]*)"|'([^']*)'|([^"']+))?/,
- function (x, attrName, attrValue1, attrValue2, attrValue3) {
- attrs[attrName] = attrValue1 || attrValue2 || attrValue3;
- return '';
- });
+ // Consume attributes one at a time from the front of |e| until the
+ // attribute pattern no longer matches; |m| records whether the last
+ // pass consumed anything.
+ while (true) {
+   var m = false;
+   e = e.replace (/^\s*([^\s=]+)\s*(?:=\s*(?:"([^"]*)"|'([^']*)'|([^"'\s]*)))?/,
+   function (x, attrName, attrValue1, attrValue2, attrValue3) {
+     // A valueless or empty-valued attribute leaves every capture
+     // empty or undefined; fall back to '' so that replace () below
+     // is never called on undefined.
+     v = attrValue1 || attrValue2 || attrValue3 || '';
+     // Decode the supported character references.  &amp; is decoded
+     // last so that "&amp;quot;" yields "&quot;" rather than '"'.
+     v = v.replace (/&quot;/g, '"').replace (/&apos;/g, "'")
+         .replace (/&amp;/g, '&');
+     attrs[attrName.toLowerCase ()] = v;
+     m = true;
+     return '';
+   });
+   if (!m) break;
+ }
+ if (e.length) {
+ log ('Broken start tag: "' + e + '"');
+ }
token = {type: 'start-tag', value: tagName, attrs: attrs};
p.insertionPoint -= s.length;
return '';
@@ -144,7 +202,8 @@
} // getNextToken
Parser.prototype.parse = function () {
- log ('start parsing');
+ logIndentLevel++;
+ log ('parse: start');
while (true) {
var token = this.getNextToken ();
@@ -212,11 +271,40 @@
this.openElements[this.openElements.length - 1].appendChild (el);
// 11. Let the insertion point have the value of the old ...
+
+ oldInsertionPoint += this.insertionPoint;
this.setInsertionPoint (oldInsertionPoint);
// 12. If there is a script that will execute as soon as ...
-
+ while (this.scriptExecutedWhenParserResumes) {
+ // 12.1. If the tree construction stage is being called reentrantly
+ if (this.reentrant) {
+ log ('parse: abort (reentrance)');
+ logIndentLevel--;
+ return;
+
+ // 12.2. Otherwise
+ } else {
+ // 1.
+ var script = this.scriptExecutedWhenParserResumes;
+ this.scriptExecutedWhenParserResumes = null;
+
+ // 2. Pause until the script has completed loading.
+ //
+
+ // 3. Let the insertion point to just before the next input char.
+ this.setInsertionPoint (0);
+
+ // 4. Execute the script.
+ executeScript (this.doc, script);
+
+ // 5. Let the insertion point be undefined again.
+ this.setInsertionPoint (undefined);
+ // 6. If there is once again a script that will execute ...
+ //
+ }
+ }
} else {
var el = new JSElement (this.doc, token.value);
this.openElements[this.openElements.length - 1].appendChild (el);
@@ -236,6 +324,7 @@
break;
} else if (token.type == 'abort') {
log ('parse: abort');
+ logIndentLevel--;
return;
}
}
@@ -246,8 +335,21 @@
// "When a script completes loading" rules start applying.
- // TODO: Handles "list of scripts that will execute as soon as possible"
- // and "list of scripts that will execute asynchronously"
+ // List of scripts that will execute as soon as possible
+ for (var i = 0; i < this.scriptsExecutedSoon.length; i++) {
+ var e = this.scriptsExecutedSoon[i];
+
+ // If it has completed loading
+ log ('Execute an external script not inserted by parser...');
+ executeScript (this.doc, e);
+
+ // NOTE: It MAY be executed before the end of the parsing, according
+ // to the spec.
+ this.hasAsyncScript = true;
+ }
+
+ // TODO: Handles
+ // "list of scripts that will execute asynchronously"
// Handle "list of scripts that will execute when the document has finished
// parsing".
@@ -270,18 +372,20 @@
// "delays tha load event" things has completed:
// readyState = 'complete'
log ('load event fired');
+
+ logIndentLevel--;
} // parse
Parser.prototype.setInsertionPoint = function (ip) {
if (ip == undefined || ip == null || isNaN (ip)) {
log ('insertion point: set to undefined');
this.insertionPoint = undefined;
- } else if (ip == this.in.s.length) {
+ } else if (ip == this.input.s.length) { // ip equals the length of the input text: logged as "end of file"
log ('insertion point: end of file');
this.insertionPoint = ip;
} else {
log ('insertion point: set to ' + ip +
- ' (before "' + this.in.s.substring (0, 10) + '")');
+ ' (before "' + this.input.s.substring (0, 10) + '")'); // NOTE(review): previews the first 10 characters of the input, not the text starting at ip -- confirm this is intended
this.insertionPoint = ip;
}
}; // setInsertionPoint
@@ -303,6 +407,7 @@
e.parentNode = this;
if (e.localName == 'script') {
+ logIndentLevel++;
log ('Running a script: start');
var doc = this.ownerDocument || this;
@@ -321,6 +426,7 @@
if (e.manakaiAlreadyExecuted) {
// 2.5. Abort these steps at this point.
log ('Running a script: aborted');
+ logIndentLevel--;
return e;
}
@@ -343,14 +449,20 @@
/* && list of scripts that will execute asynchronously is not empty */) {
// TODO
} else if (e.src != null && e.manakaiParserInserted) {
- // TODO
+ if (p.scriptExecutedWhenParserResumes) {
+ log ('Error: There is a script that will execute as soon as the parser resumes.');
+ }
+ p.scriptExecutedWhenParserResumes = e;
+ log ('Running a script: aborted (src parser-inserted)');
} else if (e.src != null) {
- // TODO
+ p.scriptsExecutedSoon.push (e);
+ log ('Running a script: aborted (src)');
} else {
executeScript (doc, e); // even if other scripts are already executing.
}
log ('Running a script: end');
+ logIndentLevel--;
}
return e;
@@ -359,7 +471,20 @@
function executeScript (doc, e) {
log ('executing a script block: start');
- // If the load resulted in an error, then ... firing an error event ...
+ var s;
+ if (e.src != null) {
+ s = getExternalScript (e.src);
+
+ // If the load resulted in an error, then ... firing an error event ...
+ if (s == null) {
+ log ('error event fired at the script element');
+ return;
+ }
+
+ log ('External script loaded: "' + s + '"');
+ } else {
+ s = e.text;
+ }
// If the load was successful
log ('load event fired at the script element');
@@ -368,19 +493,37 @@
// Scripting is enabled, Document.designMode is disabled,
// Document is the active document in its browsing context
- var s;
- if (e.src != null) {
- // TODO: from external file
- } else {
- s = e.text;
- }
-
parseAndRunScript (doc, s);
}
log ('executing a script block: end');
} // executeScript
+ // Returns the text of the "external" script identified by |uri|, or
+ // null when it cannot be obtained (the caller treats null as a failed
+ // load).  Only URIs of the form javascript:'...' or javascript:"..."
+ // are supported; \uXXXX escapes inside the literal are decoded.  Any
+ // other URI is logged and yields null.
+ function getExternalScript (uri) {
+   if (!uri.match (/^javascript:/i)) {
+     log ('URI scheme not supported: <' + uri + '>');
+     return null;
+   }
+
+   var m = uri.match (/^javascript:\s*(?:'([^']*)'|"([^"]+)")\s*$/i);
+   if (!m) {
+     log ('Complex javascript: URI is not supported: <' + uri + '>');
+     return null;
+   }
+
+   // Take whichever quoting style matched.  An empty literal is still
+   // reported as a failed load.
+   var body = m[1] || m[2];
+   if (!body) return null;
+
+   // Decode \uXXXX escapes; hexadecimal digits may be in either case.
+   return body.replace (/\\u([0-9A-Fa-f]{4})/g, function (s, v) {
+     return String.fromCharCode (parseInt (v, 16));
+   });
+ } // getExternalScript
+
function parseAndRunScript (doc, s) {
while (true) {
var matched = false;
@@ -394,6 +537,13 @@
doc.write.apply (doc, args);
return '';
});
+ s = s.replace (/^\s*var\s+s\s*=\s*document\.createElement\s*\(\s*['"]script['"]\s*\)\s*;\s*s\.src\s*=\s*(?:'(javascript:[^']*)'|"(javascript:[^"]*)")\s*;\s*document\.documentElement\.appendChild\s*\(\s*s\s*\)\s*;\s*/,
+ function (s, t, u) {
+ matched = true;
+ var args = [t ? t : u];
+ doc._insertExternalScript.apply (doc, args);
+ return '';
+ });
if (s == '') break;
if (!matched) {
log ('Script parse error: "' + s + '"');
@@ -429,7 +579,7 @@
// Step 3.
if (this._parser &&
!this._parser.scriptCreated &&
- this._parser.in.insertionPoint != undefined) {
+ this._parser.input.insertionPoint != undefined) {
log ('document.open () in parsing mode is ignored');
return this;
}
@@ -463,13 +613,15 @@
}
// Step 11.
- this._parser.setInsertionPoint (this._parser.in.s.length);
+ this._parser.setInsertionPoint (this._parser.input.s.length);
// Step 12.
return this;
}; // document.open
JSDocument.prototype.write = function () {
+ logIndentLevel++;
+
var p = this._parser;
// 1. If the insertion point is undefined, the open() method must be ...
@@ -481,22 +633,51 @@
// 2. ... inserted into the input stream just before the insertion point.
var s = Array.join (arguments, '');
log ('document.write: insert "' + s + '"' +
- ' before "' + p.in.s.substring (p.insertionPoint, p.insertionPoint + 10) + '"');
- p.in.s = p.in.s.substring (0, p.insertionPoint) + s
- + p.in.s.substring (p.insertionPoint, p.in.s.length);
+ ' before "' +
+ p.input.s.substring (p.insertionPoint, p.insertionPoint + 10) + '"');
+ p.input.s = p.input.s.substring (0, p.insertionPoint) + s
+ + p.input.s.substring (p.insertionPoint, p.input.s.length);
p.insertionPoint += s.length;
// 3. If there is a script that will execute as soon as the parser resumes
- // TODO
+ if (p.scriptExecutedAfterParserResumes) {
+ log ('document.write: processed later (there is an unprocessed