Index: lib/child/frameScript.js |
=================================================================== |
new file mode 100644 |
--- /dev/null |
+++ b/lib/child/frameScript.js |
@@ -0,0 +1,129 @@ |
+/* |
+ * This Source Code is subject to the terms of the Mozilla Public License |
+ * version 2.0 (the "License"). You can obtain a copy of the License at |
+ * http://mozilla.org/MPL/2.0/. |
+ */ |
+ |
+"use strict"; |
+ |
+const {classes: Cc, interfaces: Ci, utils: Cu, results: Cr} = Components; |
+ |
+/** |
+ * @param e exception |
+ */ |
+function reportException(e) |
+{ |
+ let stack = ""; |
+ if (e && typeof e == "object" && "stack" in e) |
+ stack = e.stack + "\n"; |
+ |
+ Cu.reportError(e); |
+ dump(e + "\n" + stack + "\n"); |
+} |
+ |
+const {XPCOMUtils} = Cu.import("resource://gre/modules/XPCOMUtils.jsm", {}); |
+ |
+/** |
+ * Progress listener capturing the data of the current page and calling |
+ * onPageLoaded(data) when loading is finished, where data contains |
+ * HTTP status and headers. |
+ * |
+ * @type nsIWebProgressListener |
+ */ |
+let webProgressListener = |
+{ |
+ onStateChange: function(webProgress, request, flags, status) |
+ { |
+ if (webProgress.DOMWindow == content && |
+ (flags & Ci.nsIWebProgressListener.STATE_STOP)) |
+ { |
+ // First time we receive STATE_STOP for about:blank and the second time |
+ // for our interested URL which is distinct from about:blank. |
+ // However we should not process about:blank because it can happen that |
+ // the message with information about about:blank is delivered when the |
+ // code in crawler.js is already waiting for a message from this tab. |
+ // Another case we are not interested in is about:newtab. |
+ if (content.location.protocol == "about:") |
+ return; |
+ let pageInfo = {channelStatus: status}; |
+ if (request instanceof Ci.nsIHttpChannel) |
+ { |
+ try |
+ { |
+ pageInfo.headers = []; |
+ pageInfo.headers.push("HTTP/x.x " + request.responseStatus + " " + request.responseStatusText); |
+ request.visitResponseHeaders((header, value) => pageInfo.headers.push(header + ": " + value)); |
+ } |
+ catch (e) |
+ { |
+ reportException(e); |
+ } |
+ } |
+ onPageLoaded(pageInfo); |
+ } |
+ }, |
+ |
+ onLocationChange: function() {}, |
+ onProgressChange: function() {}, |
+ onStatusChange: function() {}, |
+ onSecurityChange: function() {}, |
+ |
+ QueryInterface: XPCOMUtils.generateQI([Ci.nsIWebProgressListener, Ci.nsISupportsWeakReference]) |
+}; |
+ |
+function onPageLoaded(pageInfo) |
+{ |
+ Object.assign(pageInfo, gatherPageInfo(content)); |
+ sendAsyncMessage("abpcrawler:pageInfoGathered", pageInfo); |
+}; |
+ |
+let webProgress = docShell.QueryInterface(Ci.nsIInterfaceRequestor).getInterface(Ci.nsIWebProgress); |
+webProgress.addProgressListener(webProgressListener, Ci.nsIWebProgress.NOTIFY_STATE_WINDOW); |
+ |
+/** |
+ * Gathers information about a DOM window. |
+ * Currently |
+ * - creates a screenshot of the page |
+ * - serializes the page source code |
+ * @param {nsIDOMWindow} wnd window to process |
+ * @return {Object} the object containing "screenshot" and "source" properties. |
+ */ |
+function gatherPageInfo(wnd) |
+{ |
+ let document = wnd.document; |
+ let result = {errors:[]}; |
+ if (!document.documentElement) |
+ { |
+ result.errors.push("No document.documentElement"); |
+ return result; |
+ } |
+ |
+ try |
+ { |
+ let canvas = document.createElementNS("http://www.w3.org/1999/xhtml", "canvas"); |
+ canvas.width = document.documentElement.scrollWidth; |
+ canvas.height = document.documentElement.scrollHeight; |
+ let context = canvas.getContext("2d"); |
+ context.drawWindow(wnd, 0, 0, canvas.width, canvas.height, "rgb(255, 255, 255)"); |
+ result.screenshot = canvas.toDataURL("image/jpeg", 0.8); |
+ } |
+ catch (e) |
+ { |
+ reportException(e); |
+ result.errors.push("Cannot make page screenshot"); |
+ } |
+ |
+ try |
+ { |
+ // TODO: Capture frames as well? |
+ let serializer = new wnd.XMLSerializer(); |
+ result.source = serializer.serializeToString(document.documentElement); |
+ } |
+ catch(e) |
+ { |
+ reportException(e); |
+ result.errors.push("Cannot obtain page source code"); |
+ } |
+ |
+ return result; |
+} |