2 GLib = imports.gi.GLib;
3 WebKit = imports.gi.WebKit;
4 Soup = imports.gi.Soup;
6 TabbedBrowser = imports.TabbedBrowser;
7 BrowserSettings = imports.BrowserSettings;
8 BrowserTab = imports.BrowserTab;
10 File = imports.File.File;
12 base64 = imports.base64.base64;
// Registers BrowserView as a new GType whose parent type is WebKit.WebView.
// NOTE(review): this excerpt omits lines (see the gaps in the embedded line
// numbers), so the remaining GType fields and the opening of the init code
// are not visible here.
14 BrowserView = new GType({
15 parent: WebKit.WebView.type,
// Route WebKit's default session through a hard-coded proxy URI.
// NOTE(review): port 3128 is presumably a local caching proxy — confirm, and
// consider making it configurable.
21 var sess = WebKit.get_default_session();
22 sess.proxy_uri = new Soup.URI.c_new('http://localhost:3128');
// Not read by any line visible in this excerpt.
26 var browsePage = false;
// update_title(web_view, web_frame, title): logs the call, shortens the title
// and stores it on the tab label.
// The title_changed connection for this handler is commented out further down.
32 var update_title = function (web_view, web_frame, title)
35 print("calling update title");
// Keep the first 25 characters and append "...".
// NOTE(review): the condition guarding this truncation (if any) is on a line
// missing from this excerpt.
37 title = title.slice(0,25) + "...";
// `tab` is not declared in the visible lines; presumably an enclosing-scope
// variable managed by set_tab/get_tab — confirm.
39 tab.get_tab_label().label = title;
// traversedom(doc, fn, sub): serialises a DOM document to an HTML file.
//   doc - document whose head and body are walked
//   fn  - output filename (read back below as cb.fn)
//   sub - optional suffix inserted before ".html" (used for iframe content)
// NOTE(review): the lines that initialise `ret`, assign cb.fn / cb.sub and
// form the body of cb are missing from this excerpt; presumably cb appends
// each fragment to `ret` — confirm.
46 var traversedom = function(doc, fn, sub ) {
47 print("TRAVERSE DOM?");
// Callback handed to traverseDOMTree; it receives each emitted text fragment.
52 var cb = function(s) {
62 //Roo.select('body > div',true).each(function(el) {
// Head first, then body, both starting at depth 1.
63 traverseDOMTree(cb, doc.head, 1);
64 traverseDOMTree(cb, doc.body, 1);
// Output name: cb.fn without a trailing ".html", plus "." + sub when sub is
// truthy, plus ".html". The accumulated markup is closed with "</HTML>".
66 File.write(cb.fn.replace(/\.html$/, '')+ (sub ? ('.' + sub ) : '') + '.html' , ret +'</HTML>');
// traverseDOMTree(cb, currentElement, depth): recursively walks a DOM node and
// emits its markup through cb as strings: text node values, an opening tag
// with attributes, the children, then a closing tag.
//   cb             - sink for emitted fragments; cb.fn / cb.sub are also read
//                    here to build iframe file names
//   currentElement - node to serialise
//   depth          - recursion depth (incremented for each child level)
// NOTE(review): several lines (returns, closing braces, the declaration of
// `attr`) are missing from this excerpt.
72 var traverseDOMTree = function(cb, currentElement, depth) {
75 //if (currentElement.class_name.match(/roo-dynamic/)) {
78 //print(currentElement.node_name);
80 var nodeName = currentElement.node_name;
81 var tagName = currentElement.tag_name;
// Text nodes are emitted verbatim.
83 if (nodeName == '#text') {
84 cb(currentElement.node_value);
// SCRIPT elements get special handling; the body of this branch is not
// visible here (presumably they are skipped — confirm).
93 if (nodeName == 'SCRIPT') {
97 //if (nodeName == 'STYLE') { return; }
99 // Prints the node tagName, such as <A>, <IMG>, etc
100 var outNodeName = nodeName;
101 if (nodeName == 'IFRAME') {
102 //outNodeName = 'DIV';
// Collect the element's attributes as name="value" strings.
// NOTE(review): `i` has no `var` on this line; unless it is declared on a
// line missing from this excerpt it is an implicit global shared with the
// recursive calls below. Attribute values are also not escaped, so a value
// containing '"' produces broken markup.
111 for(i = 0; i < currentElement.attributes.length;i++) {
112 var aname = currentElement.attributes.item(i).name;
113 //if (aname =='class' || aname == 'style') {
// The original src of an IFRAME is singled out here (branch body not visible);
// a replacement src is pushed after the loop.
116 if (aname =='src' && tagName == 'IFRAME') {
120 attr.push(aname + '="' + currentElement.attributes.item(i).value + '"' );
// Point the iframe at the sibling file "<basename>.<sub>.html", matching the
// naming pattern traversedom uses when it writes a document with `sub` set.
122 if (tagName == 'IFRAME') {
123 attr.push('src="' + File.basename(cb.fn).replace(/\.html$/, '')+ '.' + cb.sub + '.html"' );
126 //if (nodeName == 'IFRAME') {
127 // attr.push('src="' + currentElement.attributes.item(i).value + embeded_file '"' );
130 //var style = elClassToStyle(currentElement);
131 //if (style.length) {
132 // attr.push('style="' + style + '"' );
136 //if (depth > 1000 && (tagName == 'BODY' || tagName == 'HEAD' )) {
137 // cb("<DIV"+ ( attr.length ? (' ' + attr.join(' ') ) : '') + ">");
// Emit the opening tag, with a leading space before the attributes only when
// there are any.
139 cb("<"+outNodeName + ( attr.length ? (' ' + attr.join(' ') ) : '') + ">");
// Iframe content is serialised into its own file via traversedom, passing
// cb.fn and cb.sub through as the filename and suffix.
147 if (nodeName == 'IFRAME') {
150 traversedom(currentElement.content_document, cb.fn, cb.sub )
// Walk the children by index.
// NOTE(review): the lines that reset and increment `i` around this loop are
// not visible in this excerpt.
159 var currentElementChild = currentElement.child_nodes.item(i);
161 while (currentElementChild) {
162 // Formatting code (indent the tree so it looks nice on the screen)
// Text children are emitted directly instead of recursing.
164 if (currentElementChild.node_name == '#text') {
165 // if (currentElementChild.node_value.length) {
166 cb(currentElementChild.node_value);
170 currentElementChild=currentElement.child_nodes.item(i);
175 //for (j = 0; j < depth; j++) {
176 // ¦ is just a vertical line
181 // Recursively traverse the tree structure of the child node
182 traverseDOMTree(cb, currentElementChild, depth+1);
184 currentElementChild=currentElement.child_nodes.item(i);
187 // The remaining code is mostly for formatting the tree
189 //for (j = 0; j < depth - 1; j++) {
194 // if (depth > 1000 && (tagName == 'BODY' || tagName == 'HEAD' )) {
// Emit the closing tag for this element.
197 cb("</"+outNodeName+">");
// update_url(web_view, web_frame): syncs the tab's toolbar with the view:
// the frame's current URI plus the back/forward availability.
// `tab` is not declared in the visible lines (enclosing-scope variable).
205 var update_url = function (web_view, web_frame)
207 var toolbar = tab.get_toolbar();
209 toolbar.set_url(web_frame.get_uri());
210 toolbar.set_can_go_back(web_view.can_go_back());
211 toolbar.set_can_go_forward(web_view.can_go_forward());
// create_new_tab(web_view, web_frame, new_web_view): connected to the
// create_web_view signal. Creates a fresh BrowserView and defers showing it
// until that view fires web_view_ready.
// The incoming new_web_view argument is overwritten on the first line.
// NOTE(review): the return statement (if any) is not visible in this excerpt.
221 var create_new_tab = function (web_view, web_frame, new_web_view)
223 new_web_view = new BrowserView();
224 new_web_view.signal.web_view_ready.connect(show_new_tab);
// show_new_tab(new_web_view): web_view_ready handler; opens a tab for the
// given view with an empty string as the first new_tab argument.
228 var show_new_tab = function (new_web_view)
230 TabbedBrowser.browser.new_tab("", new_web_view);
// hover_link(web_view, link, url): shows the hovered URL in the tab's status
// bar. Its hovering_over_link connection is commented out further down.
235 var hover_link = function (web_view, link, url)
237 tab.get_statusbar().set_status(url);
// add_inject(force): runs the contents of "<script path>/inject.js" in the
// current tab's web view, keeping a per-URI counter in `injected`.
//   force - when truthy, the counter for this.uri is reset to 0 first
// NOTE(review): `injected` is declared outside the visible lines, and the body
// of the "> 2" branch is missing — presumably it returns early to cap the
// number of injections per URI; confirm.
242 this.add_inject = function(force)
// First visit to this URI (or a forced call): start counting from zero.
245 if (force || (typeof(injected[this.uri]) == 'undefined' )) {
246 injected[this.uri] = 0;
248 if (injected[this.uri] > 2) {
251 injected[this.uri]++;
252 var fn = __script_path__ + "/inject.js";
// Only inject when the script file is actually present.
253 if (File.exists(fn)) {
254 // print("Adding inject");
// Reads the same path that `fn` already holds.
255 var newjs = File.read(__script_path__ + "/inject.js");
256 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
// Shared state for the load/print handlers below.
// after_login is compared against true/false and also passed to browse() as a
// URL in load_finished, so it holds either a boolean or a URL string.
264 var after_login = false;
// Set to true by load_finished once it passes its re-entry check.
267 var load_finished_called = false;
// Not read by any line visible in this excerpt.
269 var done_print = false;
// do_print(web_frame): prepares the page and schedules its export.
// Visible behaviour: inject helper scripts into the current tab's web view
// (print-CSS removal, an optional per-domain script, a scroll for motorme.my),
// then run the nested realprint via GLib.timeout_add after BrowserSettings.delay.
// NOTE(review): many lines of this function are missing from the excerpt
// (braces, returns, try/catch). `_this`, `_t` and `current_url` are defined
// outside the visible lines.
272 var do_print = function(web_frame) {
// realprint(): timer callback that performs the HTML dump and/or print export.
276 var realprint = function() {
// While _this.queue_print is positive the print is not performed (logged only).
278 if (_this.queue_print > 0) {
279 print("ignore print - queue is " + _this.queue_print);
// Site-specific script for theindependent.sg, run before the export steps.
285 if (current_url.match(/theindependent\.sg\//) ) {
286 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
287 File.read( __script_path__ + "/domains/theindependent.sg.js")
// Optional HTML export: traversedom writes the file itself.
// NOTE(review): no return statement of traversedom is visible, so `html` may
// be undefined; it is only referenced by the commented-out line below.
293 if (web_frame && BrowserSettings.export_filename_html ) {
294 var html = traversedom(web_frame.get_dom_document(), BrowserSettings.export_filename_html);
295 //File.write(BrowserSettings.export_filename_html, html);
// Without export_filename there is no print export; when the HTML filename is
// unset as well, that is logged.
299 if (!BrowserSettings.export_filename) {
300 if (!BrowserSettings.export_filename_html) {
301 print("no export filename / and html filename");
307 var mf = _t.get_main_frame();
// Build a page setup that uses the 'iso_a2' paper size when Gtk lists one.
309 print("Creating paper");
310 var ar = Gtk.PaperSize.get_paper_sizes();
311 var psetup = new Gtk.PageSetup();
312 for(var i = 0; i < ar.length; i++) {
313 if (ar[i].get_name() =='iso_a2') {
314 psetup.set_paper_size(ar[i]);
// Export the main frame through a print operation targeting export_filename.
317 print("doing print operation");
318 var p = new Gtk.PrintOperation({ export_filename : BrowserSettings.export_filename });
319 print("doing print operation - set page");
321 p.set_default_page_setup(psetup);
323 print("doing print operation - print_full");
324 mf.print_full(p, Gtk.PrintOperationAction.EXPORT);
325 print("made image - exiting");
// Error path: logs the caught value `e`.
// NOTE(review): the try/catch lines themselves are not visible here.
330 print("error occured");
331 print(JSON.stringify(e));
// `* 1` coerces BrowserSettings.delay to a number for the timeout interval.
339 GLib.timeout_add(GLib.PRIORITY_DEFAULT, BrowserSettings.delay *1, realprint);
340 print("do_print called -- while already doing this...");
344 print("do_print called");
// Always run the print-CSS removal script first.
347 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
348 File.read( __script_path__ + "/domains/remove_print_css.js")
// Derive a domain key: split the URL on '/', take element 2 (the host for
// "scheme://host/..." URLs) and keep its last two dot-separated labels,
// e.g. "http://www.example.com/x" -> "example.com".
// NOTE(review): hosts under two-level suffixes ("example.co.uk") yield "co.uk".
351 var url_p = current_url.split('/');
353 var dom_p = url_p[2].split('.');
354 var chk = dom_p.pop();
355 chk = dom_p.pop() + '.' + chk;
// Run "<script path>/domains/<chk>.js" when such a file exists.
359 print("CHECK: " + chk +"\n");
360 if (File.exists( __script_path__ + "/domains/" + chk + '.js')) {
361 print("INCLUDING: " + __script_path__ + "/domains/"+ chk + ".js\n");
362 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
363 File.read( __script_path__ + "/domains/"+ chk + ".js")
368 // motorme - requires a scroll to make content appear..
369 if (current_url.match(/\.motorme\.my\//) ) {
370 TabbedBrowser.browser.current_tab().get_web_view().execute_script("window.scrollTo(0,500);");
// A string argument to match() is compiled as a RegExp, so the '.' here
// matches any character. The body of this branch is not visible.
374 if (current_url.match('/forbes.com')) {
379 print("Delay:" + BrowserSettings.delay);
// Schedule the actual export after the configured delay.
383 GLib.timeout_add(GLib.PRIORITY_DEFAULT, BrowserSettings.delay *1, realprint);
// Weibo-related flags; neither is referenced by any other line visible in
// this excerpt.
387 var weibo_added = false;
389 var is_weibo = false;
// load_finished(webkit, web_frame, wb): handler connected to this view's
// load_finished signal (see the connect call near the end of the init code).
// Visible behaviour:
//   1. Weibo login round-trip driven by after_login: inject weibo.js, call
//      run_weibo() with the configured credentials, and later browse to the
//      URL held in after_login.
//   2. A re-entry check using load_finished_called.
//   3. A delayed print export of the main frame to BrowserSettings.export_filename.
// NOTE(review): the braces, returns and several conditions tying these steps
// together are missing from this excerpt, so the exact control flow cannot be
// read from here. `_t` is defined outside the visible lines.
392 var load_finished = function (webkit, web_frame, wb)
403 print("load finished");
// after_login is either a boolean or a URL string (it is passed to browse()).
406 if (after_login === true) {
412 if (after_login === false) {
415 print("adding timeout?");
// Deferred redirect, 2000 ms later at low priority.
417 GLib.timeout_add(GLib.PRIORITY_LOW, 2000, function() {
418 print("Redirecting after login?" + after_login);
420 _t.browse(after_login);
// Load the weibo helper script into the current tab, then invoke run_weibo.
427 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
428 File.read( __script_path__ + "/weibo.js")
// NOTE(review): this writes the configured username and password to stdout.
430 print("run_weibo(" + JSON.stringify( BrowserSettings.username ) + ", " + JSON.stringify(BrowserSettings.passwd) + ");");
// JSON.stringify quotes and escapes the credentials for the generated call.
432 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
433 "run_weibo(" + JSON.stringify( BrowserSettings.username ) + ", " + JSON.stringify(BrowserSettings.passwd) + ");"
439 if (after_login !== false) {
442 // wait a bit then load the real page..
443 GLib.timeout_add(GLib.PRIORITY_LOW, 500, function() {
444 print("Redirecting after login?");
445 _t.browse(after_login);
// Re-entry check; the branch body is not visible (presumably an early
// return — confirm).
451 if (load_finished_called) {
455 load_finished_called = true;
459 // if(document.location.host=='weibo.com') {
460 // // clear login dialog from weibo.
461 // //check and hidden the login dialog and overlay .....
462 // var els = document.querySelectorAll('div[node-type]');
464 // for (i = 0; i < els.length; i++) {
465 // if (els[i].hasAttribute('node-type')) {
466 // if(els[i].getAttribute('node-type') == 'outer'){
471 // for (i = 0; i < bbc.length; i++) {// hide all the outer.....
472 // bbc[i].style.display = 'none';
476 // if(document.location.pathname == '/login.php'){
478 // // fills in the user name and password
479 // var els = document.querySelectorAll('input[node-type]');
481 // for (i = 0; i < els.length; i++) {
482 // if (els[i].hasAttribute('node-type')) {
483 // if(els[i].getAttribute('node-type') == 'username'){
484 // els[i].value = BrowserSettings.username;
486 // if(els[i].getAttribute('node-type') == 'password'){
487 // els[i].value = BrowserSettings.passwd;
493 // // simulating click event to login ....
494 // var elss = document.querySelectorAll('a[node-type]');
496 // for (i = 0; i < elss.length; i++) {
497 // if (elss[i].hasAttribute('node-type')) {
498 // if(elss[i].getAttribute('node-type') == 'submitBtn'){
510 // clear login dialog from weibo.
511 // TabbedBrowser.browser.current_tab().get_web_view().execute_script(
512 // " if (document.location.host=='weibo.com') { " +
514 // " var a = document.getElementsByClassName('W_layer')[0]; " +
515 // " a.parentNode.removeChild(a.previousSibling); " +
516 // " a.parentNode.removeChild(a); " +
517 // " } catch(e) { } } " );
// Delayed export; these steps repeat the ones in do_print's realprint
// (iso_a2 page setup, then print_full with the EXPORT action).
// Unlike do_print, the delay is passed without the `* 1` numeric coercion.
521 GLib.timeout_add(GLib.PRIORITY_LOW, BrowserSettings.delay, function() {
523 var mf = _t.get_main_frame();
525 var ar = Gtk.PaperSize.get_paper_sizes();
526 var psetup = new Gtk.PageSetup();
527 for(var i = 0; i < ar.length; i++) {
528 if (ar[i].get_name() =='iso_a2') {
529 psetup.set_paper_size(ar[i]);
533 var p = new Gtk.PrintOperation({ export_filename : BrowserSettings.export_filename });
534 p.set_default_page_setup(psetup);
535 mf.print_full(p, Gtk.PrintOperationAction.EXPORT);
536 print("made image - exiting");
// load_committed(web_view, web_frame): refreshes the toolbar via update_url
// and arms a low-priority fallback timer.
// Its load_committed signal connection is commented out further down.
548 var load_committed = function (web_view, web_frame)
550 print("load commited");
552 update_url(web_view, web_frame);
// NOTE(review): the comment below says 20 seconds and the log message says
// "3000 ms", but the timer interval is 40000 ms. The rest of the timer
// callback is not visible in this excerpt.
554 // call load finished after 20seconds??
555 // so even if it never complets we try and print the thing.
556 GLib.timeout_add(GLib.PRIORITY_LOW, 40000, function() {
557 print("load commited - 3000 ms?");
// clicked_link(web_view, web_frame, request, action, decision, window):
// navigation-policy handler that opens the requested URI in a new tab when a
// link is clicked with button 2.
// Its signal connection is commented out further down (see the segfault note).
// NOTE(review): this uses a bare `browser`, while other handlers use
// TabbedBrowser.browser; `browser` is not declared in the visible lines.
563 var clicked_link = function (web_view, web_frame, request,
564 action, decision, window)
566 if(action.get_reason() == WebKit.WebNavigationReason.LINK_CLICKED &&
567 action.get_button() == 2)
569 browser.new_tab(request.get_uri(), null);
// browse(url): normalises the URL and starts navigation.
//   url - target address; "http://" is prepended when it contains no "://"
// Weibo URLs are redirected to the login page while after_login is still false.
// NOTE(review): the bodies of both weibo branches are only partly visible
// (presumably the original URL is stored in after_login — confirm), and the
// call that actually loads `url` is on a line missing from this excerpt.
579 this.browse = function (url)
581 if(url.search("://") < 0)
582 url = "http://" + url;
586 print("BROWSE: " + url);
587 if (url.match(/\/weibo\.com\//) && after_login === false) {
590 url = "http://weibo.com/login.php";
592 else if (url.match(/\/weibo\.com\//) && after_login !== false) {
595 print("BROWSE -really: " + url);
// Accessor pair for the tab associated with this view.
// NOTE(review): both bodies are missing from this excerpt; presumably they
// assign and return the enclosing-scope `tab` used by the handlers above — confirm.
599 this.set_tab = function (new_tab)
604 this.get_tab = function ()
// Signal wiring for this view. In the visible lines only load_finished and
// create_web_view are connected; the title, load-committed, navigation-policy
// and hover handlers are left commented out.
611 //this.set_scroll_adjustments(null, null);
613 //this.signal.title_changed.connect(update_title);
614 //this.signal.load_committed.connect(load_committed);
615 this.signal.load_finished.connect(load_finished);
618 // For some reason, this segfaults seed in the instance init closure handler
619 // Once that's fixed, uncommenting the next line will give middle-click-open-in-new tab
620 //this.signal.navigation_policy_decision_requested.connect(clicked_link);
622 //this.signal.hovering_over_link.connect(hover_link);
624 this.signal.create_web_view.connect(create_new_tab);
628 // print("ADDing console message sig handler");
// toFilename(url): maps a URL onto a path under storedir + '/output'.
// NOTE(review): `storedir` and `ret` are defined outside the visible lines
// (presumably ret is the joined path), and the return value is not visible.
633 this.toFilename = function(url)
// Drop the leading scheme ("http://", "https://").
635 url = url.replace(/^http[s]*:\/\//, '');
636 var p = url.split('/');
637 p.unshift(storedir+'/output');
// URI-encode every component after the root directory (index 0)...
638 for (var i =1 ;i < p.length; i++) {
639 p[i] = encodeURIComponent(p[i]);
// ...then undo the encoding for the final component only.
642 p[p.length-1] = decodeURIComponent(p[p.length-1]);
644 var dir = File.dirname(ret);
// checkdomain(comp): returns true when `comp` has the same host and the same
// protocol as this view's current URI (this.uri), as parsed by parseUri.
649 this.checkdomain = function(comp)
651 var b = parseUri(this.uri);
652 var d = parseUri(comp);
653 return (d.host == b.host && d.protocol == b.protocol);
// dupeCheck(url): looks for a queue file named encodeURIComponent(url) in
// downloaddir, parsedir and donedir, in that order, and returns the path of
// the first one that exists.
// NOTE(review): the return value when nothing matches is not visible here;
// the moveTo* callers treat a falsy result as "no existing file".
// downloaddir / parsedir / donedir are defined outside the visible lines.
658 this.dupeCheck = function(url)
661 // order - return highest up the queue first..
662 if (File.exists(downloaddir +'/' + encodeURIComponent(url))) {
663 return downloaddir +'/' + encodeURIComponent(url);
665 if (File.exists(parsedir +'/' + encodeURIComponent(url))) {
666 return parsedir +'/' + encodeURIComponent(url);
668 if (File.exists(donedir +'/' + encodeURIComponent(url))) {
669 return donedir +'/' + encodeURIComponent(url);
// moveToParse(url): writes the queue entry for `url` into parsedir, carrying
// over the contents of any existing entry found by dupeCheck (empty otherwise).
// NOTE(review): the lines between the target computation and the write are
// missing, so whether the old file is removed or old === target is handled
// cannot be read from this excerpt.
675 this.moveToParse = function(url)
677 var old = this.dupeCheck(url);
678 var target =parsedir +'/' + encodeURIComponent(url);
682 File.write(target, old ? File.read(old) : '');
// moveToDownload(url): writes the queue entry for `url` into downloaddir,
// carrying over the contents of any existing entry found by dupeCheck (empty
// otherwise).
// NOTE(review): the lines between the target computation and the write are
// missing, so removal of the old file cannot be confirmed from this excerpt.
689 this.moveToDownload= function(url)
691 var old = this.dupeCheck(url);
692 var target =downloaddir +'/' + encodeURIComponent(url);
696 File.write(target, old ? File.read(old) : '');
// moveToDone(url): writes the queue entry for `url` into donedir, carrying
// over the contents of any existing entry found by dupeCheck (empty otherwise).
// NOTE(review): the lines between the target computation and the write are
// missing, so removal of the old file cannot be confirmed from this excerpt.
702 this.moveToDone= function(url)
704 var old = this.dupeCheck(url);
705 var target = donedir +'/' + encodeURIComponent(url);
709 File.write(target, old ? File.read(old) : '');
// parseUri(str): splits a URI string into named parts using the regular
// expressions configured on parseUri.options.
// NOTE(review): the declarations of `uri` and `i` and the return statement
// are on lines missing from this excerpt.
719 function parseUri (str) {
720 var o = parseUri.options,
// Pick the "strict" or "loose" pattern according to o.strictMode.
721 m = o.parser[o.strictMode ? "strict" : "loose"].exec(str),
// Copy each capture group into uri under the matching name from o.key;
// groups that did not participate become "".
725 while (i--) uri[o.key[i]] = m[i] || "";
// replace() is used only to iterate over the query string (o.key[12] is
// "query"): every name/value pair with a non-empty name is stored on
// uri[o.q.name]. The replaced string itself is discarded.
728 uri[o.key[12]].replace(o.q.parser, function ($0, $1, $2) {
729 if ($1) uri[o.q.name][$1] = $2;
737 key: ["source","protocol","authority","userInfo","user","password","host","port","relative","path","directory","file","query","anchor"],
740 parser: /(?:^|&)([^&=]*)=?([^&]*)/g
743 strict: /^(?:([^:\/?#]+):)?(?:\/\/((?:(([^:@]*)(?::([^:@]*))?)?@)?([^:\/?#]*)(?::(\d*))?))?((((?:[^?#\/]*\/)*)([^?#]*))(?:\?([^#]*))?(?:#(.*))?)/,
744 loose: /^(?:(?![^:@]+:[^:@\/]*@)([^:\/?#.]+):)?(?:\/\/)?((?:(([^:@]*)(?::([^:@]*))?)?@)?([^:\/?#]*)(?::(\d*))?)(((\/(?:[^?#](?![^?#\/]*\.[^?#\/.]+(?:[?#]|$)))*\/?)?([^?#\/]*))(?:\?([^#]*))?(?:#(.*))?)/