2 GLib = imports.gi.GLib;
3 WebKit = imports.gi.WebKit;
4 Soup = imports.gi.Soup;
6 TabbedBrowser = imports.TabbedBrowser;
7 BrowserSettings = imports.BrowserSettings;
8 BrowserTab = imports.BrowserTab;
10 File = imports.File.File;
12 base64 = imports.base64.base64;
// BrowserView: a GType whose parent type is WebKit.WebView.
14 BrowserView = new GType({
15 parent: WebKit.WebView.type,
// Point the default WebKit session's proxy_uri at a hard-coded proxy on localhost:3128.
// NOTE(review): the proxy address is a literal here; presumably it should be configurable - confirm.
21 var sess = WebKit.get_default_session();
22 sess.proxy_uri = new Soup.URI.c_new('http://localhost:3128');
// NOTE(review): no visible line reads browsePage; its purpose needs confirming.
26 var browsePage = false;
// Signal-style handler (web_view, web_frame, title): writes `title` into the label of the
// tab returned by tab.get_tab_label().
// The connect() call for title_changed further down is commented out, so this handler is
// not wired up by any visible line.
32 var update_title = function (web_view, web_frame, title)
35 print("calling update title");
// Shorten to the first 25 characters and append "...".
// NOTE(review): the condition guarding this truncation is not visible - confirm it only
// applies to long titles.
37 title = title.slice(0,25) + "...";
39 tab.get_tab_label().label = title;
// Serialises a DOM document to an HTML file.
//   doc - document object; its `head` and `body` are walked with traverseDOMTree.
//   fn  - NOTE(review): presumably the output filename stored on cb.fn - confirm.
//   sub - optional suffix; when truthy, '.' + sub is inserted before the '.html' extension.
// The output path is cb.fn with a trailing ".html" removed, plus the optional sub suffix,
// plus ".html". The written content is `ret` followed by '</HTML>'.
46 var traversedom = function(doc, fn, sub ) {
47 print("TRAVERSE DOM?");
// cb receives each emitted string fragment from traverseDOMTree.
// NOTE(review): presumably it appends to `ret`; the body is not visible - confirm.
52 var cb = function(s) {
62 //Roo.select('body > div',true).each(function(el) {
63 traverseDOMTree(cb, doc.head, 1);
64 traverseDOMTree(cb, doc.body, 1);
66 File.write(cb.fn.replace(/\.html$/, '')+ (sub ? ('.' + sub ) : '') + '.html' , ret +'</HTML>');
// Recursively emits markup for a DOM node through the callback `cb`.
//   cb             - function called with each output string; also carries cb.fn / cb.sub.
//   currentElement - the DOM node to serialise.
//   depth          - recursion depth; children are visited with depth+1.
// Text nodes emit their node_value. Other nodes emit an opening tag with their attributes,
// then their children, then a closing tag.
// NOTE(review): text and attribute values are passed to cb without any HTML escaping.
72 var traverseDOMTree = function(cb, currentElement, depth) {
75 //if (currentElement.class_name.match(/roo-dynamic/)) {
78 //print(currentElement.node_name);
80 var nodeName = currentElement.node_name;
81 var tagName = currentElement.tag_name;
// Text node: emit the raw text.
83 if (nodeName == '#text') {
84 cb(currentElement.node_value);
// NOTE(review): the SCRIPT branch body is not visible; presumably scripts are skipped - confirm.
93 if (nodeName == 'SCRIPT') {
97 //if (nodeName == 'STYLE') { return; }
99 // Emits the node tagName, such as <A>, <IMG>, etc
100 var outNodeName = nodeName;
101 if (nodeName == 'IFRAME') {
102 //outNodeName = 'DIV';
// Collect the attributes as name="value" strings.
// NOTE(review): `i` has no `var` on this line; unless it is declared on a line not shown,
// it is an implicit global shared by every recursive call - confirm.
111 for(i = 0; i < currentElement.attributes.length;i++) {
112 var aname = currentElement.attributes.item(i).name;
113 //if (aname =='class' || aname == 'style') {
// NOTE(review): the body of this branch is not visible; presumably the IFRAME's original
// src is skipped because a replacement src is pushed below - confirm.
116 if (aname =='src' && tagName == 'IFRAME') {
120 attr.push(aname + '="' + currentElement.attributes.item(i).value + '"' );
// For an IFRAME, add a src built from the basename of cb.fn (minus ".html"), cb.sub, and ".html".
122 if (tagName == 'IFRAME') {
123 attr.push('src="' + File.basename(cb.fn).replace(/\.html$/, '')+ '.' + cb.sub + '.html"' );
126 //if (nodeName == 'IFRAME') {
127 // attr.push('src="' + currentElement.attributes.item(i).value + embeded_file '"' );
130 //var style = elClassToStyle(currentElement);
131 //if (style.length) {
132 // attr.push('style="' + style + '"' );
136 //if (depth > 1000 && (tagName == 'BODY' || tagName == 'HEAD' )) {
137 // cb("<DIV"+ ( attr.length ? (' ' + attr.join(' ') ) : '') + ">");
// Emit the opening tag with any collected attributes.
139 cb("<"+outNodeName + ( attr.length ? (' ' + attr.join(' ') ) : '') + ">");
// An IFRAME's embedded document is handed to traversedom with the same cb.fn / cb.sub.
147 if (nodeName == 'IFRAME') {
150 traversedom(currentElement.content_document, cb.fn, cb.sub )
// Walk the child nodes by index.
// NOTE(review): the initialisation and increment of `i` for this loop are not visible.
159 var currentElementChild = currentElement.child_nodes.item(i);
161 while (currentElementChild) {
162 // Formatting code (indent the tree so it looks nice on the screen)
// Text children are emitted directly instead of recursing.
164 if (currentElementChild.node_name == '#text') {
165 // if (currentElementChild.node_value.length) {
166 cb(currentElementChild.node_value);
170 currentElementChild=currentElement.child_nodes.item(i);
175 //for (j = 0; j < depth; j++) {
176 // ¦ is just a vertical line
181 // Recursively traverse the tree structure of the child node
182 traverseDOMTree(cb, currentElementChild, depth+1);
184 currentElementChild=currentElement.child_nodes.item(i);
187 // The remaining code is mostly for formatting the tree
189 //for (j = 0; j < depth - 1; j++) {
194 // if (depth > 1000 && (tagName == 'BODY' || tagName == 'HEAD' )) {
// Emit the closing tag.
197 cb("</"+outNodeName+">");
// Refreshes the tab's toolbar: shows the frame's URI and updates the back/forward
// availability from the web view.
205 var update_url = function (web_view, web_frame)
207 var toolbar = tab.get_toolbar();
209 toolbar.set_url(web_frame.get_uri());
210 toolbar.set_can_go_back(web_view.can_go_back());
211 toolbar.set_can_go_forward(web_view.can_go_forward());
// Handler connected to the create_web_view signal.
// Overwrites the new_web_view argument with a fresh BrowserView and connects that view's
// web_view_ready signal to show_new_tab.
// NOTE(review): the return statement is not visible; presumably the new view is returned - confirm.
221 var create_new_tab = function (web_view, web_frame, new_web_view)
223 new_web_view = new BrowserView();
224 new_web_view.signal.web_view_ready.connect(show_new_tab);
// Handler for web_view_ready: opens a tab in TabbedBrowser.browser with an empty URL
// string and the given web view.
228 var show_new_tab = function (new_web_view)
230 TabbedBrowser.browser.new_tab("", new_web_view);
// Handler (web_view, link, url): shows `url` in the tab's status bar.
// The connect() call for hovering_over_link further down is commented out.
235 var hover_link = function (web_view, link, url)
237 tab.get_statusbar().set_status(url);
// Runs <__script_path__>/inject.js in the current tab's web view, keeping a per-URI
// counter in `injected`.
//   force - when truthy, the counter for this.uri is reset to 0 first.
242 this.add_inject = function(force)
// First visit to this URI (or a forced run): start the counter at 0.
245 if (force || (typeof(injected[this.uri]) == 'undefined' )) {
246 injected[this.uri] = 0;
// NOTE(review): the body of this branch is not visible; presumably it returns so the
// script is injected only a limited number of times per URI - confirm.
248 if (injected[this.uri] > 2) {
251 injected[this.uri]++;
252 var fn = __script_path__ + "/inject.js";
253 if (File.exists(fn)) {
254 // print("Adding inject");
// Same path as `fn` above, built a second time.
255 var newjs = File.read(__script_path__ + "/inject.js");
// NOTE(review): the argument is not visible; presumably `newjs` - confirm.
256 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
// Login-redirect state. It is compared against `false` and `true` and is also passed to
// browse(), so it holds false, true, or a URL to load.
// NOTE(review): the assignments are not visible - confirm the possible values.
264 var after_login = false;
// Set to true by load_finished; checked there via `if (load_finished_called)`.
267 var load_finished_called = false;
// NOTE(review): presumably guards do_print against running twice (see the
// "while already doing this" message) - confirm.
269 var done_print = false;
// Prepares the current page and schedules the export.
// It first runs clean-up scripts from <__script_path__>/domains/ in the current tab, then
// schedules `realprint` via GLib.timeout_add after BrowserSettings.delay milliseconds.
//   web_frame - frame whose DOM document is exported as HTML when
//               BrowserSettings.export_filename_html is set.
272 var do_print = function(web_frame) {
// realprint: performs the export (HTML via traversedom and/or print-to-file).
276 var realprint = function() {
// Site-specific script for theindependent.sg.
280 if (current_url.match(/theindependent\.sg\//) ) {
281 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
282 File.read( __script_path__ + "/domains/theindependent.sg.js")
// HTML export. `html` is not read by any visible line (the File.write below is disabled).
288 if (web_frame && BrowserSettings.export_filename_html ) {
289 var html = traversedom(web_frame.get_dom_document(), BrowserSettings.export_filename_html);
290 //File.write(BrowserSettings.export_filename_html, html);
294 if (!BrowserSettings.export_filename) {
295 if (!BrowserSettings.export_filename_html) {
296 print("no export filename / and html filename");
302 var mf = _t.get_main_frame();
// Choose the paper size named 'iso_a2' from the available sizes for the page setup.
304 print("Creating paper");
305 var ar = Gtk.PaperSize.get_paper_sizes();
306 var psetup = new Gtk.PageSetup();
307 for(var i = 0; i < ar.length; i++) {
308 if (ar[i].get_name() =='iso_a2') {
309 psetup.set_paper_size(ar[i]);
// Export the main frame to BrowserSettings.export_filename using a print operation.
312 print("doing print operation");
313 var p = new Gtk.PrintOperation({ export_filename : BrowserSettings.export_filename });
314 print("doing print operation - set page");
316 p.set_default_page_setup(psetup);
318 print("doing print operation - print_full");
319 mf.print_full(p, Gtk.PrintOperationAction.EXPORT);
320 print("made image - exiting");
325 print("error occured");
// NOTE(review): if `e` is an Error, JSON.stringify(e) usually yields "{}" because message
// and stack are not enumerable - consider printing e.message as well.
326 print(JSON.stringify(e));
333 print("do_print called -- while already doing this...");
337 print("do_print called");
// Always run the generic print-CSS removal script.
340 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
341 File.read( __script_path__ + "/domains/remove_print_css.js")
// Derive `chk` from the last two dot-separated labels of url_p[2] (the host part when the
// URL has the form scheme://host/...), e.g. "www.example.com" -> "example.com".
// Hosts under a two-label suffix such as "site.com.my" yield "com.my".
344 var url_p = current_url.split('/');
346 var dom_p = url_p[2].split('.');
347 var chk = dom_p.pop();
348 chk = dom_p.pop() + '.' + chk;
352 print("CHECK: " + chk +"\n");
// Run <__script_path__>/domains/<chk>.js when such a file exists.
353 if (File.exists( __script_path__ + "/domains/" + chk + '.js')) {
354 print("INCLUDING: " + __script_path__ + "/domains/"+ chk + ".js\n");
355 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
356 File.read( __script_path__ + "/domains/"+ chk + ".js")
361 // motorme - requires a scroll to make content appear..
362 if (current_url.match(/\.motorme\.my\//) ) {
363 TabbedBrowser.browser.current_tab().get_web_view().execute_script("window.scrollTo(0,500);");
// NOTE(review): match() with a string argument compiles it as a regular expression, so the
// '.' here matches any character, unlike the escaped regex literals used above.
367 if (current_url.match('/forbes.com')) {
372 print("Delay:" + BrowserSettings.delay);
// `*1` coerces the delay to a number before it is handed to GLib.
376 GLib.timeout_add(GLib.PRIORITY_DEFAULT, BrowserSettings.delay *1, realprint);
// Weibo-related state flags.
// NOTE(review): no visible line reads or writes these; presumably they track whether the
// weibo login script was injected and whether the current site is weibo - confirm.
380 var weibo_added = false;
382 var is_weibo = false;
// Handler connected to the load_finished signal.
// Visible behaviour: handles the weibo login flow driven by `after_login`, then (guarded by
// load_finished_called) schedules a print-to-file export after BrowserSettings.delay.
// NOTE(review): the nesting of the branches below is not fully visible; the comments
// describe each statement on its own.
385 var load_finished = function (webkit, web_frame, wb)
396 print("load finished");
399 if (after_login === true) {
405 if (after_login === false) {
408 print("adding timeout?");
// After 2000 ms, browse to the value held in after_login.
410 GLib.timeout_add(GLib.PRIORITY_LOW, 2000, function() {
411 print("Redirecting after login?" + after_login);
413 _t.browse(after_login);
// Load the weibo helper script into the page.
420 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
421 File.read( __script_path__ + "/weibo.js")
// NOTE(review): this prints the username and password to stdout in clear text.
423 print("run_weibo(" + JSON.stringify( BrowserSettings.username ) + ", " + JSON.stringify(BrowserSettings.passwd) + ");");
// Call run_weibo(username, passwd) in the page; JSON.stringify quotes the values as JS literals.
425 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
426 "run_weibo(" + JSON.stringify( BrowserSettings.username ) + ", " + JSON.stringify(BrowserSettings.passwd) + ");"
432 if (after_login !== false) {
435 // wait a bit then load the real page..
436 GLib.timeout_add(GLib.PRIORITY_LOW, 500, function() {
437 print("Redirecting after login?");
438 _t.browse(after_login);
// NOTE(review): presumably returns early when this handler has already run - confirm.
444 if (load_finished_called) {
448 load_finished_called = true;
// Disabled in-page weibo handling, kept for reference.
452 // if(document.location.host=='weibo.com') {
453 // // clear login dialog from weibo.
454 // //check and hidden the login dialog and overlay .....
455 // var els = document.querySelectorAll('div[node-type]');
457 // for (i = 0; i < els.length; i++) {
458 // if (els[i].hasAttribute('node-type')) {
459 // if(els[i].getAttribute('node-type') == 'outer'){
464 // for (i = 0; i < bbc.length; i++) {// hide all the outer.....
465 // bbc[i].style.display = 'none';
469 // if(document.location.pathname == '/login.php'){
471 // // fills in the user name and password
472 // var els = document.querySelectorAll('input[node-type]');
474 // for (i = 0; i < els.length; i++) {
475 // if (els[i].hasAttribute('node-type')) {
476 // if(els[i].getAttribute('node-type') == 'username'){
477 // els[i].value = BrowserSettings.username;
479 // if(els[i].getAttribute('node-type') == 'password'){
480 // els[i].value = BrowserSettings.passwd;
486 // // simulating click event to login ....
487 // var elss = document.querySelectorAll('a[node-type]');
489 // for (i = 0; i < elss.length; i++) {
490 // if (elss[i].hasAttribute('node-type')) {
491 // if(elss[i].getAttribute('node-type') == 'submitBtn'){
503 // clear login dialog from weibo.
504 // TabbedBrowser.browser.current_tab().get_web_view().execute_script(
505 // " if (document.location.host=='weibo.com') { " +
507 // " var a = document.getElementsByClassName('W_layer')[0]; " +
508 // " a.parentNode.removeChild(a.previousSibling); " +
509 // " a.parentNode.removeChild(a); " +
510 // " } catch(e) { } } " );
// After the configured delay, export the main frame to BrowserSettings.export_filename on
// 'iso_a2' paper. These are the same steps as realprint in do_print.
// NOTE(review): unlike do_print, the delay is passed without the `*1` numeric coercion.
514 GLib.timeout_add(GLib.PRIORITY_LOW, BrowserSettings.delay, function() {
516 var mf = _t.get_main_frame();
518 var ar = Gtk.PaperSize.get_paper_sizes();
519 var psetup = new Gtk.PageSetup();
520 for(var i = 0; i < ar.length; i++) {
521 if (ar[i].get_name() =='iso_a2') {
522 psetup.set_paper_size(ar[i]);
526 var p = new Gtk.PrintOperation({ export_filename : BrowserSettings.export_filename });
527 p.set_default_page_setup(psetup);
528 mf.print_full(p, Gtk.PrintOperationAction.EXPORT);
529 print("made image - exiting");
// Handler (web_view, web_frame) for load_committed: refreshes the toolbar via update_url
// and starts a fallback timer.
// The connect() call for load_committed further down is commented out.
541 var load_committed = function (web_view, web_frame)
543 print("load commited");
545 update_url(web_view, web_frame);
547 // Fallback timer: fires after 40000 ms (the log message below still says 3000 ms),
548 // so even if the load never completes we try and print the thing.
549 GLib.timeout_add(GLib.PRIORITY_LOW, 40000, function() {
550 print("load commited - 3000 ms?");
// Navigation-policy handler: when the navigation was caused by a link click with button 2,
// the request's URI is opened in a new tab.
// The connect() call for navigation_policy_decision_requested further down is commented out.
// NOTE(review): this calls bare `browser.new_tab`, while the rest of the file uses
// TabbedBrowser.browser - confirm that `browser` is in scope here.
556 var clicked_link = function (web_view, web_frame, request,
557 action, decision, window)
559 if(action.get_reason() == WebKit.WebNavigationReason.LINK_CLICKED &&
560 action.get_button() == 2)
562 browser.new_tab(request.get_uri(), null);
// Navigates this view to `url`.
//   url - address to load; "http://" is prepended when it contains no "://".
// URLs containing "/weibo.com/" are replaced by the weibo login page while after_login is
// false.
// NOTE(review): presumably the original URL is stored in after_login so it can be loaded
// after login, and the actual load call follows the final print; neither is visible - confirm.
572 this.browse = function (url)
574 if(url.search("://") < 0)
575 url = "http://" + url;
579 print("BROWSE: " + url);
580 if (url.match(/\/weibo\.com\//) && after_login === false) {
583 url = "http://weibo.com/login.php";
585 else if (url.match(/\/weibo\.com\//) && after_login !== false) {
588 print("BROWSE -really: " + url);
// NOTE(review): presumably stores new_tab in the `tab` variable that update_title,
// update_url and hover_link read - confirm against the body.
592 this.set_tab = function (new_tab)
// NOTE(review): presumably returns the tab stored by set_tab - confirm against the body.
597 this.get_tab = function ()
// Signal wiring. Only load_finished and create_web_view are connected; the title,
// load-committed, navigation-policy and hover handlers are disabled.
604 //this.set_scroll_adjustments(null, null);
606 //this.signal.title_changed.connect(update_title);
607 //this.signal.load_committed.connect(load_committed);
608 this.signal.load_finished.connect(load_finished);
611 // For some reason, this segfaults seed in the instance init closure handler
612 // Once that's fixed, uncommenting the next line will give middle-click-open-in-new tab
613 //this.signal.navigation_policy_decision_requested.connect(clicked_link);
615 //this.signal.hovering_over_link.connect(hover_link);
617 this.signal.create_web_view.connect(create_new_tab);
621 // print("Adding console message sig handler");
// Maps a URL to a path under <storedir>/output.
//   url - the URL; a leading "http://" or "https://" is removed ([s]* also accepts repeated 's').
// NOTE(review): the assignment of `ret` and the return are not visible; presumably
// ret = p.join('/') - confirm.
626 this.toFilename = function(url)
628 url = url.replace(/^http[s]*:\/\//, '');
629 var p = url.split('/');
// Index 0 becomes the output root; it is not URI-encoded by the loop below.
630 p.unshift(storedir+'/output');
631 for (var i =1 ;i < p.length; i++) {
632 p[i] = encodeURIComponent(p[i]);
// Decode the last segment again, undoing the encoding applied in the loop.
635 p[p.length-1] = decodeURIComponent(p[p.length-1]);
637 var dir = File.dirname(ret);
// Returns true when `comp` has the same host and protocol as this.uri; both are split
// with parseUri.
//   comp - URL string to compare against this view's URI.
642 this.checkdomain = function(comp)
644 var b = parseUri(this.uri);
645 var d = parseUri(comp);
646 return (d.host == b.host && d.protocol == b.protocol);
// Looks for a queue file named encodeURIComponent(url) in downloaddir, then parsedir, then
// donedir, and returns the path of the first one that exists.
// NOTE(review): the return value when none exists is not visible; callers test the result
// for truthiness, so presumably it is false - confirm.
651 this.dupeCheck = function(url)
654 // order - return highest up the queue first..
655 if (File.exists(downloaddir +'/' + encodeURIComponent(url))) {
656 return downloaddir +'/' + encodeURIComponent(url);
658 if (File.exists(parsedir +'/' + encodeURIComponent(url))) {
659 return parsedir +'/' + encodeURIComponent(url);
661 if (File.exists(donedir +'/' + encodeURIComponent(url))) {
662 return donedir +'/' + encodeURIComponent(url);
// Writes the queue file for `url` into parsedir. The content is copied from the existing
// queue file found by dupeCheck, or is empty when none exists.
// NOTE(review): the lines between are not visible; presumably they skip the case where the
// file is already in place and remove the old file - confirm.
668 this.moveToParse = function(url)
670 var old = this.dupeCheck(url);
671 var target =parsedir +'/' + encodeURIComponent(url);
675 File.write(target, old ? File.read(old) : '');
// Writes the queue file for `url` into downloaddir. The content is copied from the
// existing queue file found by dupeCheck, or is empty when none exists.
// NOTE(review): the lines between are not visible; presumably they skip the case where the
// file is already in place and remove the old file - confirm.
682 this.moveToDownload= function(url)
684 var old = this.dupeCheck(url);
685 var target =downloaddir +'/' + encodeURIComponent(url);
689 File.write(target, old ? File.read(old) : '');
// Writes the queue file for `url` into donedir. The content is copied from the existing
// queue file found by dupeCheck, or is empty when none exists.
// NOTE(review): the lines between are not visible; presumably they skip the case where the
// file is already in place and remove the old file - confirm.
695 this.moveToDone= function(url)
697 var old = this.dupeCheck(url);
698 var target = donedir +'/' + encodeURIComponent(url);
702 File.write(target, old ? File.read(old) : '');
// Splits a URI string into named parts using the regular expressions in parseUri.options.
//   str - the URI string to parse.
// NOTE(review): the return statement is not visible; presumably the `uri` object is
// returned, since checkdomain reads .host and .protocol from the result - confirm.
712 function parseUri (str) {
713 var o = parseUri.options,
// Pick the "strict" or "loose" parser according to o.strictMode and run it on str.
714 m = o.parser[o.strictMode ? "strict" : "loose"].exec(str),
// Copy each capture group into uri under the matching name from o.key ("" when a group did not match).
718 while (i--) uri[o.key[i]] = m[i] || "";
// o.key[12] is "query": split the query string into name/value pairs stored under uri[o.q.name].
721 uri[o.key[12]].replace(o.q.parser, function ($0, $1, $2) {
722 if ($1) uri[o.q.name][$1] = $2;
730 key: ["source","protocol","authority","userInfo","user","password","host","port","relative","path","directory","file","query","anchor"],
733 parser: /(?:^|&)([^&=]*)=?([^&]*)/g
736 strict: /^(?:([^:\/?#]+):)?(?:\/\/((?:(([^:@]*)(?::([^:@]*))?)?@)?([^:\/?#]*)(?::(\d*))?))?((((?:[^?#\/]*\/)*)([^?#]*))(?:\?([^#]*))?(?:#(.*))?)/,
737 loose: /^(?:(?![^:@]+:[^:@\/]*@)([^:\/?#.]+):)?(?:\/\/)?((?:(([^:@]*)(?::([^:@]*))?)?@)?([^:\/?#]*)(?::(\d*))?)(((\/(?:[^?#](?![^?#\/]*\.[^?#\/.]+(?:[?#]|$)))*\/?)?([^?#\/]*))(?:\?([^#]*))?(?:#(.*))?)/