2 GLib = imports.gi.GLib;
3 WebKit = imports.gi.WebKit;
4 Soup = imports.gi.Soup;
6 TabbedBrowser = imports.TabbedBrowser;
7 BrowserSettings = imports.BrowserSettings;
8 BrowserTab = imports.BrowserTab;
10 File = imports.File.File;
12 base64 = imports.base64.base64;
// BrowserView: a GType whose parent type is WebKit.WebView.
// NOTE(review): this listing omits lines (see the gaps in the embedded
// numbering), so the remainder of the GType definition is not visible here.
14 BrowserView = new GType({
15 parent: WebKit.WebView.type,
// Point the default WebKit session at a proxy. The proxy address is
// hard-coded to http://localhost:3128.
21 var sess = WebKit.get_default_session();
22 sess.proxy_uri = new Soup.URI.c_new('http://localhost:3128');
// Starts as false; where it is read or changed is not visible in this extract.
26 var browsePage = false;
// update_title(web_view, web_frame, title): logs the call, shortens the title
// to its first 25 characters followed by "...", and assigns it to the label
// of `tab` (a variable from the enclosing scope).
// NOTE(review): any condition guarding the truncation sits on a line that is
// not shown here -- confirm whether short titles also get the "..." suffix.
32 var update_title = function (web_view, web_frame, title)
35 print("calling update title");
37 title = title.slice(0,25) + "...";
39 tab.get_tab_label().label = title;
// traversedom(doc, fn, sub): serialises a DOM document to an .html file.
//   doc - DOM document; its `head` and `body` are walked with traverseDOMTree.
//   fn  - output filename (NOTE(review): presumably stored as cb.fn on a line
//         not shown -- confirm).
//   sub - optional suffix; when truthy, "." + sub is inserted before ".html".
46 var traversedom = function(doc, fn, sub ) {
47 print("TRAVERSE DOM?");
// Callback handed to traverseDOMTree; it receives each emitted string `s`.
// Its body is not visible in this extract.
52 var cb = function(s) {
62 //Roo.select('body > div',true).each(function(el) {
63 traverseDOMTree(cb, doc.head, 1);
64 traverseDOMTree(cb, doc.body, 1);
// Output path: cb.fn with a trailing ".html" removed, plus the optional
// ".sub" part, plus ".html". The content written is `ret` followed by a
// closing </HTML> tag (`ret` is built on lines not shown).
66 File.write(cb.fn.replace(/\.html$/, '')+ (sub ? ('.' + sub ) : '') + '.html' , ret +'</HTML>');
// traverseDOMTree(cb, currentElement, depth): recursively walks a DOM node and
// passes markup strings to `cb`.
//   cb             - function called with each output string; cb.fn and
//                    cb.sub are also read for IFRAME handling.
//   currentElement - DOM node to serialise.
//   depth          - recursion depth; incremented by one for each child call.
// NOTE(review): several lines of this function are missing from the listing;
// the comments below describe only the visible statements.
72 var traverseDOMTree = function(cb, currentElement, depth) {
75 //if (currentElement.class_name.match(/roo-dynamic/)) {
78 //print(currentElement.node_name);
80 var nodeName = currentElement.node_name;
81 var tagName = currentElement.tag_name;
// Text nodes are emitted verbatim.
83 if (nodeName == '#text') {
84 cb(currentElement.node_value);
// SCRIPT elements get special treatment; the branch body is not visible here.
93 if (nodeName == 'SCRIPT') {
97 //if (nodeName == 'STYLE') { return; }
99 // Prints the node tagName, such as <A>, <IMG>, etc
100 var outNodeName = nodeName;
101 if (nodeName == 'IFRAME') {
102 //outNodeName = 'DIV';
// Collect the element's attributes as name="value" strings.
// NOTE(review): `i` has no `var` on this line; unless it is declared on an
// omitted line it is an implicit global, and this function is recursive.
// NOTE(review): attribute values are concatenated without escaping, so a value
// containing a double quote would produce malformed markup.
111 for(i = 0; i < currentElement.attributes.length;i++) {
112 var aname = currentElement.attributes.item(i).name;
113 //if (aname =='class' || aname == 'style') {
// The original `src` of an IFRAME is handled separately (body not visible).
116 if (aname =='src' && tagName == 'IFRAME') {
120 attr.push(aname + '="' + currentElement.attributes.item(i).value + '"' );
// For an IFRAME, add a src built from the base name of cb.fn (without
// ".html"), then "." + cb.sub + ".html".
122 if (tagName == 'IFRAME') {
123 attr.push('src="' + File.basename(cb.fn).replace(/\.html$/, '')+ '.' + cb.sub + '.html"' );
126 //if (nodeName == 'IFRAME') {
127 // attr.push('src="' + currentElement.attributes.item(i).value + embeded_file '"' );
130 //var style = elClassToStyle(currentElement);
131 //if (style.length) {
132 // attr.push('style="' + style + '"' );
136 //if (depth > 1000 && (tagName == 'BODY' || tagName == 'HEAD' )) {
137 // cb("<DIV"+ ( attr.length ? (' ' + attr.join(' ') ) : '') + ">");
// Emit the opening tag with the collected attributes.
139 cb("<"+outNodeName + ( attr.length ? (' ' + attr.join(' ') ) : '') + ">");
// An IFRAME's embedded document is serialised through traversedom.
147 if (nodeName == 'IFRAME') {
150 traversedom(currentElement.content_document, cb.fn, cb.sub )
// Iterate over the child nodes by index `i` (its update is on lines not shown).
159 var currentElementChild = currentElement.child_nodes.item(i);
161 while (currentElementChild) {
162 // Formatting code (indent the tree so it looks nice on the screen)
// Text children are emitted directly rather than through a recursive call.
164 if (currentElementChild.node_name == '#text') {
165 // if (currentElementChild.node_value.length) {
166 cb(currentElementChild.node_value);
170 currentElementChild=currentElement.child_nodes.item(i);
175 //for (j = 0; j < depth; j++) {
176 // ¦ is just a vertical line
181 // Recursively traverse the tree structure of the child node
182 traverseDOMTree(cb, currentElementChild, depth+1);
184 currentElementChild=currentElement.child_nodes.item(i);
187 // The remaining code is mostly for formatting the tree
189 //for (j = 0; j < depth - 1; j++) {
194 // if (depth > 1000 && (tagName == 'BODY' || tagName == 'HEAD' )) {
// Emit the closing tag.
197 cb("</"+outNodeName+">");
// update_url(web_view, web_frame): refreshes the toolbar of `tab` with the
// frame's URI and with the view's back/forward availability.
205 var update_url = function (web_view, web_frame)
207 var toolbar = tab.get_toolbar();
209 toolbar.set_url(web_frame.get_uri());
210 toolbar.set_can_go_back(web_view.can_go_back());
211 toolbar.set_can_go_forward(web_view.can_go_forward());
// create_new_tab(web_view, web_frame, new_web_view): connected to the
// create_web_view signal. The incoming `new_web_view` argument is overwritten
// with a fresh BrowserView, whose web_view_ready signal is connected to
// show_new_tab. The return statement, if any, is on a line not shown here.
221 var create_new_tab = function (web_view, web_frame, new_web_view)
223 new_web_view = new BrowserView();
224 new_web_view.signal.web_view_ready.connect(show_new_tab);
// show_new_tab(new_web_view): opens a new tab in TabbedBrowser.browser for the
// given view, passing an empty string as the URL.
228 var show_new_tab = function (new_web_view)
230 TabbedBrowser.browser.new_tab("", new_web_view);
// hover_link(web_view, link, url): shows `url` in the status bar of `tab`.
// Its signal connection is commented out elsewhere in this listing.
235 var hover_link = function (web_view, link, url)
237 tab.get_statusbar().set_status(url);
// add_inject(force): runs the contents of inject.js (located in
// __script_path__) in the current tab's web view, tracking a per-URI counter
// in `injected`.
//   force - when truthy, the counter for this.uri is reset to 0 first.
242 this.add_inject = function(force)
// Start (or restart) the counter for this URI.
245 if (force || (typeof(injected[this.uri]) == 'undefined' )) {
246 injected[this.uri] = 0;
// More than two injections for this URI: the branch body is not visible.
// NOTE(review): presumably it returns early -- confirm.
248 if (injected[this.uri] > 2) {
251 injected[this.uri]++;
252 var fn = __script_path__ + "/inject.js";
253 if (File.exists(fn)) {
254 // print("Adding inject");
// The path is rebuilt here instead of reusing `fn`; both are the same string.
255 var newjs = File.read(__script_path__ + "/inject.js");
256 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
// State shared by the load and print handlers in this closure.
// after_login is compared against true and false elsewhere and is also passed
// to browse(), so it holds either a boolean or a URL.
264 var after_login = false;
267 var load_finished_called = false;
269 var done_print = false;
// do_print(web_frame): runs per-site clean-up scripts in the current tab and
// then, after BrowserSettings.delay, exports the page through `realprint`.
// NOTE(review): several lines are missing from this listing (guards, try/catch,
// exit calls); comments describe only the visible statements.
270 var do_print = function(web_frame) {
// Logged when a print is already in progress (the guard itself is not shown).
274 print("do_print called -- while already doing this...");
278 print("do_print called");
// Always run the generic print-CSS removal script first.
281 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
282 File.read( __script_path__ + "/domains/remove_print_css.js")
// Derive "<domain>.<tld>" from the host part of current_url: element 2 of the
// '/'-split URL is the host, and its last two dot-separated labels are joined.
285 var url_p = current_url.split('/');
287 var dom_p = url_p[2].split('.');
288 var chk = dom_p.pop();
289 chk = dom_p.pop() + '.' + chk;
293 print("CHECK: " + chk +"\n");
// If a script named after that domain exists under domains/, run it as well.
294 if (File.exists( __script_path__ + "/domains/" + chk + '.js')) {
295 print("INCLUDING: " + __script_path__ + "/domains/"+ chk + ".js\n");
296 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
297 File.read( __script_path__ + "/domains/"+ chk + ".js")
302 // motorme - requires a scroll to make content appear..
303 if (current_url.match(/\.motorme\.my\//) ) {
304 TabbedBrowser.browser.current_tab().get_web_view().execute_script("window.scrollTo(0,500);");
// NOTE(review): match() is given a string here, so it is treated as a regular
// expression and "." matches any character. The branch body is not visible.
308 if (current_url.match('/forbes.com')) {
313 print("Delay:" + BrowserSettings.delay);
// realprint(): the deferred step that performs the actual export.
316 var realprint = function() {
320 if (current_url.match(/theindependent\.sg\//) ) {
321 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
322 File.read( __script_path__ + "/domains/theindependent.sg.js")
// Optional HTML export: traversedom writes the file(s) itself.
328 if (web_frame && BrowserSettings.export_filename_html ) {
329 var html = traversedom(web_frame.get_dom_document(), BrowserSettings.export_filename_html);
330 //File.write(BrowserSettings.export_filename_html, html);
// Without an export filename there is nothing to print; what happens next in
// this branch is on lines not shown.
334 if (!BrowserSettings.export_filename) {
335 if (!BrowserSettings.export_filename_html) {
336 print("no export filename / and html filename");
342 var mf = _t.get_main_frame();
344 print("Creating paper");
// Select the paper size named 'iso_a2' from the available sizes.
345 var ar = Gtk.PaperSize.get_paper_sizes();
346 var psetup = new Gtk.PageSetup();
347 for(var i = 0; i < ar.length; i++) {
348 if (ar[i].get_name() =='iso_a2') {
349 psetup.set_paper_size(ar[i]);
352 print("doing print operation");
// Export (rather than send to a printer) to BrowserSettings.export_filename.
353 var p = new Gtk.PrintOperation({ export_filename : BrowserSettings.export_filename });
354 print("doing print operation - set page");
356 p.set_default_page_setup(psetup);
358 print("doing print operation - print_full");
359 mf.print_full(p, Gtk.PrintOperationAction.EXPORT);
360 print("made image - exiting");
// Error reporting; the enclosing try/catch is not visible in this listing.
365 print("error occured");
366 print(JSON.stringify(e));
// Schedule realprint after the configured delay (`*1` coerces it to a number).
371 GLib.timeout_add(GLib.PRIORITY_DEFAULT, BrowserSettings.delay *1, realprint);
// Weibo-related flags; their updates are not visible in this listing.
375 var weibo_added = false;
377 var is_weibo = false;
// load_finished(webkit, web_frame, wb): handler connected to the view's
// load_finished signal. The visible parts handle a weibo login flow driven by
// `after_login`, then schedule an export of the page after
// BrowserSettings.delay.
// NOTE(review): many lines are missing here, so the nesting of the branches
// below cannot be determined from this listing.
380 var load_finished = function (webkit, web_frame, wb)
391 print("load finished");
394 if (after_login === true) {
400 if (after_login === false) {
403 print("adding timeout?");
// After 2 seconds, navigate to the URL held in after_login.
405 GLib.timeout_add(GLib.PRIORITY_LOW, 2000, function() {
406 print("Redirecting after login?" + after_login);
408 _t.browse(after_login);
// Load the weibo helper script into the page.
415 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
416 File.read( __script_path__ + "/weibo.js")
// NOTE(review): this prints the username and password to the log in clear text.
418 print("run_weibo(" + JSON.stringify( BrowserSettings.username ) + ", " + JSON.stringify(BrowserSettings.passwd) + ");");
// Invoke run_weibo() in the page with the JSON-encoded credentials.
420 TabbedBrowser.browser.current_tab().get_web_view().execute_script(
421 "run_weibo(" + JSON.stringify( BrowserSettings.username ) + ", " + JSON.stringify(BrowserSettings.passwd) + ");"
427 if (after_login !== false) {
430 // wait a bit then load the real page..
431 GLib.timeout_add(GLib.PRIORITY_LOW, 500, function() {
432 print("Redirecting after login?");
433 _t.browse(after_login);
// load_finished_called is tested and then set; the body of the test is not
// shown. NOTE(review): presumably it returns on a repeated call -- confirm.
439 if (load_finished_called) {
443 load_finished_called = true;
// The following commented-out block is an earlier in-page weibo login script.
447 // if(document.location.host=='weibo.com') {
448 // // clear login dialog from weibo.
449 // //check and hide the login dialog and overlay .....
450 // var els = document.querySelectorAll('div[node-type]');
452 // for (i = 0; i < els.length; i++) {
453 // if (els[i].hasAttribute('node-type')) {
454 // if(els[i].getAttribute('node-type') == 'outer'){
459 // for (i = 0; i < bbc.length; i++) {// hide all the outer.....
460 // bbc[i].style.display = 'none';
464 // if(document.location.pathname == '/login.php'){
466 // // fills in the user name and password
467 // var els = document.querySelectorAll('input[node-type]');
469 // for (i = 0; i < els.length; i++) {
470 // if (els[i].hasAttribute('node-type')) {
471 // if(els[i].getAttribute('node-type') == 'username'){
472 // els[i].value = BrowserSettings.username;
474 // if(els[i].getAttribute('node-type') == 'password'){
475 // els[i].value = BrowserSettings.passwd;
481 // // simulating click event to login ....
482 // var elss = document.querySelectorAll('a[node-type]');
484 // for (i = 0; i < elss.length; i++) {
485 // if (elss[i].hasAttribute('node-type')) {
486 // if(elss[i].getAttribute('node-type') == 'submitBtn'){
498 // clear login dialog from weibo.
499 // TabbedBrowser.browser.current_tab().get_web_view().execute_script(
500 // " if (document.location.host=='weibo.com') { " +
502 // " var a = document.getElementsByClassName('W_layer')[0]; " +
503 // " a.parentNode.removeChild(a.previousSibling); " +
504 // " a.parentNode.removeChild(a); " +
505 // " } catch(e) { } } " );
// After the configured delay, export the main frame to
// BrowserSettings.export_filename using the 'iso_a2' paper size. These are the
// same steps as the export inside do_print's realprint.
509 GLib.timeout_add(GLib.PRIORITY_LOW, BrowserSettings.delay, function() {
511 var mf = _t.get_main_frame();
513 var ar = Gtk.PaperSize.get_paper_sizes();
514 var psetup = new Gtk.PageSetup();
515 for(var i = 0; i < ar.length; i++) {
516 if (ar[i].get_name() =='iso_a2') {
517 psetup.set_paper_size(ar[i]);
521 var p = new Gtk.PrintOperation({ export_filename : BrowserSettings.export_filename });
522 p.set_default_page_setup(psetup);
523 mf.print_full(p, Gtk.PrintOperationAction.EXPORT);
524 print("made image - exiting");
// load_committed(web_view, web_frame): logs, refreshes the toolbar through
// update_url, and arms a 40-second fallback timer. Its signal connection is
// commented out elsewhere in this listing.
536 var load_committed = function (web_view, web_frame)
538 print("load commited");
540 update_url(web_view, web_frame);
542 // call load finished after 40 seconds (the timeout below is 40000 ms),
543 // so even if it never completes we try and print the thing.
// NOTE(review): the log message below says "3000 ms" but the delay is 40000 ms;
// the rest of the callback body is not visible here.
544 GLib.timeout_add(GLib.PRIORITY_LOW, 40000, function() {
545 print("load commited - 3000 ms?");
// clicked_link(web_view, web_frame, request, action, decision, window):
// navigation-policy handler. When the navigation reason is LINK_CLICKED and
// the mouse button is 2, the request URI is opened in a new tab.
// NOTE(review): this calls a bare `browser`, whereas other code in this file
// uses TabbedBrowser.browser -- confirm `browser` is defined in scope.
551 var clicked_link = function (web_view, web_frame, request,
552 action, decision, window)
554 if(action.get_reason() == WebKit.WebNavigationReason.LINK_CLICKED &&
555 action.get_button() == 2)
557 browser.new_tab(request.get_uri(), null);
// browse(url): normalises `url` and navigates to it.
//   url - address to load; "http://" is prepended when it contains no "://".
// NOTE(review): the statement that actually starts the load is on a line not
// shown in this listing.
567 this.browse = function (url)
569 if(url.search("://") < 0)
570 url = "http://" + url;
574 print("BROWSE: " + url);
// A weibo.com URL requested before login is replaced by the weibo login page.
// NOTE(review): presumably the original URL is stored in after_login on an
// omitted line -- confirm.
575 if (url.match(/\/weibo\.com\//) && after_login === false) {
578 url = "http://weibo.com/login.php";
// weibo.com URL once after_login has been set; the branch body is not shown.
580 else if (url.match(/\/weibo\.com\//) && after_login !== false) {
583 print("BROWSE -really: " + url);
// Accessors for the tab associated with this view.
// NOTE(review): both bodies are missing from this listing; presumably they
// write and read the `tab` variable used by the handlers above -- confirm.
587 this.set_tab = function (new_tab)
592 this.get_tab = function ()
// Signal wiring for this view. Only load_finished and create_web_view are
// connected; the title, load-committed, navigation-policy and hover handlers
// are left commented out.
599 //this.set_scroll_adjustments(null, null);
601 //this.signal.title_changed.connect(update_title);
602 //this.signal.load_committed.connect(load_committed);
603 this.signal.load_finished.connect(load_finished);
606 // For some reason, this segfaults seed in the instance init closure handler
607 // Once that's fixed, uncommenting the next line will give middle-click-open-in-new tab
608 //this.signal.navigation_policy_decision_requested.connect(clicked_link);
610 //this.signal.hovering_over_link.connect(hover_link);
612 this.signal.create_web_view.connect(create_new_tab);
616 // print("ADDing console message sig handler");
// toFilename(url): maps a URL to a path under storedir + '/output'.
// NOTE(review): the lines that build `ret` and return a value are not shown.
621 this.toFilename = function(url)
// Drop the leading http:// or https:// scheme.
623 url = url.replace(/^http[s]*:\/\//, '');
624 var p = url.split('/');
625 p.unshift(storedir+'/output');
// URI-encode every URL segment; index 0 is the output directory and is skipped.
626 for (var i =1 ;i < p.length; i++) {
627 p[i] = encodeURIComponent(p[i]);
// The final segment is decoded again, so it ends up unencoded.
630 p[p.length-1] = decodeURIComponent(p[p.length-1]);
632 var dir = File.dirname(ret);
// checkdomain(comp): returns true when `comp` has the same host and the same
// protocol as this.uri, both parsed with parseUri.
637 this.checkdomain = function(comp)
639 var b = parseUri(this.uri);
640 var d = parseUri(comp);
641 return (d.host == b.host && d.protocol == b.protocol);
// dupeCheck(url): looks for a file named encodeURIComponent(url) in
// downloaddir, then parsedir, then donedir, and returns the path of the first
// one that exists.
// NOTE(review): the return value when none exists is on a line not shown; the
// moveTo* callers test the result for truthiness.
646 this.dupeCheck = function(url)
649 // order - return highest up the queue first..
650 if (File.exists(downloaddir +'/' + encodeURIComponent(url))) {
651 return downloaddir +'/' + encodeURIComponent(url);
653 if (File.exists(parsedir +'/' + encodeURIComponent(url))) {
654 return parsedir +'/' + encodeURIComponent(url);
656 if (File.exists(donedir +'/' + encodeURIComponent(url))) {
657 return donedir +'/' + encodeURIComponent(url);
// moveToParse(url): writes the queue entry for `url` into parsedir, copying
// the content of any existing entry found by dupeCheck (empty string when
// there is none).
// NOTE(review): removal of the old entry, if any, is on lines not shown.
663 this.moveToParse = function(url)
665 var old = this.dupeCheck(url);
666 var target =parsedir +'/' + encodeURIComponent(url);
670 File.write(target, old ? File.read(old) : '');
// moveToDownload(url): writes the queue entry for `url` into downloaddir,
// copying the content of any existing entry found by dupeCheck (empty string
// when there is none).
// NOTE(review): removal of the old entry, if any, is on lines not shown.
677 this.moveToDownload= function(url)
679 var old = this.dupeCheck(url);
680 var target =downloaddir +'/' + encodeURIComponent(url);
684 File.write(target, old ? File.read(old) : '');
// moveToDone(url): writes the queue entry for `url` into donedir, copying the
// content of any existing entry found by dupeCheck (empty string when there
// is none).
// NOTE(review): removal of the old entry, if any, is on lines not shown.
690 this.moveToDone= function(url)
692 var old = this.dupeCheck(url);
693 var target = donedir +'/' + encodeURIComponent(url);
697 File.write(target, old ? File.read(old) : '');
// parseUri(str): splits a URI string into named parts using the regular
// expressions and key list stored in parseUri.options.
// NOTE(review): this looks like Steven Levithan's parseUri helper -- confirm
// the origin and licence. Several lines are missing from this listing.
707 function parseUri (str) {
708 var o = parseUri.options,
// Choose the "strict" or "loose" pattern according to o.strictMode.
709 m = o.parser[o.strictMode ? "strict" : "loose"].exec(str),
// Copy each capture group into uri under the matching key name; a missing
// group becomes "".
713 while (i--) uri[o.key[i]] = m[i] || "";
// key[12] is "query": split the query string into name/value pairs and store
// them under uri[o.q.name].
716 uri[o.key[12]].replace(o.q.parser, function ($0, $1, $2) {
717 if ($1) uri[o.q.name][$1] = $2;
// Names of the URI parts, in capture-group order.
725 key: ["source","protocol","authority","userInfo","user","password","host","port","relative","path","directory","file","query","anchor"],
// Pattern matching a single name=value pair of the query string.
728 parser: /(?:^|&)([^&=]*)=?([^&]*)/g
731 strict: /^(?:([^:\/?#]+):)?(?:\/\/((?:(([^:@]*)(?::([^:@]*))?)?@)?([^:\/?#]*)(?::(\d*))?))?((((?:[^?#\/]*\/)*)([^?#]*))(?:\?([^#]*))?(?:#(.*))?)/,
732 loose: /^(?:(?![^:@]+:[^:@\/]*@)([^:\/?#.]+):)?(?:\/\/)?((?:(([^:@]*)(?::([^:@]*))?)?@)?([^:\/?#]*)(?::(\d*))?)(((\/(?:[^?#](?![^?#\/]*\.[^?#\/.]+(?:[?#]|$)))*\/?)?([^?#\/]*))(?:\?([^#]*))?(?:#(.*))?)/