src/strip.vala
[app.mailtrimmer] / src / strip.vala
1 /**
2
3   needs to scan 2 things
4   a) our mailfort email database
5        point it at the top directory, containing YEAR/MONTH/DAY.... directories.
6        scan each file (over a year old...)
7        extract out the attachment, and replace with HTML
8        DATABASE? - mysql or sqlite? - 
9            filesize / name / date / checksum / mimetype -- into mailfort should be OK.
10   b) the imap user emails
11            loop through user's directories
12            check age of email .. over 1 years..
13            ?? how to prevent 'repeat' scanning of emails?
14               ??? hidden '.' files containing last scan date?
15
16            check if file exists in our DB.. - replace the link...
17            otherwise generate a file. + add to DB...
18            
19    c) retrieval system
20      -> URL -> get file
21    d) redirect system.
22      -> URL -> redirect to correct server
23
24
25 More notes on our Mailfort DB sync:
26 * some of these attachments are already in the database...
27  - so we need to update the DB..
28  - probably worth putting the code in a stored procedure..
29  
30  -- key scenarios
31    * first scan (and extract)
32    * rescan (as I messed up the first time - fix the DB...)
33    * email scan - attachments might not have related messages.
34  
35  
36  - {id} attachment_init(
37                 {exim_msg_id}
38                 {chksum}
39                 {filename},
40         )
41         // creates or returns id (can look for existing messages?
42         // can do a merge?? - copy 'old' record data into 'new'....  "prefer checksummed"
43         
44         attachment_update(
45                 {id}
46                 {exim_msg_id}
47                 {mailfort_msg_sig}
48                 {file_size}
49                 {created} // message date..
50                 {chksum}
51                 {filename},
52         {mime_type}
53         )
54         attachment_update_store(
55                         {id}
56                         {stored_filename}
57         )
58
59
60 */ 
61
62 // valac --pkg gmime --vapi
63 /*
64
65 // http://www.fromdual.com/mysql-vala-program-example << check mysql if this does not work.
66
67  valac  -g --vapidir=. --thread  strip.vala   --vapidir=../vapi \
68      --pkg glib-2.0 --pkg mysql --pkg gio-2.0 --pkg posix --pkg gmime-2.6 \
69       --Xcc=-lmysqlclient  -v \
70        -o /tmp/strip
71 */ 
72  
/**
 * Command line front end for the mail stripper.
 *
 * Parses the command line into the static opt_* fields, validates that the
 * mandatory options are present, connects to MySQL and then hands over to
 * {@link Strip} to scan either a single file or a whole directory tree.
 *
 * Usage and connection errors are written to stderr, because stdout is
 * reserved for the message contents printed by --dump.
 */
public class StripApplication : GLib.Application {

    public static string? opt_path = null;
    public static string? opt_file = null;
    public static string? opt_target_path = null;
    public static string? opt_db_host = "127.0.0.1";
    public static string? opt_db_name = null;
    public static string? opt_db_user = null;
    public static string? opt_db_pass = null;

    public static int opt_limit = -1;

    public static bool opt_is_extracting = false;
    public static bool opt_is_replacing = false;
    public static bool opt_scan_imap = false;
    public static bool opt_scan_mailfort = false;
    public static bool opt_dump = false;
    public static bool opt_debug = false;

    public static bool opt_debug_sql = false;
    public static string? opt_replace_link = null;

    public const GLib.OptionEntry[] options = {

        { "debug", 0, 0, OptionArg.NONE, ref opt_debug, "show debug messages for components", null },
        { "debug-sql", 0, 0, OptionArg.NONE, ref opt_debug_sql, "debug the SQL statements", null },

        { "path", 0, 0, OptionArg.STRING, ref opt_path, "Directory where email to be parsed is", null },
        { "file", 0, 0, OptionArg.STRING, ref opt_file, "A specific file to be parsed", null },

        { "target-path", 0, 0, OptionArg.STRING, ref opt_target_path, "Directory where attachments are to be put", null },

        { "link", 0, 0, OptionArg.STRING, ref opt_replace_link, "url for the replement link: eg. http://www.mysite.com/xxxx/%s", null },

        { "host", 0, 0, OptionArg.STRING, ref opt_db_host, "Mysql host (default localhost)", null },
        { "name", 0, 0, OptionArg.STRING, ref opt_db_name, "Mysql database name REQUIRED", null },
        { "user", 0, 0, OptionArg.STRING, ref opt_db_user, "Mysql database user REQUIRED", null },
        { "pass", 0, 0, OptionArg.STRING, ref opt_db_pass, "Mysql database password (default empty)", null },

        { "extract", 0, 0, OptionArg.NONE, ref opt_is_extracting, "Should attachments be extracted (default NO)", null },
        { "replace", 0, 0, OptionArg.NONE, ref opt_is_replacing, "Should attachments be replaced (default NO)", null },
        { "dump", 0, 0, OptionArg.NONE, ref opt_dump, "Print the replaced mail contents to stdout", null },

        { "limit", 0, 0, OptionArg.INT, ref opt_limit, "stop after X number of messages with attachments have been processed", null },

        { "scan-imap", 0, 0, OptionArg.NONE, ref opt_scan_imap, "scan an imap tree", null },
        { "scan-mailfort", 0, 0, OptionArg.NONE, ref opt_scan_mailfort, "scan a mailfort tree", null },
        { null }
    };

    /**
     * Parses and validates the command line.
     *
     * Exits the process with Posix.EXIT_FAILURE (after printing the problem
     * and the help text to stderr) when parsing fails or a mandatory option
     * is missing.
     *
     * @param args the raw command line arguments
     */
    public StripApplication( string[] args )
    {
        Object(
            application_id: "org.roojs.mailstripper",
            flags: ApplicationFlags.FLAGS_NONE
        );

        var opt_context = new GLib.OptionContext("Mail Stripper");

        try {
            opt_context.set_help_enabled(true);
            opt_context.add_main_entries(options, null);
            opt_context.parse(ref args);
        } catch (GLib.OptionError e) {
            stderr.printf("error: %s\n", e.message);
            stderr.printf("Run '%s --help' to see a full list of available command line options.\n%s",
                args[0], opt_context.get_help(true, null));
            GLib.Process.exit(Posix.EXIT_FAILURE);
        }

        // exactly one of the two tree types has to be selected
        if (opt_scan_mailfort == opt_scan_imap) {
            usage_error(opt_context, "You must specify the type of directory tree to scan - either imap or mailfort");
        }
        if (is_blank(opt_db_name) || is_blank(opt_db_user)) {
            usage_error(opt_context, "You must specify the database name / user ");
        }
        if (is_blank(opt_path)) {
            usage_error(opt_context, "You must specify the scan start path");
        }
        if (is_blank(opt_replace_link)) {
            usage_error(opt_context, "You must specify the link to use in the replacement ");
        }
        if ((opt_is_replacing || opt_is_extracting) && is_blank(opt_target_path)) {
            usage_error(opt_context, "You must specify a target path to put attachments");
        }
    }

    /** Returns true when an option value is unset or empty. */
    private static bool is_blank(string? value)
    {
        return value == null || value.length < 1;
    }

    /** Prints a usage problem followed by the help text to stderr and exits with failure. */
    private static void usage_error(GLib.OptionContext opt_context, string message)
    {
        stderr.printf("%s\n%s", message, opt_context.get_help(true, null));
        GLib.Process.exit(Posix.EXIT_FAILURE);
    }

    /**
     * Program entry point.
     *
     * @param args the raw command line arguments
     * @return 0 after a scan, 1 when the MySQL connection could not be opened
     */
    public static int main(string[] args)
    {
        // constructing the application parses and validates the options
        var application = new StripApplication(args);

        GLib.Log.set_always_fatal(LogLevelFlags.LEVEL_ERROR | LogLevelFlags.LEVEL_CRITICAL);

        if (opt_debug || opt_debug_sql) {
            GLib.Log.set_handler(null,
                GLib.LogLevelFlags.LEVEL_DEBUG | GLib.LogLevelFlags.LEVEL_WARNING | GLib.LogLevelFlags.LEVEL_INFO,
                (dom, lvl, msg) => {
                    print("%s\n", msg);
                }
            );
        }

        GMime.init(0);

        // replacing an attachment only makes sense if it is also extracted
        if (StripApplication.opt_is_replacing) {
            StripApplication.opt_is_extracting = true;
        }

        GLib.debug("scanning folder: %s", opt_path);

        var strip = new Strip(opt_path);

        strip.mysql = new Mysql.Database();
        var connected = strip.mysql.real_connect(
            opt_db_host,
            opt_db_user,
            opt_db_pass == null ? "" : opt_db_pass, // passwd
            opt_db_name, // DB
            3306, // port is not configurable
            null
        );
        if (!connected) {
            stderr.printf("ERROR %u: Connection failed: %s\n",
                strip.mysql.errno(), strip.mysql.error()
            );
            return 1;
        }

        if (opt_file != null) {
            // single file mode: --path still acts as the base of the tree
            strip.scan_file(GLib.Path.get_dirname(opt_file), GLib.Path.get_basename(opt_file));
            return 0;
        }

        strip.scan_dir(opt_path);

        return 0;
    }
}
233
/**
 * Scans mail files, extracts their attachments to a target directory,
 * records them in MySQL and replaces each attachment in the message with a
 * small HTML part that links to the stored file.
 *
 * The object keeps per-message state in the active_* / created_* fields, so
 * a single instance must only process one message at a time.
 */
public class Strip : GLib.Object {

    /** Top of the tree being scanned; used to derive the per-message sub directory. */
    public string base_dir = "";

    /** Open MySQL connection; must be connected before any scan_* call. */
    public Mysql.Database mysql;

    // number of messages in which at least one attachment was replaced
    int processed = 0;

    // running totals used by report_state()
    uint64 used_space_before = 0;
    uint64 used_space_after = 0;

    // state of the message currently being processed
    string active_path = "";
    string active_name = "";
    string active_message_id = "";
    string active_message_x_mailfort_sig = "";
    string active_message_exim_id = "";
    bool has_replaced = false;
    string created_date = ""; // should be YYYY-mm-dd
    string created_dir = ""; // should be YYYY/mm/dd

    /**
     * @param base_dir top directory of the tree that will be scanned
     */
    public Strip(string base_dir)
    {
        this.base_dir = base_dir;
    }

    /**
     * Walks one node of a MIME tree and replaces every strippable attachment.
     *
     * @param parent the object that contains mime_obj; an attachment is only
     *               replaced when this is a GMime.Multipart
     * @param mime_obj the node to process
     */
    public void handle_part(GMime.Object parent, GMime.Object mime_obj)
    {
        if (mime_obj is GMime.Part) {
            var part = (GMime.Part) mime_obj;

            // parts we generated earlier carry X-strip-id: only resync the DB
            var sid = part.get_header("X-strip-id");
            if (sid != null && sid.length > 0) {
                this.update_attachment_db(part);
                GLib.debug("Skip attachment replace - it's already been done");
                return;
            }

            if (!this.is_strippable(part)) {
                return;
            }
            if (parent is GMime.Multipart) {
                this.replace_attachment((GMime.Multipart) parent, part);
            }
            return;
        }

        if (mime_obj is GMime.Multipart) {
            var multipart = (GMime.Multipart) mime_obj;
            // replace_attachment() swaps parts in place, so the count is stable
            for (var i = 0; i < multipart.get_count(); i++) {
                this.handle_part(mime_obj, multipart.get_part(i));
            }
            return;
        }

        if (mime_obj is GMime.MessagePart) {
            // embedded message: walk it through the Message branch below so
            // every child is visited once and with its real parent
            var embedded = ((GMime.MessagePart) mime_obj).get_message();
            if (embedded != null) {
                this.handle_part(mime_obj, embedded);
            }
            return;
        }

        if (mime_obj is GMime.Message) {
            var top = ((GMime.Message) mime_obj).get_mime_part();
            if (!(top is GMime.Multipart)) {
                GLib.debug("get mimepart does not return a Multipart?");
                return;
            }
            var multipart = (GMime.Multipart) top;
            var count = multipart.get_count();
            for (var i = 0; i < count; i++) {
                this.handle_part(top, multipart.get_part(i));
            }
            return;
        }

        GLib.debug("got something else");
    }

    /**
     * Decides whether a part should be extracted: it must be declared as an
     * attachment, have a filename, and be neither text nor PGP material.
     * Type and disposition are compared case-insensitively.
     */
    private bool is_strippable(GMime.Part part)
    {
        var cd = part.get_content_disposition();
        if (cd == null) {
            return false;
        }
        var disposition = cd.get_disposition();
        if (disposition == null || disposition.down() != "attachment") {
            return false;
        }

        var ct = part.get_content_type();
        if (ct == null) {
            return false;
        }
        var media_type = ct.get_media_type();
        if (media_type != null && media_type.down() == "text") {
            return false;
        }
        var full_type = ct.to_string().down();
        if (full_type == "application/pgp-encrypted" || full_type == "application/pgp-keys") {
            return false;
        }

        return part.get_filename() != null;
    }

    /**
     * Re-synchronises the database row of an attachment that was already
     * replaced in an earlier run (the part carries an X-strip-id header).
     *
     * @param attachment the replacement part written by replace_attachment()
     */
    public void update_attachment_db(GMime.Part attachment)
    {
        // only called when we have an sid...
        var sid = attachment.get_header("X-strip-id");
        if (sid == null || sid.length < 1) {
            GLib.debug("Strange - update attachment db called ?");
            return;
        }
        var id = int.parse(sid);

        // initialize it with known data.. that should wipe out dupes.
        this.query_discard("""
            SELECT
                attachment_init(
                    msgid,
                    checksum,
                    mime_filename,
                    filesize
                ) as id
            FROM
                attachment
            WHERE
                id = %d
        """.printf(id));

        // NOTE(review): this call passes five arguments while
        // replace_attachment() passes four - confirm which one matches the
        // stored function's definition.
        this.query_discard("""
            SELECT attachment_update(
                %d, -- in_id INT(11),
                '%s', -- in_mime_type varchar(255),
                %d, -- in_mime_size int(11),
                '%s', -- in_created DATETIME,
                '%s' -- in_mailfort_sig varchar(64)
            )
        """.printf(
            id,
            "", // this will be ignored..
            0, // this will be ignored..
            this.mysql_escape(this.created_date),
            this.mysql_escape(this.active_message_x_mailfort_sig)
        ));
    }

    /**
     * Extracts one attachment, registers it in the database, stores it under
     * the target path (when extracting) and swaps the part in the message for
     * an HTML part that links to it.
     *
     * Nothing in the message is changed unless the attachment was written,
     * checksummed, registered and (when extracting) stored successfully.
     *
     * @param parent the multipart that contains the attachment
     * @param attachment the part to replace
     */
    public void replace_attachment(GMime.Multipart parent, GMime.Part attachment)
    {
        var sid = attachment.get_header("X-strip-id");
        if (sid != null && sid.length > 0) {
            GLib.debug("Skip attachment replace - it's already been done");
            return;
        }

        var content = attachment.get_content_object();
        var raw_filename = attachment.get_filename();
        if (content == null || raw_filename == null) {
            GLib.debug("ERROR - attachment has no content or no filename");
            return;
        }

        // '/' would escape into another directory
        var filename = raw_filename.replace("/", "-");
        var fn = GLib.Environment.get_tmp_dir() + "/" + this.active_name + "." + filename;

        var outfile = new GMime.StreamFile.for_path(fn, "w");
        if (outfile == null) {
            GLib.debug("ERROR - could not create temporary file %s", fn);
            return;
        }
        outfile.set_owner(true);
        var file_size = (int) content.write_to_stream(outfile);
        // the data has to be on disk before it is checksummed
        outfile.flush();
        outfile = null;

        if (file_size <= 0) {
            GLib.debug("ERROR - file size of write to stream returned 0?");
            Posix.unlink(fn);
            return;
        }

        var chksum = this.md5_file(fn);
        if (chksum.length < 1) {
            Posix.unlink(fn);
            return;
        }

        var mime_type = attachment.get_content_type().to_string();

        // filesize / name / date / checksum / mimetype -- into mailfort
        var file_id = this.query_scalar("""
            SELECT
                attachment_init(
                    '%s', -- in_msgid VARCHAR(32),
                    '%s', -- in_checksum VARCHAR(64),
                    '%s', -- in_mime_filename varchar(255)
                    %d -- filesize
                ) as id
        """.printf(
            this.mysql_escape(this.active_message_exim_id),
            chksum,
            this.mysql_escape(raw_filename),
            file_size
        ));

        if (file_id == null) {
            GLib.debug("ERROR - CALL to attachment_init failed");
            Posix.unlink(fn);
            return;
        }
        if (int.parse(file_id) < 1) {
            GLib.debug("ERROR - CALL to attachment_init failed - returned 0?");
            Posix.unlink(fn);
            return;
        }

        GLib.debug("fn = %s, m5=%s, id= %s", filename, chksum, this.active_message_id);

        this.query_discard("""
            SELECT attachment_update(
                %d, -- in_id INT(11),
                '%s', -- in_mime_type varchar(255),
                '%s', -- in_created DATETIME,
                '%s' -- in_mailfort_sig varchar(64)
            ) as result
        """.printf(
            int.parse(file_id),
            this.mysql_escape(mime_type),
            this.mysql_escape(this.created_date),
            this.mysql_escape(this.active_message_x_mailfort_sig)
        ));

        var stored = "/" + this.created_dir + "/" + file_id + "-" + filename;

        if (StripApplication.opt_is_extracting) {
            // never touch the message unless the attachment is safely stored
            if (!this.store_attachment(fn, StripApplication.opt_target_path + stored)) {
                Posix.unlink(fn);
                return;
            }
        } else {
            GLib.debug("Skipping extraction %s", stored);
        }

        this.query_discard("""
            SELECT attachment_update_store(
                %d, -- in_id INT(11),
                '%s'  -- in_store_filename varchar(255),
            ) as result
        """.replace("'%s'  -- in_store_filename varchar(255),", "'%s'  -- in_store_filename varchar(255)").printf(
            int.parse(file_id),
            this.mysql_escape(stored)
        ));

        // the extracted attachment is counted as space that is still in use
        this.used_space_after += file_size;

        // we have to set up a redirect server - to redirect hpasite... to their internal service..
        var href = StripApplication.opt_replace_link + "/" +
            file_id + "/" + this.created_dir + "/" + chksum + "/" + GLib.Uri.escape_string(filename);
        string txt = "<html><body>" +
            "<a href=\"" + GLib.Markup.escape_text(href) + "\">" +
            GLib.Markup.escape_text(filename) +
            "</a>" +
            "</body></html>";

        var rep = new GMime.Part.with_type("text", "html");
        rep.set_filename(filename);
        rep.get_content_type().set_parameter("charset", "utf-8");
        rep.set_header("X-strip-id", file_id);
        rep.set_header("X-strip-content-name", filename);
        rep.set_header("X-strip-path", this.created_dir + "/" + file_id + "-" + filename);
        rep.set_header("X-strip-content-type", mime_type);

        var stream = new GMime.StreamMem.with_buffer(txt.data);
        var con = new GMime.DataWrapper.with_stream(stream, GMime.ContentEncoding.DEFAULT);
        rep.set_content_object(con);

        GLib.debug("Replacing Attachment with HTML");
        parent.replace(parent.index_of(attachment), rep);
        this.has_replaced = true;

        Posix.unlink(fn);
    }

    /**
     * Puts the extracted attachment at its final location.
     *
     * Tries a hard link first and falls back to a copy, because hard links
     * cannot cross filesystems. An already existing target is left untouched
     * and counts as success.
     *
     * @param tmp_fn the temporary file holding the decoded attachment
     * @param target_fn the final location below the target path
     * @return true when target_fn exists afterwards
     */
    private bool store_attachment(string tmp_fn, string target_fn)
    {
        var dir = GLib.Path.get_dirname(target_fn);
        if (!FileUtils.test(dir, FileTest.IS_DIR)) {
            if (GLib.DirUtils.create_with_parents(dir, 0755) != 0) {
                GLib.debug("ERROR - could not create directory %s", dir);
                return false;
            }
        }

        if (FileUtils.test(target_fn, FileTest.EXISTS)) {
            return true;
        }

        GLib.debug("Creating file %s", target_fn);
        if (Posix.link(tmp_fn, target_fn) == 0) {
            return true;
        }

        try {
            File.new_for_path(tmp_fn).copy(File.new_for_path(target_fn), FileCopyFlags.NONE, null, null);
        } catch (Error e) {
            GLib.debug("ERROR - could not store %s: %s", target_fn, e.message);
            return false;
        }
        return true;
    }

    /**
     * Sends a statement to MySQL. The caller is responsible for retrieving
     * any result set before issuing the next statement.
     *
     * @param str the SQL text
     * @return 0 on success, non-zero on failure (the error is logged)
     */
    public int query(string str)
    {
        if (StripApplication.opt_debug_sql) {
            GLib.debug("SQL: %s\n", str);
        }

        var rc = this.mysql.query(str);
        if (rc != 0) {
            GLib.debug("ERROR %u: Query failed: %s\n", this.mysql.errno(), this.mysql.error());
        }
        return rc;
    }

    /**
     * Runs a statement whose result is not needed and retrieves (then frees)
     * the result set, so the connection is ready for the next statement.
     */
    private int query_discard(string sql)
    {
        var rc = this.query(sql);
        if (rc == 0) {
            // buffering the rows client side completes the statement; the
            // result is freed when it goes out of scope
            var unused = this.mysql.store_result();
            unused = null;
        }
        return rc;
    }

    /**
     * Runs a statement and returns the first column of its first row.
     *
     * @return the value, or null when the statement failed, returned no row
     *         or returned SQL NULL
     */
    private string? query_scalar(string sql)
    {
        if (this.query(sql) != 0) {
            return null;
        }
        var rs = this.mysql.store_result();
        if (rs == null) {
            return null;
        }
        var row = rs.fetch_row();
        if (row == null || row[0] == null) {
            return null;
        }
        return row[0];
    }

    /**
     * Escapes a string for use inside a quoted SQL literal on this connection.
     *
     * @param str the raw value; must not be null
     * @return the escaped value
     */
    public string mysql_escape(string str)
    {
        // worst case every byte is escaped, plus the terminating NUL
        var escaped = new uint8[str.length * 2 + 1];
        this.mysql.real_escape_string((string) escaped, str, str.length);
        return (string) escaped;
    }

    /**
     * Computes the MD5 checksum of a file.
     *
     * @param fn path of the file
     * @return the hex digest, or "" when the file could not be opened
     */
    public string md5_file(string fn)
    {
        var stream = FileStream.open(fn, "rb");
        if (stream == null) {
            GLib.debug("ERROR - could not open %s for checksumming", fn);
            return "";
        }

        var checksum = new Checksum(ChecksumType.MD5);
        uint8 fbuf[4096];
        size_t size;
        while ((size = stream.read(fbuf)) > 0) {
            checksum.update(fbuf, size);
        }

        return checksum.get_string();
    }

    /**
     * Returns the directory of a message relative to base_dir, without a
     * leading '/'. Paths outside base_dir are returned whole (minus the
     * leading '/').
     */
    private string relative_dir(string path)
    {
        var rel = path;
        if (this.base_dir.length > 0 && path.has_prefix(this.base_dir)) {
            rel = path.substring(this.base_dir.length);
        }
        while (rel.has_prefix("/")) {
            rel = rel.substring(1);
        }
        return rel;
    }

    /**
     * Pulls the token that follows "id" out of a Received header.
     * The header is split on tabs and each piece on spaces; the last
     * "id <value>" pair wins.
     *
     * @return the id, or "" when none is present
     */
    private string extract_exim_id(string? received)
    {
        var exim_id = "";
        if (received == null || received.length <= 1) {
            return exim_id;
        }

        GLib.debug("RECV: %s", received);
        foreach (var line in received.split("\t")) {
            var bits = line.strip().split(" ");
            if (bits.length > 1 && bits[0] == "id") {
                exim_id = bits[1];
            }
        }
        return exim_id;
    }

    /**
     * Processes one message file: strips its attachments and, with --replace,
     * rewrites the file in place; with --dump the result is printed to stdout.
     *
     * Terminates the process once --limit rewritten messages are reached.
     *
     * @param path directory that contains the file
     * @param name file name inside path
     */
    public void scan_file(string path, string name)
    {
        GLib.debug("Scan: %s/%s", path, name);

        var full_path = path + "/" + name;

        this.has_replaced = false;
        this.active_path = path;
        this.active_name = name;
        this.active_message_id = "";
        this.active_message_x_mailfort_sig = "";
        this.active_message_exim_id = "";

        // NOTE(review): created_date is only a valid date when the tree is
        // laid out as YYYY/MM/DD below base_dir - confirm for imap trees.
        this.created_dir = this.relative_dir(path);
        this.created_date = this.created_dir.replace("/", "-");

        int original_size;
        try {
            original_size = (int) File.new_for_path(full_path)
                .query_info(GLib.FileAttribute.STANDARD_SIZE, GLib.FileQueryInfoFlags.NONE, null)
                .get_size();
        } catch (Error e) {
            GLib.debug("Could not read file info? %s: %s", full_path, e.message);
            return;
        }

        this.used_space_before += original_size;

        var stream = new GMime.StreamFs.for_path(full_path, Posix.O_RDONLY, 0);
        var parser = new GMime.Parser.with_stream(stream);
        var message = parser.construct_message();

        if (message == null) {
            GLib.debug("Could not parse file? %s/%s", path, name);
            this.used_space_after += original_size;
            return;
        }

        // missing headers come back as null; keep the fields usable as strings
        this.active_message_id = message.get_message_id() ?? "";
        this.active_message_x_mailfort_sig = message.get_header("x-mailfort-sig") ?? "";
        this.active_message_exim_id = this.extract_exim_id(message.get_header("received"));

        GLib.debug("Message DATA:\n mid: %s\nmailfort: %s \nexim_id: %s",
            this.active_message_id,
            this.active_message_x_mailfort_sig,
            this.active_message_exim_id
        );

        var top = message.get_mime_part();
        if (!(top is GMime.Multipart)) {
            GLib.debug("get mimepart does not return a Multipart?");
            this.used_space_after += original_size;
            return;
        }

        var multipart = (GMime.Multipart) top;
        var count = multipart.get_count();
        for (var i = 0; i < count; i++) {
            this.handle_part(top, multipart.get_part(i));
        }

        parser = null;
        stream = null;

        if (!this.has_replaced) {
            this.used_space_after += original_size;
            GLib.debug("skpping write file - no replacement occured");
            return;
        }

        int new_size;
        string tmpfile = "";

        if (StripApplication.opt_is_replacing) {
            tmpfile = GLib.Environment.get_tmp_dir() + "/" + name;
            var file_stream = new GMime.StreamFile.for_path(tmpfile, "w");
            if (file_stream == null) {
                GLib.debug("ERROR - could not create temporary file %s", tmpfile);
                this.used_space_after += original_size;
                return;
            }
            file_stream.set_owner(true);
            new_size = (int) message.write_to_stream(file_stream);
            // NOTE(review): ownership is dropped before close() as in the
            // original code - presumably to avoid closing the file twice; confirm.
            file_stream.set_owner(false);
            file_stream.flush();
            file_stream.close();
        } else {
            var null_stream = new GMime.StreamNull();
            new_size = (int) message.write_to_stream(null_stream);
        }

        if (StripApplication.opt_dump) {
            // dump from its own buffer so --dump and --replace can be combined
            var mem = new GMime.StreamMem();
            message.write_to_stream(mem);
            // the byte array is not NUL terminated: write it by length
            stdout.write(mem.get_byte_array().data);
            stdout.putc('\n');
        }

        message = null;
        GLib.debug("finished writing output %d", new_size);

        if (StripApplication.opt_is_replacing) {
            if (new_size <= 0) {
                GLib.debug("ERROR - writing %s failed, keeping original message", tmpfile);
                Posix.unlink(tmpfile);
                this.used_space_after += original_size;
                return;
            }

            GLib.debug("copy tmp file %s to %s", tmpfile, full_path);
            try {
                // replaces the original without ever deleting it first and
                // also works when the tmp dir is on another filesystem
                File.new_for_path(tmpfile).move(
                    File.new_for_path(full_path), FileCopyFlags.OVERWRITE, null, null);
            } catch (Error e) {
                GLib.debug("ERROR - could not replace %s: %s", full_path, e.message);
                Posix.unlink(tmpfile);
                this.used_space_after += original_size;
                return;
            }
        }

        this.used_space_after += new_size;
        this.processed++;

        if (StripApplication.opt_limit > -1 && this.processed >= StripApplication.opt_limit) {
            GLib.debug("Reached replacement limit");
            Posix.exit(1);
        }
    }

    /**
     * Recursively scans a directory: regular files are handed to scan_file(),
     * sub directories are descended into.
     *
     * Skipped: symbolic links, non-regular files, files whose name starts
     * with ',', directories whose name starts with '.', and directories
     * named "attachments".
     *
     * @param path directory to scan
     */
    public void scan_dir(string path)
    {
        var dir = File.new_for_path(path);
        var cancellable = new Cancellable();
        FileEnumerator file_enum;

        try {
            file_enum = dir.enumerate_children(
                FileAttribute.STANDARD_NAME + "," +
                FileAttribute.STANDARD_DISPLAY_NAME + "," +
                FileAttribute.STANDARD_TYPE + "," +
                FileAttribute.STANDARD_IS_SYMLINK,
                FileQueryInfoFlags.NOFOLLOW_SYMLINKS,
                cancellable
            );
        } catch (Error e) {
            GLib.debug("Got error scanning dir? %s", e.message);
            return;
        }

        while (!cancellable.is_cancelled()) {
            FileInfo? info;
            try {
                info = file_enum.next_file(cancellable);
            } catch (Error e) {
                GLib.debug("error getting next file? %s", e.message);
                break;
            }
            if (info == null) {
                break;
            }

            // the real on-disk name; the display name may differ from it
            var name = info.get_name();
            var type = info.get_file_type();

            if (info.get_is_symlink() || type == FileType.SYMBOLIC_LINK) {
                continue;
            }

            if (type == FileType.DIRECTORY) {
                if (name[0] == '.' || name == "attachments") {
                    continue;
                }
                this.scan_dir(path + "/" + name);
                continue;
            }

            if (type != FileType.REGULAR) {
                continue;
            }

            // NOTE(review): files are skipped on ',' while directories are
            // skipped on '.' - confirm ',' is intended.
            if (name[0] == ',') {
                continue;
            }

            this.scan_file(path, name);
            this.report_state("After scanning %s/%s".printf(path, name));
        }
    }

    /**
     * Logs the running space totals together with a caller supplied message.
     *
     * @param msg text appended to the log line
     */
    void report_state(string msg)
    {
        // Saved: 2G  Original 10G : 20%
        uint64 saved = 0;
        if (this.used_space_before > this.used_space_after) {
            saved = this.used_space_before - this.used_space_after;
        }
        double percent = 0.0;
        if (this.used_space_before > 0) {
            percent = 100.0 * ((double) saved / (double) this.used_space_before);
        }

        GLib.debug("Saved : %s (%.1f%%) | Original %s | %s",
            GLib.format_size(saved),
            percent,
            GLib.format_size(this.used_space_before),
            msg
        );
    }

}