- void buildSymbolTree()
- {
- //println("<PRE>");
-
- this.ts.rewind();
- this.braceNesting = 0;
-
- // print(JSON.stringify(this.ts.tokens, null,4));
-
-
- this.globalScope = new Scope(-1, false, -1, '');
- this.indexedScopes = { 0 : this.globalScope };
-
- this.mode = 'BUILDING_SYMBOL_TREE';
- this.parseScope(this.globalScope);
-
- //print("---------------END PASS 1 ---------------- ");
-
- },
- mungeSymboltree : function()
- {
-
- if (!this.munge) {
- return;
- }
-
- // One problem with obfuscation resides in the use of undeclared
- // and un-namespaced global symbols that are 3 characters or less
- // in length. Here is an example:
- //
- // var declaredGlobalVar;
- //
- // function declaredGlobalFn() {
- // var localvar;
- // localvar = abc; // abc is an undeclared global symbol
- // }
- //
- // In the example above, there is a slim chance that localvar may be
- // munged to 'abc', conflicting with the undeclared global symbol
- // abc, creating a potential bug. The following code detects such
- // global symbols. This must be done AFTER the entire file has been
- // parsed, and BEFORE munging the symbol tree. Note that declaring
- // extra symbols in the global scope won't hurt.
- //
- // Note: Since we go through all the tokens to do this, we also use
- // the opportunity to count how many times each identifier is used.
-
- this.ts.rewind();
- this.braceNesting = 0;
- this.mode = 'PASS2_SYMBOL_TREE';
-
- //println("MUNGING?");
-
- this.parseScope(this.globalScope);
-
- //this.globalScope.dump();
-
-
- this.globalScope.munge();
- },
-
-
- log : function(str)
- {
- print (" ".substring(0, this.braceNesting*2) + str);
-
- //println("<B>LOG:</B>" + htmlescape(str) + "<BR/>\n");
- },
- logR : function(str)
- {
- //println("<B>LOG:</B>" + str + "<BR/>");
- },
-
-
-
-
-
- parseScope : function(scope) // parse a token stream..
- {
- //this.timerPrint("parseScope EnterScope");
- //this.log(">>> ENTER SCOPE" + this.scopes.length);
- var symbol;
- var token;
-
- var identifier;
-
- var expressionBraceNesting = this.braceNesting + 0;
-
- var parensNesting = 0;
-
- var isObjectLitAr = [ false ];
- var isInObjectLitAr;
-
-
- //var scopeIndent = '';
- //this.scopes.forEach(function() {
- // scopeIndent += ' ';
- //});
- //print(">> ENTER SCOPE");
-
-
-
-
- token = this.ts.lookTok(1);
- while (token) {
- // this.timerPrint("parseScope AFTER lookT: " + token.toString());
- //this.dumpToken(token , this.scopes, this.braceNesting);
- //print('SCOPE:' + token.toString());
- //this.log(token.data);
- //if (token.type == 'NAME') {
- // print('*' + token.data);
- //}
- switch(token.type + '.' + token.name) {
- case "KEYW.VAR":
- case "KEYW.CONST": // not really relivant as it's only mozzy that does this.
- //print('SCOPE-VAR:' + token.toString());
- var vstart = this.ts.cursor +1;
-
- //this.log("parseScope GOT VAR/CONST : " + token.toString());
- while (true) {
- token = this.ts.nextTok();
- //!this.debug|| print( token.toString());
- // print('SCOPE-VAR-VAL:' + JSON.stringify(token, null, 4));
- if (!token) { // can return false at EOF!
- break;
- }
- if (token.name == "VAR" || token.data == ',') { // kludge..
- continue;
- }
- //this.logR("parseScope GOT VAR : <B>" + token.toString() + "</B>");
- if (token.type != "NAME") {
- for(var i = Math.max(this.ts.cursor-10,0); i < this.ts.cursor+1; i++) {
- print(this.ts.tokens[i].toString());
- }
-
- print( "var without ident");
- Seed.quit()
- }
-
-
- if (this.mode == "BUILDING_SYMBOL_TREE") {
- identifier = scope.getIdentifier(token.data,token) ;
-
- if (identifier == false) {
- scope.declareIdentifier(token.data, token);
- } else {
- token.identifier = identifier;
- this.warn("(SCOPE) The variable " + token.data + ' (line:' + token.line + ") has already been declared in the same scope...");
- }
- }
-
- token = this.ts.nextTok();
- !this.debug|| print(token.toString());
- /*
- assert token.getType() == Token.SEMI ||
- token.getType() == Token.ASSIGN ||
- token.getType() == Token.COMMA ||
- token.getType() == Token.IN;
- */
- if (token.name == "IN") {
- break;
- } else {
- //var bn = this.braceNesting;
- var bn = this.braceNesting;
- var nts = [];
- while (true) {
- if (!token || token.type == 'VOID' || token.data == ',') {
- break;
- }
- nts.push(token);
- token = this.ts.nextTok();
- }
- if (nts.length) {
- var TS = this.ts;
- this.ts = new TokenStream(nts);
- this.parseExpression(scope);
- this.ts = TS;
- }
-
- this.braceNesting = bn;
- //this.braceNesting = bn;
- //this.logR("parseScope DONE : <B>ParseExpression</B> - tok is:" + this.ts.lookT(0).toString());
-
- token = this.ts.lookTok(1);
- //!this.debug||
- // print("AFTER EXP: " + token.toString());
- if (token.data == ';') {
- break;
- }
- }
- }
-
- //print("VAR:")
- //this.ts.dump(vstart , this.ts.cursor);
-
- break;
-
-
- case "KEYW.FUNCTION":
- //if (this.mode == 'BUILDING_SYMBOL_TREE')
- // print('SCOPE-FUNC:' + JSON.stringify(token,null,4));
- //println("<i>"+token.data+"</i>");
- var bn = this.braceNesting;
- this.parseFunctionDeclaration(scope);
- this.braceNesting = bn;
- break;
-
- case "PUNC.LEFT_CURLY": // {
- case "PUNC.LEFT_PAREN": // (
- case "PUNC.LEFT_BRACE": // [
- //print('SCOPE-CURLY/PAREN:' + token.toString());
- //println("<i>"+token.data+"</i>");
- var curTS = this.ts;
- if (token.props) {
-
- // { a : ... , c : .... }
-
- for (var prop in token.props) {
-
-
- // print('SCOPE-PROPS:' + JSON.stringify(token.props[prop],null,4));
- if (token.props[prop].val[0].data == 'function') {
- // parse a function..
- this.ts = new TokenStream(token.props[prop].val);
- this.ts.nextTok();
- this.parseFunctionDeclaration(scope);
-
- continue;
- }
- // key value..
-
- this.ts = new TokenStream(token.props[prop].val);
- this.parseExpression(scope);
-
- }
- this.ts = curTS;
-
- // it's an object literal..
- // the values could be replaced..
- break;
- }
-
- // ( ... ) or { .... } not object literals..
-
- var _this = this;
- for (var xx =0; xx < token.items.length; xx++) {
- expr = token.items[xx];
- //token.items.forEach(function(expr) {
- //print(expr.toString());
- _this.ts = new TokenStream(expr);
- //if (curTS.data == '(') {
- _this.parseScope(scope)
- //} else {
- // _this.parseExpression(scope)
- //}
-
- }
- this.ts = curTS;
- //print("NOT PROPS"); Seed.quit();
-
- //isObjectLitAr.push(false);
- //this.braceNesting++;
-
- //print(">>>>>> OBJLIT PUSH(false)" + this.braceNesting);
- break;
-
- case "PUNC.RIGHT_CURLY": // }
- //print("<< EXIT SCOPE");
- return;
-
- case "KEYW.WITH":
- //print('SCOPE-WITH:' + token.toString());
- //println("<i>"+token.data+"</i>");
- if (this.mode == "BUILDING_SYMBOL_TREE") {
- // Inside a 'with' block, it is impossible to figure out
- // statically whether a symbol is a local variable or an
- // object member. As a consequence, the only thing we can
- // do is turn the obfuscation off for the highest scope
- // containing the 'with' block.
- this.protectScopeFromObfuscation(scope);
- this.warn("Using 'with' is not recommended." + (this.munge ? " Moreover, using 'with' reduces the level of compression!" : ""), true);
- }
- break;
-
- case "KEYW.CATCH":
- //print('SCOPE-CATCH:' + token.toString());
- //println("<i>"+token.data+"</i>");
- this.parseCatch(scope);
- break;
-
- case "STRN.DOUBLE_QUOTE": // used for object lit detection..
- case "STRN.SINGLE_QUOTE":
- // print('SCOPE-STRING:' + token.toString());
- //println("<i>"+token.data+"</i>");
-
- if (this.ts.lookTok(-1).data == '{' && this.ts.lookTok(1).data == ':') {
- // then we are in an object lit.. -> we need to flag the brace as such...
- isObjectLitAr.pop();
- isObjectLitAr.push(true);
- //print(">>>>>> OBJLIT REPUSH(true)");
- }
- isInObjectLitAr = isObjectLitAr[isObjectLitAr.length-1];
-
- if (isInObjectLitAr && this.ts.lookTok(1).data == ':' &&
- ( this.ts.lookTok(-1).data == '{' || this.ts.lookTok(-1).data == ':' )) {
- // see if we can replace..
- // remove the quotes..
- // should do a bit more checking!!!! (what about wierd char's in the string..
- var str = token.data.substring(1,token.data.length-1);
- if (/^[a-z_]+$/i.test(str) && ScopeParser.idents.indexOf(str) < 0) {
- token.outData = str;
- }
-
-
-
- }
-
- break;
-
- case "NAME.NAME":
- //print('SCOPE-NAME:' + token.toString());
- //print("DEAL WITH NAME:");
- // got identifier..
- // look for { ** : <- indicates obj literal.. ** this could occur with numbers ..
- // skip anyting with "." before it..!!
-
- if (this.ts.lookTok(-1).data == ".") {
- // skip, it's an object prop.
- //println("<i>"+token.data+"</i>");
- break;
- }
- //print("SYMBOL: " + token.toString());
-
- symbol = token.data;
- if (symbol == 'this') {
- break;
- }
- if (this.mode == 'PASS2_SYMBOL_TREE') {
-
- //println("GOT IDENT: -2 : " + this.ts.lookT(-2).toString() + " <BR> ..... -1 : " + this.ts.lookT(-1).toString() + " <BR> ");
-
- //print ("MUNGE?" + symbol);
-
- //println("GOT IDENT: <B>" + symbol + "</B><BR/>");
-
- //println("GOT IDENT (2): <B>" + symbol + "</B><BR/>");
- identifier = this.getIdentifier(symbol, scope, token);
-
- if (identifier == false) {
+ /**
+  * Pass 1: rewinds the token stream, creates a fresh global scope
+  * (registered under index 0 in indexedScopes) and walks the stream with
+  * parseScope() in BUILDING_SYMBOL_TREE mode.
+  */
+ void buildSymbolTree()
+ {
+     this.ts.rewind();
+     this.braceNesting = 0;
+
+     // Vala string literals use double quotes; the '' left over from the
+     // JavaScript version is an empty character literal and does not compile.
+     // NOTE(review): the second argument is still the JS-era `false` -
+     // confirm it matches what Scope's constructor expects.
+     this.globalScope = new Scope(-1, false, -1, "");
+     this.indexedScopes = new Gee.HashMap<int,Scope>();
+     this.indexedScopes.set(0, this.globalScope);
+
+     this.mode = ScopeParserMode.BUILDING_SYMBOL_TREE;
+
+     this.parseScope(this.globalScope);
+ }
+
+ /**
+  * Pass 2: walks the token stream again in PASS2_SYMBOL_TREE mode and then
+  * munges the global scope. Does nothing when this.munge is false.
+  *
+  * Why a second walk is needed: obfuscation can clash with undeclared,
+  * un-namespaced global symbols of 3 characters or less. Example:
+  *
+  *     var declaredGlobalVar;
+  *
+  *     function declaredGlobalFn() {
+  *         var localvar;
+  *         localvar = abc; // abc is an undeclared global symbol
+  *     }
+  *
+  * There is a slim chance that localvar gets munged to 'abc', colliding
+  * with the undeclared global abc and creating a potential bug. Such
+  * globals have to be detected AFTER the whole file has been parsed and
+  * BEFORE the symbol tree is munged; declaring extra symbols in the global
+  * scope does no harm.
+  *
+  * Since every token is visited anyway, the walk is also used to count how
+  * many times each identifier is used.
+  */
+ void mungeSymboltree()
+ {
+     if (this.munge) {
+         // Restart from the first token with brace tracking reset.
+         this.ts.rewind();
+         this.braceNesting = 0;
+         this.mode = ScopeParserMode.PASS2_SYMBOL_TREE;
+
+         this.parseScope(this.globalScope);
+
+         this.globalScope.munge();
+     }
+ }
+
+
+ /**
+  * Prints a diagnostic message on its own line.
+  *
+  * @param str message text, printed verbatim
+  */
+ void log(string str)
+ {
+     // print() takes a printf-style format string, so the message is passed
+     // as an argument: a '%' inside str must not be read as a conversion.
+     // The trailing newline keeps one message per line.
+     print("%s\n", str);
+ }
+ /**
+  * Logging hook that currently does nothing; the HTML-formatted output it
+  * used to emit is disabled.
+  *
+  * @param str message text (ignored)
+  */
+ void logR(string str)
+ {
+     // intentionally empty
+ }
+
+
+
+
+
+ void parseScope(Scope scope) // parse a token stream..
+ {
+ //this.timerPrint("parseScope EnterScope");
+ //this.log(">>> ENTER SCOPE" + this.scopes.length);
+
+ var expressionBraceNesting = this.braceNesting + 0;
+
+ var parensNesting = 0;
+
+ var isObjectLitAr = new Gee.ArrayList<bool>();
+ isObjectLitAr.add(false);
+
+
+
+ //var scopeIndent = '';
+ //this.scopes.forEach(function() {
+ // scopeIndent += ' ';
+ //});
+ //print(">> ENTER SCOPE");
+
+
+
+
+ var token = this.ts.lookTok(1);
+ while (token != null) {
+ // this.timerPrint("parseScope AFTER lookT: " + token.toString());
+ //this.dumpToken(token , this.scopes, this.braceNesting);
+ //print('SCOPE:' + token.toString());
+ //this.log(token.data);
+ //if (token.type == 'NAME') {
+ // print('*' + token.data);
+ //}
+ switch(token.type + '.' + token.name) {
+ case "KEYW.VAR":
+ case "KEYW.CONST": // not really relivant as it's only mozzy that does this.
+ //print('SCOPE-VAR:' + token.toString());
+ var vstart = this.ts.cursor +1;
+
+ //this.log("parseScope GOT VAR/CONST : " + token.toString());
+ while (true) {
+ token = this.ts.nextTok();
+ //!this.debug|| print( token.toString());
+ // print('SCOPE-VAR-VAL:' + JSON.stringify(token, null, 4));
+ if (token == null) { // can return false at EOF!
+ break;
+ }
+ if (token.name == "VAR" || token.data == ",") { // kludge..
+ continue;
+ }
+ //this.logR("parseScope GOT VAR : <B>" + token.toString() + "</B>");
+ if (token.type != "NAME") {
+
+ for(var i = int.max(this.ts.cursor-10,0); i < this.ts.cursor+1; i++) {
+ print(this.ts.tokens[i].toString());
+ }
+
+ print( "var without ident");
+ GLib.Process.exit (0);
+ }
+
+
+ if (this.mode == ScopeParserMode.BUILDING_SYMBOL_TREE) {
+ var identifier = scope.getIdentifier(token.data,token) ;
+
+ if (identifier == false) {
+ scope.declareIdentifier(token.data, token);
+ } else {
+ token.identifier = identifier;
+ this.warn("(SCOPE) The variable " + token.data + " (line:" + token.line + ") has already been declared in the same scope...");
+ }
+ }
+
+ token = this.ts.nextTok();
+ //!this.debug|| print(token.toString());
+ /*
+ assert token.getType() == Token.SEMI ||
+ token.getType() == Token.ASSIGN ||
+ token.getType() == Token.COMMA ||
+ token.getType() == Token.IN;
+ */
+ if (token.name == "IN") {
+ break;
+ } else {
+ //var bn = this.braceNesting;
+ var bn = this.braceNesting;
+ var nts = new Gee.ArrayList<Token>();
+ while (true) {
+ if (!token || token.type == "VOID" || token.data == ",") {
+ break;
+ }
+ nts.add(token);
+ token = this.ts.nextTok();
+ }
+ if (nts.size > 0) {
+ var TS = this.ts;
+ this.ts = new TokenStream(nts);
+ this.parseExpression(scope);
+ this.ts = TS;
+ }
+
+ this.braceNesting = bn;
+ //this.braceNesting = bn;
+ //this.logR("parseScope DONE : <B>ParseExpression</B> - tok is:" + this.ts.lookT(0).toString());
+
+ token = this.ts.lookTok(1);
+ //!this.debug||
+ // print("AFTER EXP: " + token.toString());
+ if (token.data == ";") {
+ break;
+ }
+ }
+ }
+
+ //print("VAR:")
+ //this.ts.dump(vstart , this.ts.cursor);
+
+ break;
+
+
+ case "KEYW.FUNCTION":
+ //if (this.mode == 'BUILDING_SYMBOL_TREE')
+ // print('SCOPE-FUNC:' + JSON.stringify(token,null,4));
+ //println("<i>"+token.data+"</i>");
+ var bn = this.braceNesting;
+ this.parseFunctionDeclaration(scope);
+ this.braceNesting = bn;
+ break;
+
+ case "PUNC.LEFT_CURLY": // {
+ case "PUNC.LEFT_PAREN": // (
+ case "PUNC.LEFT_BRACE": // [
+ //print('SCOPE-CURLY/PAREN:' + token.toString());
+ //println("<i>"+token.data+"</i>");
+ var curTS = this.ts;
+ if (token.props.size() > 0) {
+
+ // { a : ... , c : .... }
+ var iter = token.props.map_iterator();
+
+ while(iter.next()) {
+
+ TokenKeyMap val = iter.get_value(); // TokenKeyMap
+
+
+ // print('SCOPE-PROPS:' + JSON.stringify(token.props[prop],null,4));
+ if (val.vals.get(0).data == "function") {
+ // parse a function..
+ this.ts = new TokenStream(val.vals);
+ this.ts.nextTok();
+ this.parseFunctionDeclaration(scope);
+
+ continue;
+ }
+ // key value..
+
+ this.ts = new TokenStream(val.vals);
+ this.parseExpression(scope);
+
+ }
+ this.ts = curTS;
+
+ // it's an object literal..
+ // the values could be replaced..
+ break;
+ }
+
+ // ( ... ) or { .... } not object literals..
+
+
+ for (var xx =0; xx < token.items.size; xx++) {
+ expr = token.items.get(xx);
+ //token.items.forEach(function(expr) {
+ //print(expr.toString());
+ this.ts = new TokenStream(expr);
+ //if (curTS.data == '(') {
+ this.parseScope(scope);
+ //} else {
+ // _this.parseExpression(scope)
+ //}
+
+ }
+ this.ts = curTS;
+ //print("NOT PROPS"); Seed.quit();
+
+ //isObjectLitAr.push(false);
+ //this.braceNesting++;
+
+ //print(">>>>>> OBJLIT PUSH(false)" + this.braceNesting);
+ break;
+
+ case "PUNC.RIGHT_CURLY": // }
+ //print("<< EXIT SCOPE");
+ return;
+
+ case "KEYW.WITH":
+ //print('SCOPE-WITH:' + token.toString());
+ //println("<i>"+token.data+"</i>");
+ if (this.mode == ScopeParserMode.BUILDING_SYMBOL_TREE) {
+ // Inside a 'with' block, it is impossible to figure out
+ // statically whether a symbol is a local variable or an
+ // object member. As a consequence, the only thing we can
+ // do is turn the obfuscation off for the highest scope
+ // containing the 'with' block.
+ this.protectScopeFromObfuscation(scope);
+ this.warn("Using 'with' is not recommended." + (this.munge ? " Moreover, using 'with' reduces the level of compression!" : ""), true);
+ }
+ break;
+
+ case "KEYW.CATCH":
+ //print('SCOPE-CATCH:' + token.toString());
+ //println("<i>"+token.data+"</i>");
+ this.parseCatch(scope);
+ break;
+
+ case "STRN.DOUBLE_QUOTE": // used for object lit detection..
+ case "STRN.SINGLE_QUOTE":
+ // print('SCOPE-STRING:' + token.toString());
+ //println("<i>"+token.data+"</i>");
+
+ if (this.ts.lookTok(-1).data == "{" && this.ts.lookTok(1).data == ":") {
+ // then we are in an object lit.. -> we need to flag the brace as such...
+ isObjectLitAr.remove_at(isObjectLitAr.size-1);
+ isObjectLitAr.add(true);
+ //print(">>>>>> OBJLIT REPUSH(true)");
+ }
+ isInObjectLitAr = isObjectLitAr.get(isObjectLitAr.size-1);
+
+ if (isInObjectLitAr && this.ts.lookTok(1).data == ":" &&
+ ( this.ts.lookTok(-1).data == "{" || this.ts.lookTok(-1).data == ":" )) {
+ // see if we can replace..
+ // remove the quotes..
+ // should do a bit more checking!!!! (what about wierd char's in the string..
+ var str = token.data.substring(1,token.data.length-1);
+
+ if (Regex.match_simple ("^[a-z_]+$", str) && this.idents.index_of(str) < 0) {
+ token.outData = str;
+ }
+
+
+
+ }
+
+ break;
+
+ case "NAME.NAME":
+ //print('SCOPE-NAME:' + token.toString());
+ //print("DEAL WITH NAME:");
+ // got identifier..
+ // look for { ** : <- indicates obj literal.. ** this could occur with numbers ..
+ // skip anyting with "." before it..!!
+
+ if (this.ts.lookTok(-1).data == ".") {
+ // skip, it's an object prop.
+ //println("<i>"+token.data+"</i>");
+ break;
+ }
+ //print("SYMBOL: " + token.toString());
+
+ symbol = token.data;
+ if (symbol == "this") {
+ break;
+ }
+
+ if (this.mode == ScopeParserMode.PASS2_SYMBOL_TREE) {
+
+ //println("GOT IDENT: -2 : " + this.ts.lookT(-2).toString() + " <BR> ..... -1 : " + this.ts.lookT(-1).toString() + " <BR> ");
+
+ //print ("MUNGE?" + symbol);
+
+ //println("GOT IDENT: <B>" + symbol + "</B><BR/>");
+
+ //println("GOT IDENT (2): <B>" + symbol + "</B><BR/>");
+ identifier = this.getIdentifier(symbol, scope, token);
+
+ if (identifier == false) {