* * Usage: $minified = JSMinPlus::minify($script [, $filename]) * * Versionlog (see also changelog.txt): * 12-04-2009 - some small bugfixes and performance improvements * 09-04-2009 - initial open sourced version 1.0 * * Latest version of this script: http://files.tweakers.net/jsminplus/jsminplus.zip * */ /* ***** BEGIN LICENSE BLOCK ***** * Version: MPL 1.1/GPL 2.0/LGPL 2.1 * * The contents of this file are subject to the Mozilla Public License Version * 1.1 (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * http://www.mozilla.org/MPL/ * * Software distributed under the License is distributed on an "AS IS" basis, * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License * for the specific language governing rights and limitations under the * License. * * The Original Code is the Narcissus JavaScript engine. * * The Initial Developer of the Original Code is * Brendan Eich . * Portions created by the Initial Developer are Copyright (C) 2004 * the Initial Developer. All Rights Reserved. * * Contributor(s): Tino Zijdel * PHP port, modifications and minifier routine are (C) 2009 * * Alternatively, the contents of this file may be used under the terms of * either the GNU General Public License Version 2 or later (the "GPL"), or * the GNU Lesser General Public License Version 2.1 or later (the "LGPL"), * in which case the provisions of the GPL or the LGPL are applicable instead * of those above. If you wish to allow use of your version of this file only * under the terms of either the GPL or the LGPL, and not to allow others to * use your version of this file under the terms of the MPL, indicate your * decision by deleting the provisions above and replace them with the notice * and other provisions required by the GPL or the LGPL. If you do not delete * the provisions above, a recipient may use your version of this file under * the terms of any one of the MPL, the GPL or the LGPL. 
*
 * ***** END LICENSE BLOCK ***** */

// Token types produced by the tokenizer.
define('TOKEN_END', 1);
define('TOKEN_NUMBER', 2);
define('TOKEN_IDENTIFIER', 3);
define('TOKEN_STRING', 4);
define('TOKEN_REGEXP', 5);
define('TOKEN_NEWLINE', 6);
define('TOKEN_CONDCOMMENT_MULTILINE', 7);

// Synthetic node types assigned by the parser.
define('JS_SCRIPT', 100);
define('JS_BLOCK', 101);
define('JS_LABEL', 102);
define('JS_FOR_IN', 103);
define('JS_CALL', 104);
define('JS_NEW_WITH_ARGS', 105);
define('JS_INDEX', 106);
define('JS_ARRAY_INIT', 107);
define('JS_OBJECT_INIT', 108);
define('JS_PROPERTY_INIT', 109);
define('JS_GETTER', 110);
define('JS_SETTER', 111);
define('JS_GROUP', 112);
define('JS_LIST', 113);

// Function forms.
define('DECLARED_FORM', 0);
define('EXPRESSED_FORM', 1);
define('STATEMENT_FORM', 2);

/**
 * Minifier front-end: parses a script with JSParser and serialises the
 * resulting node tree back to compact JavaScript source.
 *
 * Usage: $minified = JSMinPlus::minify($script [, $filename])
 */
class JSMinPlus
{
    private $parser;

    // Names that isValidIdentifier() refuses, so they are never emitted
    // unquoted as a property name.
    private $reserved = array(
        'break', 'case', 'catch', 'continue', 'default', 'delete', 'do',
        'else', 'finally', 'for', 'function', 'if', 'in', 'instanceof',
        'new', 'return', 'switch', 'this', 'throw', 'try', 'typeof', 'var',
        'void', 'while', 'with',
        // Words reserved for future use
        'abstract', 'boolean', 'byte', 'char', 'class', 'const', 'debugger',
        'double', 'enum', 'export', 'extends', 'final', 'float', 'goto',
        'implements', 'import', 'int', 'interface', 'long', 'native',
        'package', 'private', 'protected', 'public', 'short', 'static',
        'super', 'synchronized', 'throws', 'transient', 'volatile',
        // These are not reserved, but should be taken into account
        // in isValidIdentifier (See jslint source code)
        'arguments', 'eval', 'true', 'false', 'Infinity', 'NaN', 'null', 'undefined'
    );

    /**
     * Private: instances are only created by minify().
     */
    private function __construct()
    {
        $this->parser = new JSParser();
    }

    /**
     * Minify a script.
     *
     * @param string $js       JavaScript source.
     * @param string $filename Passed through to the parser together with $js.
     * @return string|false    Minified source, or false when an Exception was
     *                         raised while parsing or serialising (its message
     *                         is echoed, see min()).
     */
    static public function minify($js, $filename='')
    {
        static $instance = null;

        // this is a singleton
        if (!$instance)
        {
            $instance = new JSMinPlus();
        }

        return $instance->min($js, $filename);
    }

    /**
     * Parse $js (starting at line number 1) and serialise the tree.
     *
     * Any Exception is caught, its message is echoed followed by a newline,
     * and false is returned instead of the minified source.
     */
    private function min($js, $filename)
    {
        try
        {
            $n = $this->parser->parse($js, $filename, 1);
            return $this->parseTree($n);
        }
        catch (Exception $e)
        {
            echo $e->getMessage() . "\n";
        }

        return false;
    }

    /**
     * Serialise a parse-tree node (and, recursively, its children) to
     * minified JavaScript.
     *
     * @param object $n               Node; $n->type selects the output rule.
     * @param bool   $noBlockGrouping When true, a block holding more than one
     *                                statement is NOT wrapped in curly braces
     *                                (the caller emits the braces itself).
     * @return string
     * @throws Exception for KEYWORD_DEBUGGER nodes and unknown node types.
     */
    private function parseTree($n, $noBlockGrouping = false)
    {
        $s = '';

        switch ($n->type)
        {
            case KEYWORD_FUNCTION:
                $s .= 'function' . ($n->name ? ' ' . $n->name : '') . '(' .
                    $this->parameterList($n->params) .
                    '){' . $this->parseTree($n->body, true) . '}';
                break;

            case JS_SCRIPT:
                // we do nothing with funDecls or varDecls
                $noBlockGrouping = true;
                // fall through
            case JS_BLOCK:
                $childs = $n->treeNodes;
                for ($c = 0, $i = 0, $j = count($childs); $i < $j; $i++)
                {
                    $t = $this->parseTree($childs[$i]);
                    if (strlen($t))
                    {
                        if ($c)
                        {
                            if ($childs[$i]->type == KEYWORD_FUNCTION && $childs[$i]->functionForm == DECLARED_FORM)
                            {
                                // put declared functions on a new line
                                $s .= "\n";
                            }
                            elseif (substr($s, -1) != ';')
                            {
                                // The previous statement may already end in
                                // the ';' that stands for its empty body; do
                                // not emit a second terminator then.
                                $s .= ';';
                            }
                        }

                        $s .= $t;
                        $c++;
                    }
                }

                if ($c > 1 && !$noBlockGrouping)
                {
                    $s = '{' . $s . '}';
                }
                break;

            case KEYWORD_IF:
                $s = 'if(' . $this->parseTree($n->condition) . ')';
                // An empty then-part becomes ';' so that indexing [0] below is
                // always valid and the statement stays syntactically complete.
                $thenPart = $this->statementBody($this->parseTree($n->thenPart));
                $elsePart = $n->elsePart ? $this->parseTree($n->elsePart) : null;

                // quite a rancid hack to see if we should enclose the thenpart in brackets
                if ($thenPart[0] != '{')
                {
                    if (strpos($thenPart, 'if(') !== false)
                        $thenPart = '{' . $thenPart . '}';
                    elseif ($elsePart && substr($thenPart, -1) != ';')
                        $thenPart .= ';';
                }

                $s .= $thenPart;

                if ($elsePart)
                {
                    $s .= 'else';

                    if ($elsePart[0] != '{')
                        $s .= ' ';

                    $s .= $elsePart;
                }
                break;

            case KEYWORD_SWITCH:
                $s = 'switch(' . $this->parseTree($n->discriminant) . '){';
                $cases = $n->cases;
                // Statements of consecutive cases are separated by ';'. The
                // separator is written lazily (before the next label) so that
                // none trails the last case and a ';' that belongs to an
                // empty-bodied statement is never stripped.
                $separatorPending = false;
                for ($i = 0, $j = count($cases); $i < $j; $i++)
                {
                    if ($separatorPending)
                        $s .= ';';

                    $case = $cases[$i];
                    if ($case->type == KEYWORD_CASE)
                        $s .= 'case' . ($case->caseLabel->type != TOKEN_STRING ? ' ' : '') . $this->parseTree($case->caseLabel) . ':';
                    else
                        $s .= 'default:';

                    $statement = $this->parseTree($case->statements);
                    $separatorPending = false;
                    if ($statement)
                    {
                        $s .= $statement;
                        $separatorPending = substr($statement, -1) != ';';
                    }
                }
                $s .= '}';
                break;

            case KEYWORD_FOR:
                $s = 'for(' .
                    ($n->setup ? $this->parseTree($n->setup) : '') . ';' .
                    ($n->condition ? $this->parseTree($n->condition) : '') . ';' .
                    ($n->update ? $this->parseTree($n->update) : '') . ')' .
                    $this->statementBody($this->parseTree($n->body));
                break;

            case KEYWORD_WHILE:
                $s = 'while(' . $this->parseTree($n->condition) . ')' .
                    $this->statementBody($this->parseTree($n->body));
                break;

            case JS_FOR_IN:
                $s = 'for(' .
                    ($n->varDecl ? $this->parseTree($n->varDecl) : $this->parseTree($n->iterator)) .
                    ' in ' . $this->parseTree($n->object) . ')' .
                    $this->statementBody($this->parseTree($n->body));
                break;

            case KEYWORD_DO:
                $s = 'do{' . $this->parseTree($n->body, true) . '}while(' . $this->parseTree($n->condition) . ')';
                break;

            case KEYWORD_BREAK:
            case KEYWORD_CONTINUE:
                $s = $n->value . ($n->label ? ' ' . $n->label : '');
                break;

            case KEYWORD_TRY:
                $s = 'try{' . $this->parseTree($n->tryBlock, true) . '}';
                $catchClauses = $n->catchClauses;
                for ($i = 0, $j = count($catchClauses); $i < $j; $i++)
                {
                    $t = $catchClauses[$i];
                    $s .= 'catch(' . $t->varName .
                        ($t->guard ? ' if ' . $this->parseTree($t->guard) : '') .
                        '){' . $this->parseTree($t->block, true) . '}';
                }
                if ($n->finallyBlock)
                    $s .= 'finally{' . $this->parseTree($n->finallyBlock, true) . '}';
                break;

            case KEYWORD_THROW:
                $s = 'throw ' . $this->parseTree($n->exception);
                break;

            case KEYWORD_RETURN:
                $s = 'return' . ($n->value ? ' ' . $this->parseTree($n->value) : '');
                break;

            case KEYWORD_WITH:
                $s = 'with(' . $this->parseTree($n->object) . ')' .
                    $this->statementBody($this->parseTree($n->body));
                break;

            case KEYWORD_VAR:
            case KEYWORD_CONST:
                $s = $n->value . ' ';
                $childs = $n->treeNodes;
                for ($i = 0, $j = count($childs); $i < $j; $i++)
                {
                    $t = $childs[$i];
                    $s .= ($i ? ',' : '') . $t->name;
                    $u = $t->initializer;
                    if ($u)
                        $s .= '=' . $this->parseTree($u);
                }
                break;

            case KEYWORD_DEBUGGER:
                throw new Exception('NOT IMPLEMENTED: DEBUGGER');

            case TOKEN_CONDCOMMENT_MULTILINE:
                $s = $n->value . ' ' . $this->joinNodes($n->treeNodes, '');
                break;

            case OP_SEMICOLON:
                if ($expression = $n->expression)
                    $s = $this->parseTree($expression);
                break;

            case JS_LABEL:
                $s = $n->label . ':' . $this->statementBody($this->parseTree($n->statement));
                break;

            case OP_COMMA:
                $s = $this->joinNodes($n->treeNodes, ',');
                break;

            case OP_ASSIGN:
                $s = $this->parseTree($n->treeNodes[0]) . $n->value . $this->parseTree($n->treeNodes[1]);
                break;

            case OP_HOOK:
                $s = $this->parseTree($n->treeNodes[0]) . '?' .
                    $this->parseTree($n->treeNodes[1]) . ':' .
                    $this->parseTree($n->treeNodes[2]);
                break;

            case OP_OR: case OP_AND:
            case OP_BITWISE_OR: case OP_BITWISE_XOR: case OP_BITWISE_AND:
            case OP_EQ: case OP_NE: case OP_STRICT_EQ: case OP_STRICT_NE:
            case OP_LT: case OP_LE: case OP_GE: case OP_GT:
            case OP_LSH: case OP_RSH: case OP_URSH:
            case OP_MUL: case OP_DIV: case OP_MOD:
                // For these operators the node type is itself the text that
                // is written between the operands.
                $s = $this->parseTree($n->treeNodes[0]) . $n->type . $this->parseTree($n->treeNodes[1]);
                break;

            case OP_PLUS:
            case OP_MINUS:
                $s = $this->parseTree($n->treeNodes[0]) . $n->type;
                $nextTokenType = $n->treeNodes[1]->type;
                // Keep a space when the right operand itself starts with a
                // plus/minus style operator, so the signs are not glued
                // together in the output.
                if (
                    $nextTokenType == OP_PLUS || $nextTokenType == OP_MINUS ||
                    $nextTokenType == OP_INCREMENT || $nextTokenType == OP_DECREMENT ||
                    $nextTokenType == OP_UNARY_PLUS || $nextTokenType == OP_UNARY_MINUS
                )
                    $s .= ' ';
                $s .= $this->parseTree($n->treeNodes[1]);
                break;

            case KEYWORD_IN:
                $s = $this->parseTree($n->treeNodes[0]) . ' in ' . $this->parseTree($n->treeNodes[1]);
                break;

            case KEYWORD_INSTANCEOF:
                $s = $this->parseTree($n->treeNodes[0]) . ' instanceof ' . $this->parseTree($n->treeNodes[1]);
                break;

            case KEYWORD_DELETE:
                $s = 'delete ' . $this->parseTree($n->treeNodes[0]);
                break;

            case KEYWORD_VOID:
                $s = 'void(' . $this->parseTree($n->treeNodes[0]) . ')';
                break;

            case KEYWORD_TYPEOF:
                $s = 'typeof ' . $this->parseTree($n->treeNodes[0]);
                break;

            case OP_NOT:
            case OP_BITWISE_NOT:
            case OP_UNARY_PLUS:
            case OP_UNARY_MINUS:
                $s = $n->value . $this->parseTree($n->treeNodes[0]);
                break;

            case OP_INCREMENT:
            case OP_DECREMENT:
                if ($n->postfix)
                    $s = $this->parseTree($n->treeNodes[0]) . $n->value;
                else
                    $s = $n->value . $this->parseTree($n->treeNodes[0]);
                break;

            case OP_DOT:
                $s = $this->parseTree($n->treeNodes[0]) . '.' . $this->parseTree($n->treeNodes[1]);
                break;

            case JS_INDEX:
                $s = $this->parseTree($n->treeNodes[0]);
                // See if we can replace named index with a dot saving 3 bytes
                if (
                    $n->treeNodes[0]->type == TOKEN_IDENTIFIER &&
                    $n->treeNodes[1]->type == TOKEN_STRING &&
                    $this->isValidIdentifier(substr($n->treeNodes[1]->value, 1, -1))
                )
                    $s .= '.' . substr($n->treeNodes[1]->value, 1, -1);
                else
                    $s .= '[' . $this->parseTree($n->treeNodes[1]) . ']';
                break;

            case JS_LIST:
                $s = $this->joinNodes($n->treeNodes, ',');
                break;

            case JS_CALL:
                $s = $this->parseTree($n->treeNodes[0]) . '(' . $this->parseTree($n->treeNodes[1]) . ')';
                break;

            case KEYWORD_NEW:
            case JS_NEW_WITH_ARGS:
                $s = 'new ' . $this->parseTree($n->treeNodes[0]) . '(' .
                    ($n->type == JS_NEW_WITH_ARGS ? $this->parseTree($n->treeNodes[1]) : '') . ')';
                break;

            case JS_ARRAY_INIT:
                $s = '[' . $this->joinNodes($n->treeNodes, ',') . ']';
                break;

            case JS_OBJECT_INIT:
                $s = '{';
                $childs = $n->treeNodes;
                for ($i = 0, $j = count($childs); $i < $j; $i++)
                {
                    $t = $childs[$i];
                    if ($i)
                        $s .= ',';

                    if ($t->type == JS_PROPERTY_INIT)
                    {
                        // Ditch the quotes when the index is a valid identifier
                        if (
                            $t->treeNodes[0]->type == TOKEN_STRING &&
                            $this->isValidIdentifier(substr($t->treeNodes[0]->value, 1, -1))
                        )
                            $s .= substr($t->treeNodes[0]->value, 1, -1);
                        else
                            $s .= $t->treeNodes[0]->value;

                        $s .= ':' . $this->parseTree($t->treeNodes[1]);
                    }
                    else
                    {
                        // The parameter list is built by a helper with its own
                        // counters: looping here with $i/$j would overwrite
                        // the property loop's counters and drop every
                        // property that follows a getter or setter.
                        $s .= $t->type == JS_GETTER ? 'get' : 'set';
                        $s .= ' ' . $t->name . '(' . $this->parameterList($t->params) .
                            '){' . $this->parseTree($t->body, true) . '}';
                    }
                }
                $s .= '}';
                break;

            case KEYWORD_NULL: case KEYWORD_THIS: case KEYWORD_TRUE: case KEYWORD_FALSE:
            case TOKEN_IDENTIFIER: case TOKEN_NUMBER: case TOKEN_STRING: case TOKEN_REGEXP:
                $s = $n->value;
                break;

            case JS_GROUP:
                $s = '(' . $this->parseTree($n->treeNodes[0]) . ')';
                break;

            default:
                throw new Exception('UNKNOWN TOKEN TYPE: ' . $n->type);
        }

        return $s;
    }

    /**
     * Join formal parameter names with commas.
     */
    private function parameterList($params)
    {
        $list = '';
        for ($p = 0, $q = count($params); $p < $q; $p++)
            $list .= ($p ? ',' : '') . $params[$p];

        return $list;
    }

    /**
     * Serialise each node in $nodes and concatenate the results with $glue.
     */
    private function joinNodes($nodes, $glue)
    {
        $out = '';
        for ($k = 0, $m = count($nodes); $k < $m; $k++)
            $out .= ($k ? $glue : '') . $this->parseTree($nodes[$k]);

        return $out;
    }

    /**
     * Return $code, or ';' when $code is empty, for positions where the
     * output must contain a statement (if/loop/with bodies, labelled
     * statements).
     */
    private function statementBody($code)
    {
        return (string) $code === '' ? ';' : $code;
    }

    /**
     * Tell whether $string can be written as a bare identifier: ASCII
     * letters, digits and underscore, not starting with a digit, and not
     * listed in $this->reserved.
     */
    private function isValidIdentifier($string)
    {
        return preg_match('/^[a-zA-Z_][a-zA-Z0-9_]*$/', $string) && !in_array($string, $this->reserved, true);
    }
}

class JSParser
{
    private $t;

    private $opPrecedence = array(
        ';' => 0,
        ',' => 1,
        '=' => 2, '?' => 2, ':' => 2,
        // The above all have to have the same precedence, see bug 330975.
        '||' => 4,
        '&&' => 5,
        '|' => 6,
        '^' => 7,
        '&' => 8,
        '==' => 9, '!=' => 9, '===' => 9, '!==' => 9,
        '<' => 10, '<=' => 10, '>=' => 10, '>' => 10, 'in' => 10, 'instanceof' => 10,
        '<<' => 11, '>>' => 11, '>>>' => 11,
        '+' => 12, '-' => 12,
        '*' => 13, '/' => 13, '%' => 13,
        'delete' => 14, 'void' => 14, 'typeof' => 14,
        '!' => 14, '~' => 14, 'U+' => 14, 'U-' => 14,
        '++' => 15, '--' => 15,
        'new' => 16,
        '.' => 17,
        JS_NEW_WITH_ARGS => 0, JS_INDEX => 0, JS_CALL => 0,
        JS_ARRAY_INIT => 0, JS_OBJECT_INIT => 0, JS_GROUP => 0
    );

    private $opArity = array(
        ',' => -2,
        '=' => 2,
        '?' => 3,
        '||' => 2,
        '&&' => 2,
        '|' => 2,
        '^' => 2,
        '&' => 2,
        '==' => 2, '!=' => 2, '===' => 2, '!==' => 2,
        '<' => 2, '<=' => 2, '>=' => 2, '>' => 2, 'in' => 2, 'instanceof' => 2,
        '<<' => 2, '>>' => 2, '>>>' => 2,
        '+' => 2, '-' => 2,
        '*' => 2, '/' => 2, '%' => 2,
        'delete' => 1, 'void' => 1, 'typeof' => 1,
        '!' => 1, '~' => 1, 'U+' => 1, 'U-' => 1,
        '++' => 1, '--' => 1,
        'new' => 1,
        '.'
=> 2, JS_NEW_WITH_ARGS => 2, JS_INDEX => 2, JS_CALL => 2, JS_ARRAY_INIT => 1, JS_OBJECT_INIT => 1, JS_GROUP => 1, TOKEN_CONDCOMMENT_MULTILINE => 1 ); public function __construct() { $this->t = new JSTokenizer(); } public function parse($s, $f, $l) { // initialize tokenizer $this->t->init($s, $f, $l); $x = new JSCompilerContext(false); $n = $this->Script($x); if (!$this->t->isDone()) throw $this->t->newSyntaxError('Syntax error'); return $n; } private function Script($x) { $n = $this->Statements($x); $n->type = JS_SCRIPT; $n->funDecls = $x->funDecls; $n->varDecls = $x->varDecls; return $n; } private function Statements($x) { $n = new JSNode($this->t, JS_BLOCK); array_push($x->stmtStack, $n); while (!$this->t->isDone() && $this->t->peek() != OP_RIGHT_CURLY) $n->addNode($this->Statement($x)); array_pop($x->stmtStack); return $n; } private function Block($x) { $this->t->mustMatch(OP_LEFT_CURLY); $n = $this->Statements($x); $this->t->mustMatch(OP_RIGHT_CURLY); return $n; } private function Statement($x) { $tt = $this->t->get(); $n2 = null; // Cases for statements ending in a right curly return early, avoiding the // common semicolon insertion magic after this switch. switch ($tt) { case KEYWORD_FUNCTION: return $this->FunctionDefinition( $x, true, count($x->stmtStack) > 1 ? STATEMENT_FORM : DECLARED_FORM ); break; case OP_LEFT_CURLY: $n = $this->Statements($x); $this->t->mustMatch(OP_RIGHT_CURLY); return $n; case KEYWORD_IF: $n = new JSNode($this->t); $n->condition = $this->ParenExpression($x); array_push($x->stmtStack, $n); $n->thenPart = $this->Statement($x); $n->elsePart = $this->t->match(KEYWORD_ELSE) ? 
$this->Statement($x) : null; array_pop($x->stmtStack); return $n; case KEYWORD_SWITCH: $n = new JSNode($this->t); $this->t->mustMatch(OP_LEFT_PAREN); $n->discriminant = $this->Expression($x); $this->t->mustMatch(OP_RIGHT_PAREN); $n->cases = array(); $n->defaultIndex = -1; array_push($x->stmtStack, $n); $this->t->mustMatch(OP_LEFT_CURLY); while (($tt = $this->t->get()) != OP_RIGHT_CURLY) { switch ($tt) { case KEYWORD_DEFAULT: if ($n->defaultIndex >= 0) throw $this->t->newSyntaxError('More than one switch default'); // FALL THROUGH case KEYWORD_CASE: $n2 = new JSNode($this->t); if ($tt == KEYWORD_DEFAULT) $n->defaultIndex = count($n->cases); else $n2->caseLabel = $this->Expression($x, OP_COLON); break; default: throw $this->t->newSyntaxError('Invalid switch case'); } $this->t->mustMatch(OP_COLON); $n2->statements = new JSNode($this->t, JS_BLOCK); while (($tt = $this->t->peek()) != KEYWORD_CASE && $tt != KEYWORD_DEFAULT && $tt != OP_RIGHT_CURLY) $n2->statements->addNode($this->Statement($x)); array_push($n->cases, $n2); } array_pop($x->stmtStack); return $n; case KEYWORD_FOR: $n = new JSNode($this->t); $n->isLoop = true; $this->t->mustMatch(OP_LEFT_PAREN); if (($tt = $this->t->peek()) != OP_SEMICOLON) { $x->inForLoopInit = true; if ($tt == KEYWORD_VAR || $tt == KEYWORD_CONST) { $this->t->get(); $n2 = $this->Variables($x); } else { $n2 = $this->Expression($x); } $x->inForLoopInit = false; } if ($n2 && $this->t->match(KEYWORD_IN)) { $n->type = JS_FOR_IN; if ($n2->type == KEYWORD_VAR) { if (count($n2->treeNodes) != 1) { throw $this->t->SyntaxError( 'Invalid for..in left-hand side', $this->t->filename, $n2->lineno ); } // NB: n2[0].type == IDENTIFIER and n2[0].value == n2[0].name. $n->iterator = $n2->treeNodes[0]; $n->varDecl = $n2; } else { $n->iterator = $n2; $n->varDecl = null; } $n->object = $this->Expression($x); } else { $n->setup = $n2 ? $n2 : null; $this->t->mustMatch(OP_SEMICOLON); $n->condition = $this->t->peek() == OP_SEMICOLON ? 
null : $this->Expression($x); $this->t->mustMatch(OP_SEMICOLON); $n->update = $this->t->peek() == OP_RIGHT_PAREN ? null : $this->Expression($x); } $this->t->mustMatch(OP_RIGHT_PAREN); $n->body = $this->nest($x, $n); return $n; case KEYWORD_WHILE: $n = new JSNode($this->t); $n->isLoop = true; $n->condition = $this->ParenExpression($x); $n->body = $this->nest($x, $n); return $n; case KEYWORD_DO: $n = new JSNode($this->t); $n->isLoop = true; $n->body = $this->nest($x, $n, KEYWORD_WHILE); $n->condition = $this->ParenExpression($x); if (!$x->ecmaStrictMode) { //