X-Git-Url: http://git.asbjorn.biz/?a=blobdiff_plain;f=lib%2Fas3%2Fparser.y;h=59e7f6a474a59b0d727a4143f7b9f4d6e7cdfc5c;hb=3f9b43eec2a339e1c60a4139556b6153f8b3cc65;hp=c104f550e41aff6e20a589700e29d21ef5307eaa;hpb=499c73edd0924ce0d7ddbdc0c6af6a5536457021;p=swftools.git diff --git a/lib/as3/parser.y b/lib/as3/parser.y index c104f55..59e7f6a 100644 --- a/lib/as3/parser.y +++ b/lib/as3/parser.y @@ -1,54 +1,25 @@ -//%glr-parser -//%expect-rr 1 -%error-verbose +/* parser.lex -%token T_IDENTIFIER -%token T_STRING -%token T_REGEXP -%token T_DOTDOT ".." -%token T_COLONCOLON "::" -%token T_GE ">=" -%token T_LE "<=" -%token T_EQEQ "==" -%token T_PLUSPLUS "++" -%token T_MINUSMINUS "--" -%token T_IMPLEMENTS -%token T_NAMESPACE -%token T_PACKAGE -%token T_PROTECTED -%token T_PUBLIC -%token T_PRIVATE -%token T_UINT -%token T_USE -%token T_INTERNAL -%token T_INT -%token T_NEW -%token T_NATIVE -%token T_FUNCTION -%token T_FOR -%token T_CLASS -%token T_CONST -%token T_SET -%token T_STATIC -%token T_IMPORT -%token T_INTERFACE -%token T_NUMBER -%token T_NULL -%token T_FALSE -%token T_TRUE -%token T_BOOLEAN -%token T_VAR -%token T_AS -%token T_IS -%token T_DYNAMIC -%token T_OVERRIDE -%token T_FINAL -%token T_GET -%token T_EXTENDS - - -%token T_EMPTY - + Routines for compiling Flash2 AVM2 ABC Actionscript + + Extension module for the rfxswf library. + Part of the swftools package. + + Copyright (c) 2008 Matthias Kramm + + This program is free software; you can redistribute it and/or modify + it under the terms of the GNU General Public License as published by + the Free Software Foundation; either version 2 of the License, or + (at your option) any later version. + + This program is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + GNU General Public License for more details. + + You should have received a copy of the GNU General Public License + along with this program; if not, write to the Free Software + Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA */ %{ #include #include @@ -58,6 +29,189 @@ #include "files.h" #include "tokenizer.h" #include "registry.h" +#include "code.h" +#include "opcodes.h" + +%} + +//%glr-parser +//%expect-rr 1 +%error-verbose + +%union tokenunion { + tokenptr_t token; + multiname_t*multiname; + multiname_list_t*multiname_list; + int number_int; + unsigned int number_uint; + double number_float; + struct _code*code; + struct _typedcode value; + struct _typedcode_list*value_list; + struct _writeable writeable; + char*string; +} + + +%token T_IDENTIFIER +%token T_STRING +%token T_REGEXP +%token T_EMPTY +%token T_INT +%token T_UINT +%token T_BYTE +%token T_SHORT +%token T_FLOAT + +%token KW_IMPLEMENTS +%token KW_NAMESPACE "namespace" +%token KW_PACKAGE "package" +%token KW_PROTECTED +%token KW_PUBLIC +%token KW_PRIVATE +%token KW_USE "use" +%token KW_INTERNAL +%token KW_NEW "new" +%token KW_NATIVE +%token KW_FUNCTION "function" +%token KW_FOR "for" +%token KW_CLASS "class" +%token KW_CONST "const" +%token KW_SET "set" +%token KW_STATIC +%token KW_IMPORT "import" +%token KW_INTERFACE "interface" +%token KW_NULL +%token KW_VAR "var" +%token KW_DYNAMIC +%token KW_OVERRIDE +%token KW_FINAL +%token KW_GET "get" +%token KW_EXTENDS +%token KW_FALSE "false" +%token KW_TRUE "true" +%token KW_BOOLEAN "Boolean" +%token KW_UINT "uint" +%token KW_INT "int" +%token KW_WHILE "while" +%token KW_NUMBER "Number" +%token KW_STRING "String" +%token KW_IF "if" +%token KW_ELSE "else" +%token KW_BREAK "break" +%token KW_IS "is" +%token KW_AS "as" + +%token T_EQEQ "==" +%token T_EQEQEQ "===" +%token T_NE "!=" +%token T_LE "<=" +%token T_GE ">=" +%token T_DIVBY "/=" +%token T_MODBY "%=" +%token T_PLUSBY "+=" +%token T_MINUSBY "-=" +%token T_SHRBY ">>=" +%token T_SHLBY "<<=" +%token T_USHRBY ">>>=" +%token T_OROR "||" +%token T_ANDAND "&&" +%token T_COLONCOLON "::" +%token T_MINUSMINUS "--" +%token T_PLUSPLUS "++" +%token T_DOTDOT ".." +%token T_SHL "<<" +%token T_USHR ">>>" +%token T_SHR ">>" +%token T_SEMICOLON ';' +%token T_STAR '*' +%token T_DOT '.' + +%type CODE +%type CODEPIECE +%type CODEBLOCK MAYBECODE +%type PACKAGE_DECLARATION +%type FUNCTION_DECLARATION +%type VARIABLE_DECLARATION +%type CLASS_DECLARATION +%type NAMESPACE_DECLARATION +%type INTERFACE_DECLARATION +%type VOIDEXPRESSION +%type EXPRESSION +%type MAYBEEXPRESSION +%type E +%type LH +%type CONSTANT +%type FOR IF WHILE MAYBEELSE BREAK +%type USE_NAMESPACE +%type ASSIGNMENT FOR_INIT +%type IMPORT +%type MAYBETYPE +%type PACKAGESPEC +%type GETSET +%type PARAM +%type PARAMS +%type PARAM_LIST +%type MODIFIERS +%type MODIFIER_LIST +%type IMPLEMENTS_LIST +%type EXTENDS +%type EXTENDS_LIST +%type PACKAGEANDCLASS +%type PACKAGEANDCLASS_LIST +%type MULTILEVELIDENTIFIER +%type TYPE +%type VAR +//%type VARIABLE +%type VAR_READ +%type NEW +%type X_IDENTIFIER +%type MODIFIER +%type PACKAGE +%type FUNCTIONCALL +%type MAYBE_EXPRESSION_LIST EXPRESSION_LIST + +// precendence: from low to high +// http://livedocs.adobe.com/flash/9.0/main/wwhelp/wwhimpl/common/html/wwhelp.htm?context=LiveDocs_Parts&file=00000012.html + +%left prec_none +%right '?' ':' +%nonassoc '=' +%nonassoc "/=" "%=" +%nonassoc "+=" "-=" +%nonassoc ">>=" +%nonassoc "<<=" +%nonassoc ">>>=" +%nonassoc "||" +%nonassoc "&&" +%nonassoc '|' +%nonassoc '^' +%nonassoc '&' +%nonassoc "!=" "==" "<=" '<' ">=" '>' // TODO: support "a < b < c" syntax? +%nonassoc "is" +%left '-' +%left '+' +%left "<<" +%left ">>>" +%left ">>" +%left '%' +%left '/' +%left '*' +%left '!' +%left '~' +%left "--" "++" +%left '[' +%nonassoc "as" +%left '.' ".." "::" +%nonassoc T_IDENTIFIER +%left below_semicolon +%left ';' +%nonassoc "else" +%left '(' +%left prec_highest + + +%{ static int yyerror(char*s) { @@ -87,6 +241,18 @@ static token_t* concat3(token_t* t1, token_t* t2, token_t* t3) t->text[l1+l2+l3] = 0; return t; } +static char* concat3str(const char* t1, const char* t2, const char* t3) +{ + int l1 = strlen(t1); + int l2 = strlen(t2); + int l3 = strlen(t3); + char*text = malloc(l1+l2+l3+1); + memcpy(text , t1, l1); + memcpy(text+l1, t2, l2); + memcpy(text+l1+l2, t3, l3); + text[l1+l2+l3] = 0; + return text; +} typedef struct _import { char*path; @@ -102,12 +268,19 @@ typedef struct _state { char*package; char*function; + /* code that needs to be executed at the start of + a method (like initializing local registers) */ + code_t*initcode; + + abc_method_body_t*m; import_list_t*imports; /* class data */ char*classname; abc_class_t*cls; + array_t*vars; + int local_var_base; } state_t; static state_t* state = 0; @@ -116,41 +289,23 @@ DECLARE_LIST(state); static state_list_t*state_stack=0; -static void initialize_state() -{ - NEW(state_t, s); - NEW(state_list_t, sl); - state_stack = sl; - state = sl->state = s; - - state->file = abc_file_new(); - state->level = 0; - - state->init = abc_initscript(state->file, 0, 0); - abc_method_body_t*m = state->init->method->body; - __ getlocal_0(m); - __ pushscope(m); -} -static void finalize_state() -{ - if(state->level) { - syntaxerror("unexpected end of file"); - } - abc_method_body_t*m = state->init->method->body; - //__ popscope(m); - __ returnvoid(m); -} - static void new_state() { NEW(state_t, s); NEW(state_list_t, sl); - memcpy(s, state, sizeof(state_t)); //shallow copy + + state_t*oldstate = state; + if(state) + memcpy(s, state, sizeof(state_t)); //shallow copy sl->next = state_stack; sl->state = s; + if(oldstate) + s->local_var_base = array_length(oldstate->vars) + oldstate->local_var_base; state_stack = sl; state = s; state->level++; + state->vars = array_new(); + state->initcode = 0; } static void old_state() { @@ -161,8 +316,39 @@ static void old_state() state_stack = state_stack->next; free(old); state = state_stack->state; + state->initcode = code_append(state->initcode, oldstate->initcode); +} +void initialize_state() +{ + new_state(); + + state->file = abc_file_new(); + state->file->flags &= ~ABCFILE_LAZY; + + state->init = abc_initscript(state->file, 0, 0); + abc_method_body_t*m = state->init->method->body; + __ getlocal_0(m); + __ pushscope(m); + __ findpropstrict(m, "[package]::trace"); + __ pushstring(m, "[entering global init function]"); + __ callpropvoid(m, "[package]::trace", 1); +} +void* finalize_state() +{ + if(state->level!=1) { + syntaxerror("unexpected end of file"); + } + abc_method_body_t*m = state->init->method->body; + //__ popscope(m); + + __ findpropstrict(m, "[package]::trace"); + __ pushstring(m, "[leaving global init function]"); + __ callpropvoid(m, "[package]::trace", 1); + __ returnvoid(m); + return state->file; } + static void startpackage(token_t*t) { if(state->package) { @@ -179,28 +365,35 @@ static void endpackage() old_state(); } -static void startclass(token_t*modifiers, token_t*name, token_t*extends, token_t*implements) +char*globalclass=0; +static void startclass(token_t*modifiers, token_t*name, multiname_t*extends, multiname_list_t*implements) { - token_list_t*t; if(state->cls) { syntaxerror("inner classes now allowed"); } new_state(); state->classname = name->text; printf("entering class %s\n", name->text); + token_list_t*t=0; printf(" modifiers: ");for(t=modifiers->tokens;t;t=t->next) printf("%s ", t->token->text);printf("\n"); - printf(" extends: %s\n", extends->text); - printf(" implements (%d): ", list_length(implements->tokens));for(t=implements->tokens;t;t=t->next) printf("%s ", t->token->text);printf("\n"); + printf(" extends: %s\n", multiname_tostring(extends)); + + multiname_list_t*mlist=0; + printf(" implements (%d): ", list_length(implements)); + for(mlist=implements;mlist;mlist=mlist->next) { + printf("%s ", multiname_tostring(mlist->multiname)); + } + printf("\n"); char public=0,internal=0,final=0,sealed=1; for(t=modifiers->tokens;t;t=t->next) { - if(t->token->type == T_INTERNAL) { + if(t->token->type == KW_INTERNAL) { /* the programmer is being explicit- being internal is the default anyway */ internal = 1; - } else if(t->token->type == T_PUBLIC) { + } else if(t->token->type == KW_PUBLIC) { public = 1; - } else if(t->token->type == T_FINAL) { + } else if(t->token->type == KW_FINAL) { final = 1; } else { syntaxerror("modifier \"%s\" not supported in class declaration", t->token->text); @@ -220,20 +413,12 @@ static void startclass(token_t*modifiers, token_t*name, token_t*extends, token_t else syntaxerror("public classes only allowed inside a package"); - /* try to find the superclass */ - multiname_t* superclass = 0; - if(extends->type != T_EMPTY) { - superclass = registry_findclass(extends->text); - } else { - superclass = registry_getobjectclass(); - } - - state->cls = abc_class_new(state->file, classname, superclass); + state->cls = abc_class_new(state->file, classname, extends); if(final) abc_class_final(state->cls); if(sealed) abc_class_sealed(state->cls); - for(t=implements->tokens;t;t=t->next) { - abc_class_add_interface(state->cls, registry_findclass(t->token->text)); + for(mlist=implements;mlist;mlist=mlist->next) { + abc_class_add_interface(state->cls, mlist->multiname); } /* now write the construction code for this class */ @@ -241,27 +426,43 @@ static void startclass(token_t*modifiers, token_t*name, token_t*extends, token_t abc_method_body_t*m = state->init->method->body; __ getglobalscope(m); - multiname_t*s = superclass; + multiname_t*s = extends; + int count=0; + while(s) { - //TODO: invert //TODO: take a look at the current scope stack, maybe // we can re-use something + s = registry_getsuperclass(s); + if(!s) + break; __ getlex2(m, s); __ pushscope(m); - s = registry_getsuperclass(s); + m->code = m->code->prev->prev; // invert count++; } + /* continue appending after last op end */ + while(m->code && m->code->next) m->code = m->code->next; + /* TODO: if this is one of *our* classes, we can also do a getglobalscope/getslot (which references the init function's slots) */ - __ getlex2(m, superclass); + __ getlex2(m, extends); + __ dup(m); + __ pushscope(m); // we get a Verify Error #1107 if this is not the top scope __ newclass(m,state->cls); - while(count--) { __ popscope(m); } __ setslot(m, slotindex); + + if(!globalclass && public && multiname_equals(registry_getMovieClip(),extends)) { + if(state->package && state->package[0]) { + globalclass = concat3str(state->package, ".", state->classname); + } else { + globalclass = strdup(state->classname); + } + } } static void endclass() @@ -284,7 +485,7 @@ static void print_imports() } } static void startfunction(token_t*ns, token_t*mod, token_t*getset, token_t*name, - token_t*params, token_t*type) + token_t*params, multiname_t*type) { token_list_t*t; new_state(); @@ -295,22 +496,30 @@ static void startfunction(token_t*ns, token_t*mod, token_t*getset, token_t*name, printf(" getset: %s\n", getset->text); printf(" params: ");for(t=params->tokens;t;t=t->next) printf("%s ", t->token->text);printf("\n"); printf(" mod: ");for(t=mod->tokens;t;t=t->next) printf("%s ", t->token->text);printf("\n"); - printf(" type: %s\n", type->text); + printf(" type: %s\n", multiname_tostring(type)); print_imports(); + + if(state->m) { + syntaxerror("not able to start another method scope"); + } + + if(!strcmp(state->classname,name->text)) { + state->m = abc_class_constructor(state->cls, type, 0); + } else { + state->m = abc_class_method(state->cls, type, name->text, 0); + } + array_append(state->vars, "this", 0); + + __ getlocal_0(state->m); + __ pushscope(state->m); } static void endfunction() { printf("leaving function %s\n", state->function); + __ returnvoid(state->m); + old_state(); } -static int newvariable(token_t*mod, token_t*varconst, token_t*name, token_t*type) -{ - token_list_t*t; - printf("defining new variable %s\n", name->text); - printf(" mod: ");for(t=mod->tokens;t;t=t->next) printf("%s ", t->token->text);printf("\n"); - printf(" access: ");printf("%s\n", varconst->text); - printf(" type: ");printf("%s\n", type->text); -} static token_t* empty_token() { NEW(token_t,t); @@ -339,152 +548,388 @@ void extend_s(token_t*list, char*seperator, token_t*add) { list->text[l1+l2+l3]=0; } +int find_variable(char*name, multiname_t**m) +{ + state_list_t* s = state_stack; + while(s) { + int i = array_find(s->state->vars, name); + if(i>=0) { + if(m) { + *m = array_getvalue(s->state->vars, i); + } + return i + s->state->local_var_base; + } + s = s->next; + } + syntaxerror("undefined variable: %s", name); +} + +multiname_t*join_types(multiname_t*type1, multiname_t*type2, char op) +{ + return registry_getanytype(); // FIXME +} +char is_subtype_of(multiname_t*type, multiname_t*supertype) +{ + return 1; // FIXME +} + +#define TYPE_ANY registry_getanytype() +#define TYPE_IS_ANY(t) ((t) == registry_getanytype()) +#define TYPE_INT registry_getintclass() +#define TYPE_IS_INT(t) ((t) == registry_getintclass()) +#define TYPE_UINT registry_getuintclass() +#define TYPE_IS_UINT(t) ((t) == registry_getuintclass()) +#define TYPE_FLOAT registry_getnumberclass() +#define TYPE_IS_FLOAT(t) ((t) == registry_getnumberclass()) +#define TYPE_BOOLEAN registry_getbooleanclass() +#define TYPE_IS_BOOLEAN(t)((t) == registry_getbooleanclass()) +#define TYPE_STRING registry_getstringclass() +#define TYPE_IS_STRING(t) ((t) == registry_getstringclass()) +#define TYPE_NULL registry_getnullclass() +#define TYPE_IS_NULL(t) ((t) == registry_getnullclass()) + %} + + %% -PROGRAM: CODE PROGRAM -PROGRAM: - -//EMPTY: { -// token_t* t = malloc(sizeof(token_t)); -// t->text = strdup(""); -// t->type = T_EMPTY; -// $$ = t; -//} - -CODE: CODE CODEPIECE {$$=$1;} -CODE: CODEPIECE {$$=empty_token();} - -MAYBECODE: CODE -MAYBECODE: - -CODEPIECE: ';' -CODEPIECE: VARIABLE_DECLARATION {$$=$1;} -CODEPIECE: PACKAGE_DECLARATION -CODEPIECE: IMPORT -CODEPIECE: NAMESPACE_DECLARATION -CODEPIECE: CLASS_DECLARATION -CODEPIECE: INTERFACE_DECLARATION -CODEPIECE: FUNCTION_DECLARATION -CODEPIECE: EXPRESSION -CODEPIECE: FOR -CODEPIECE: USE -CODEPIECE: ASSIGNMENT - -PACKAGE_DECLARATION : T_PACKAGE MULTILEVELIDENTIFIER '{' {startpackage($2)} MAYBECODE '}' {endpackage()} -PACKAGE_DECLARATION : T_PACKAGE '{' {startpackage(0)} MAYBECODE '}' {endpackage()} - -IMPORT : T_IMPORT PACKAGESPEC {addimport($2);} - -TYPE : BUILTIN_TYPE | '*' | T_IDENTIFIER -// TODO: do we need this? all it does it is clutter up our keyword space -BUILTIN_TYPE : T_STRING -BUILTIN_TYPE : T_NUMBER -BUILTIN_TYPE : T_INT -BUILTIN_TYPE : T_UINT -BUILTIN_TYPE : T_BOOLEAN -BUILTIN_TYPE : T_NULL +/* ------------ code blocks / statements ---------------- */ + +PROGRAM: MAYBECODE + +MAYBECODE: CODE {$$=$1;} +MAYBECODE: {$$=code_new();} + +CODE: CODE CODEPIECE {$$=code_append($1,$2);} +CODE: CODEPIECE {$$=$1;} + +CODEPIECE: PACKAGE_DECLARATION {$$=code_new();/*enters a scope*/} +CODEPIECE: CLASS_DECLARATION {$$=code_new();/*enters a scope*/} +CODEPIECE: INTERFACE_DECLARATION {/*TODO*/$$=code_new();} +CODEPIECE: IMPORT {$$=code_new();/*adds imports to current scope*/} +CODEPIECE: ';' {$$=code_new();} +CODEPIECE: VARIABLE_DECLARATION {$$=$1} +CODEPIECE: VOIDEXPRESSION {$$=$1} +CODEPIECE: FOR {$$=$1} +CODEPIECE: WHILE {$$=$1} +CODEPIECE: BREAK {$$=$1} +CODEPIECE: IF {$$=$1} +CODEPIECE: ASSIGNMENT {$$=$1} +CODEPIECE: NAMESPACE_DECLARATION {/*TODO*/$$=code_new();} +CODEPIECE: FUNCTION_DECLARATION {/*TODO*/$$=code_new();} +CODEPIECE: USE_NAMESPACE {/*TODO*/$$=code_new();} + +CODEBLOCK : '{' MAYBECODE '}' {$$=$2;} +CODEBLOCK : CODEPIECE ';' {$$=$1;} +CODEBLOCK : CODEPIECE %prec below_semicolon {$$=$1;} + +/* ------------ functions --------------------------- */ + +FUNCTION_DECLARATION: MODIFIERS "function" GETSET T_IDENTIFIER '(' PARAMS ')' + MAYBETYPE '{' {startfunction(0,$1,$3,$4,$6,$8)} MAYBECODE '}' { + if(!state->m) syntaxerror("internal error: undefined function"); + state->m->code = code_append(state->initcode, $11);state->initcode=0; + endfunction() +} + +/* ------------ variables --------------------------- */ + +MAYBEEXPRESSION : '=' EXPRESSION {$$=$2;} + | {$$.c=abc_pushundefined(0); + $$.t=TYPE_ANY; + } + +VAR : "const" | "var" +VARIABLE_DECLARATION : VAR T_IDENTIFIER MAYBETYPE MAYBEEXPRESSION { + if(array_contains(state->vars, $2->text)) + syntaxerror("Variable %s already defined", $2->text); + $$ = $4.c; + + if(!is_subtype_of($4.t, $3)) { + syntaxerror("Can't convert %s to %s", multiname_tostring($4.t), multiname_tostring($3)); + } + + int index = array_append(state->vars, $2->text, $3) + state->local_var_base; + $$ = abc_setlocal($$, index); + + if($3) { + if(TYPE_IS_INT($3) || TYPE_IS_UINT($3) || TYPE_IS_FLOAT($3)) { + state->initcode = abc_pushbyte(state->initcode, 32); + } else if(TYPE_IS_BOOLEAN($3)) { + state->initcode = abc_pushfalse(state->initcode); + } else { + state->initcode = abc_pushnull(state->initcode); + } + state->initcode = abc_setlocal(state->initcode, index); + } /*else { + // that's the default for a local register, anyway + state->initcode = abc_pushundefined(state->initcode); + state->initcode = abc_setlocal(state->initcode, index); + }*/ + printf("variable %s -> %d (%s)\n", $2->text, index, $4.t->name); +} +ASSIGNMENT : T_IDENTIFIER '=' EXPRESSION { + multiname_t*type=0; + int i = find_variable($1->text, &type); + $$ = $3.c; + if(!type && $3.t) { + // convert to "any" type, the register is untyped + $$ = abc_coerce_a($$); + } else { + // TODO: convert ints to strings etc. + } + $$ = abc_setlocal($$, i); +} + +/* ------------ control flow ------------------------- */ + +MAYBEELSE: %prec prec_none {$$ = code_new();} +MAYBEELSE: "else" CODEBLOCK {$$=$2;} +//MAYBEELSE: ';' "else" CODEBLOCK {$$=$3;} + +IF : "if" '(' {new_state();} EXPRESSION ')' CODEBLOCK MAYBEELSE { + $$=$4.c; + code_t*myjmp,*myif = $$ = abc_iffalse($$, 0); + + $$ = code_append($$, $6); + if($7) { + myjmp = $$ = abc_jump($$, 0); + } + myif->branch = $$ = abc_label($$); + if($7) { + $$ = code_append($$, $7); + myjmp->branch = $$ = abc_label($$); + } + old_state(); +} + +FOR_INIT : {$$=code_new();} +FOR_INIT : ASSIGNMENT | VARIABLE_DECLARATION | VOIDEXPRESSION + +FOR : "for" '(' {new_state();} FOR_INIT ';' EXPRESSION ';' VOIDEXPRESSION ')' CODEBLOCK { + $$ = $4; + code_t*loopstart = $$ = abc_label($$); + $$ = code_append($$, $6.c); + code_t*myif = $$ = abc_iffalse($$, 0); + $$ = code_append($$, $10); + $$ = code_append($$, $8); + $$ = abc_jump($$, loopstart); + $$ = abc_label($$); + myif->branch = $$; + old_state(); +} + +WHILE : "while" '(' {new_state();} EXPRESSION ')' CODEBLOCK { + code_t*myjmp = $$ = abc_jump(0, 0); + code_t*loopstart = $$ = abc_label($$); + $$ = code_append($$, $6); + myjmp->branch = $$ = abc_label($$); + $$ = code_append($$, $4.c); + $$ = abc_iftrue($$, loopstart); + old_state(); +} + +BREAK : "break" { + $$ = abc___break__(0); +} + +/* ------------ packages and imports ---------------- */ + +PACKAGE_DECLARATION : "package" MULTILEVELIDENTIFIER '{' {startpackage($2)} MAYBECODE '}' {endpackage()} +PACKAGE_DECLARATION : "package" '{' {startpackage(0)} MAYBECODE '}' {endpackage()} + +IMPORT : "import" PACKAGESPEC {addimport($2);} + +TYPE : PACKAGEANDCLASS {$$=$1;} + | '*' {$$=registry_getanytype();} + | "String" {$$=registry_getstringclass();} + | "int" {$$=registry_getintclass();} + | "uint" {$$=registry_getuintclass();} + | "Boolean" {$$=registry_getbooleanclass();} + | "Number" {$$=registry_getnumberclass();} MAYBETYPE: ':' TYPE {$$=$2;} -MAYBETYPE: {$$=empty_token();} +MAYBETYPE: {$$=0;} //FUNCTION_HEADER: NAMESPACE MODIFIERS T_FUNCTION GETSET T_IDENTIFIER '(' PARAMS ')' -FUNCTION_HEADER: MODIFIERS T_FUNCTION GETSET T_IDENTIFIER '(' PARAMS ')' +FUNCTION_HEADER: MODIFIERS "function" GETSET T_IDENTIFIER '(' PARAMS ')' MAYBETYPE -FUNCTION_DECLARATION: MODIFIERS T_FUNCTION GETSET T_IDENTIFIER '(' PARAMS ')' - MAYBETYPE '{' {startfunction(0,$1,$3,$4,$6,$8)} MAYBECODE '}' {endfunction()} -NAMESPACE_DECLARATION : MODIFIERS T_NAMESPACE T_IDENTIFIER -NAMESPACE_DECLARATION : MODIFIERS T_NAMESPACE T_IDENTIFIER '=' T_IDENTIFIER -NAMESPACE_DECLARATION : MODIFIERS T_NAMESPACE T_IDENTIFIER '=' T_STRING +NAMESPACE_DECLARATION : MODIFIERS KW_NAMESPACE T_IDENTIFIER +NAMESPACE_DECLARATION : MODIFIERS KW_NAMESPACE T_IDENTIFIER '=' T_IDENTIFIER +NAMESPACE_DECLARATION : MODIFIERS KW_NAMESPACE T_IDENTIFIER '=' T_STRING //NAMESPACE : {$$=empty_token();} //NAMESPACE : T_IDENTIFIER {$$=$1}; -CONSTANT : T_NUMBER -CONSTANT : T_STRING -CONSTANT : T_TRUE | T_FALSE -CONSTANT : T_NULL - -VAR : T_CONST | T_VAR - -// type annotation -// TODO: NAMESPACE +CONSTANT : T_BYTE {$$.c = abc_pushbyte(0, $1); + $$.c = abc_coerce2($$.c, registry_getintclass()); // FIXME + $$.t = TYPE_INT; + } +CONSTANT : T_SHORT {$$.c = abc_pushshort(0, $1); + $$.t = TYPE_INT; + } +CONSTANT : T_INT {$$.c = abc_pushint(0, $1); + $$.t = TYPE_INT; + } +CONSTANT : T_UINT {$$.c = abc_pushuint(0, $1); + $$.t = TYPE_UINT; + } +CONSTANT : T_FLOAT {$$.c = abc_pushdouble(0, $1); + $$.t = TYPE_FLOAT; + } +CONSTANT : T_STRING {$$.c = abc_pushstring(0, $1); + $$.t = TYPE_STRING; + } +CONSTANT : KW_TRUE {$$.c = abc_pushtrue(0); + $$.t = TYPE_BOOLEAN; + } +CONSTANT : KW_FALSE {$$.c = abc_pushfalse(0); + $$.t = TYPE_BOOLEAN; + } +CONSTANT : KW_NULL {$$.c = abc_pushnull(0); + $$.t = TYPE_NULL; + } + +USE_NAMESPACE : "use" "namespace" T_IDENTIFIER + + +EXPRESSION : E %prec prec_none /*precendence below '-x'*/ {$$ = $1;} +VOIDEXPRESSION : E %prec prec_none {$$=$1.c;/*calculate and discard*/$$=abc_pop($$);} + +E : CONSTANT +E : VAR_READ %prec T_IDENTIFIER {$$ = $1;} +E : NEW {$$.c = abc_pushundefined(0); /* FIXME */ + $$.t = TYPE_ANY; + } +E : T_REGEXP {$$.c = abc_pushundefined(0); /* FIXME */ + $$.t = TYPE_ANY; + } +E : FUNCTIONCALL +E : E '<' E {$$.c = code_append($1.c,$3.c);$$.c = abc_greaterequals($$.c);$$.c=abc_not($$.c); + $$.t = TYPE_BOOLEAN; + } +E : E '>' E {$$.c = code_append($1.c,$3.c);$$.c = abc_greaterthan($$.c); + $$.t = TYPE_BOOLEAN; + } +E : E "<=" E {$$.c = code_append($1.c,$3.c);$$.c = abc_greaterthan($$.c);$$.c=abc_not($$.c); + $$.t = TYPE_BOOLEAN; + } +E : E ">=" E {$$.c = code_append($1.c,$3.c);$$.c = abc_greaterequals($$.c); + $$.t = TYPE_BOOLEAN; + } +E : E "==" E {$$.c = code_append($1.c,$3.c);$$.c = abc_equals($$.c); + $$.t = TYPE_BOOLEAN; + } +E : E "===" E {$$.c = code_append($1.c,$3.c);$$.c = abc_strictequals($$.c); + $$.t = TYPE_BOOLEAN; + } +E : E "!=" E {$$.c = code_append($1.c,$3.c);$$.c = abc_equals($$.c);$$.c = abc_not($$.c); + $$.t = TYPE_BOOLEAN; + } + +E : E '-' E +E : E '/' E +E : E '+' E {$$.c = code_append($1.c,$3.c);$$.c = abc_add($$.c);$$.c=abc_coerce_a($$.c); + $$.t = join_types($1.t, $3.t, '+'); + } +E : E '%' E {$$.c = code_append($1.c,$3.c);$$.c = abc_modulo($$.c);$$.c=abc_coerce_a($$.c); + $$.t = join_types($1.t, $3.t, '%'); + } +E : E '*' E {$$.c = code_append($1.c,$3.c);$$.c = abc_multiply($$.c);$$.c=abc_coerce_a($$.c); + $$.t = join_types($1.t, $3.t, '*'); + } + +E : E "as" TYPE +E : E "is" TYPE +E : '(' E ')' {$$=$2;} +E : '-' E {$$=$2;} + +E : LH "+=" E {$$.c = $1.read;$$.c=code_append($$.c,$3.c);$$.c=abc_add($$.c); + $$.c=abc_coerce2($$.c, registry_getintclass()); // FIXME + $$.c=abc_dup($$.c);$$.c=code_append($$.c,$1.write); + $$.t = $1.type; + } +E : LH "-=" E {$$.c = $1.read;$$.c=code_append($$.c,$3.c);$$.c=abc_add($$.c); + $$.c=abc_coerce2($$.c, registry_getintclass()); // FIXME + $$.c=abc_dup($$.c);$$.c=code_append($$.c,$1.write); + $$.t = $1.type; + } + +// TODO: use inclocal where appropriate +E : LH "++" {$$.c = $1.read;$$.c=abc_increment($$.c); + $$.c=abc_coerce2($$.c, registry_getintclass()); //FIXME + $$.c=abc_dup($$.c);$$.c=code_append($$.c,$1.write); + $$.t = $1.type; + } +E : LH "--" {$$.c = $1.read;$$.c=abc_decrement($$.c); + $$.c=abc_coerce2($$.c, registry_getintclass()); //FIXME + $$.c=abc_dup($$.c);$$.c=code_append($$.c,$1.write); + $$.t = $1.type; + } + +LH: T_IDENTIFIER { + int i = find_variable($1->text, &$$.type); + $$.read = abc_getlocal(0, i); + $$.write = abc_setlocal(0, i); +} -VARIABLE_DECLARATION : MODIFIERS VAR T_IDENTIFIER MAYBETYPE { - int i = newvariable($1,$2,$3,$4); +NEW : "new" T_IDENTIFIER {$$.c=0;$$.t=0;/*FIXME*/} + | "new" T_IDENTIFIER '(' ')' {$$.c=0;$$.t=0;/*FIXME*/} + | "new" T_IDENTIFIER '(' EXPRESSION_LIST ')' {$$.c=0;$$.t=0;/*FIXME*/} + +FUNCTIONCALL : T_IDENTIFIER '(' MAYBE_EXPRESSION_LIST ')' { + /* TODO: use abc_call (for calling local variables), + abc_callstatic (for calling own methods) */ + $$.c = code_new(); + $$.c = abc_findpropstrict($$.c, $1->text); + typedcode_list_t*l = $3; + // push parameters on stack + int len = 0; + while(l) { + $$.c = code_append($$.c, l->typedcode.c); + l = l->nxt; + len ++; + } + $$.c = abc_callproperty($$.c, $1->text, len); } -VARIABLE_DECLARATION : MODIFIERS VAR T_IDENTIFIER MAYBETYPE '=' EXPRESSION { - int i = newvariable($1,$2,$3,$4); - //setvariable(i,$6); + +MAYBE_EXPRESSION_LIST : {$$=0;} +MAYBE_EXPRESSION_LIST : EXPRESSION_LIST +EXPRESSION_LIST : EXPRESSION {$$=malloc(sizeof(typedcode_list_t)); + $$->nxt = 0; + $$->typedcode = $1;} +EXPRESSION_LIST : EXPRESSION_LIST ',' EXPRESSION {$$=malloc(sizeof(typedcode_list_t)); + $$->nxt = $1; + $$->typedcode = $3; + } + +VAR_READ : T_IDENTIFIER { + int i = find_variable($1->text, &$$.t); + $$.c = abc_getlocal(0, i); } -// operator prescendence: -// http://livedocs.adobe.com/flash/9.0/main/wwhelp/wwhimpl/common/html/wwhelp.htm?context=LiveDocs_Parts&file=00000012.html -EXPRESSION : EXPRESSION '<' EXPRESSION -EXPRESSION : EXPRESSION '>' EXPRESSION -EXPRESSION : EXPRESSION "<=" EXPRESSION -EXPRESSION : EXPRESSION ">=" EXPRESSION -EXPRESSION : EXPRESSION "==" EXPRESSION -EXPRESSION : EXPRESSION '+' TERM -EXPRESSION : EXPRESSION '-' TERM -EXPRESSION : TERM -EXPRESSION : '-' TERM -TERM : TERM '*' FACTOR -TERM : TERM '/' FACTOR -TERM : EMOD -EMOD: FACTOR "++" -EMOD: FACTOR "--" -EMOD: FACTOR -FACTOR : '(' EXPRESSION ')' -FACTOR : CONSTANT -FACTOR : VARIABLE -FACTOR : FUNCTIONCALL -FACTOR : T_REGEXP -FACTOR : NEW -FACTOR : IS -FACTOR : AS - -IS : EXPRESSION T_IS TYPE -AS : EXPRESSION T_AS TYPE -NEW : T_NEW T_IDENTIFIER | T_NEW T_IDENTIFIER '(' ')' -NEW : T_NEW T_IDENTIFIER '(' EXPRESSIONLIST ')' - -FUNCTIONCALL : VARIABLE '(' EXPRESSIONLIST ')' -FUNCTIONCALL : VARIABLE '(' ')' - -EXPRESSIONLIST : EXPRESSION -EXPRESSIONLIST : EXPRESSION ',' EXPRESSIONLIST - -VARIABLE : T_IDENTIFIER -VARIABLE : VARIABLE '.' T_IDENTIFIER -VARIABLE : VARIABLE ".." T_IDENTIFIER // descendants -VARIABLE : VARIABLE "::" VARIABLE // namespace declaration -VARIABLE : VARIABLE "::" '[' EXPRESSION ']' // qualified expression -VARIABLE : VARIABLE '[' EXPRESSION ']' // unqualified expression - -ASSIGNMENT : VARIABLE '=' EXPRESSION -NEW_ASSIGNMENT : T_VAR VARIABLE MAYBETYPE '=' EXPRESSION - -FOR : T_FOR '(' NEW_ASSIGNMENT ';' EXPRESSION ';' EXPRESSION ')' '{' MAYBECODE '}' -FOR : T_FOR '(' ASSIGNMENT ';' EXPRESSION ';' EXPRESSION ')' '{' MAYBECODE '}' - -USE : T_USE T_NAMESPACE T_IDENTIFIER +//VARIABLE : T_IDENTIFIER +//VARIABLE : VARIABLE '.' T_IDENTIFIER +//VARIABLE : VARIABLE ".." T_IDENTIFIER // descendants +//VARIABLE : VARIABLE "::" VARIABLE // namespace declaration +//VARIABLE : VARIABLE "::" '[' EXPRESSION ']' // qualified expression +//VARIABLE : VARIABLE '[' EXPRESSION ']' // unqualified expression // keywords which also may be identifiers -X_IDENTIFIER : T_IDENTIFIER | T_PACKAGE +X_IDENTIFIER : T_IDENTIFIER | KW_PACKAGE PACKAGESPEC : PACKAGESPEC '.' PACKAGESPEC {if($1->text[0]=='*') syntaxerror("wildcard in the middle of path"); $$ = concat3($1,$2,$3);} PACKAGESPEC : X_IDENTIFIER {$$=$1;} PACKAGESPEC : '*' {$$=$1;} -GETSET : T_GET {$$=$1;} - | T_SET {$$=$1;} +GETSET : "get" {$$=$1;} + | "set" {$$=$1;} | {$$=empty_token();} -CLASS_DECLARATION : MODIFIERS T_CLASS T_IDENTIFIER EXTENDS IMPLEMENTS_LIST '{' {startclass($1,$3,$4,$5);} MAYBE_DECLARATION_LIST '}' {endclass();} -INTERFACE_DECLARATION : MODIFIERS T_INTERFACE T_IDENTIFIER EXTENDS_LIST '{' MAYBE_IDECLARATION_LIST '}' +CLASS_DECLARATION : MODIFIERS "class" T_IDENTIFIER EXTENDS IMPLEMENTS_LIST '{' {startclass($1,$3,$4,$5);} MAYBE_DECLARATION_LIST '}' {endclass();} +INTERFACE_DECLARATION : MODIFIERS "interface" T_IDENTIFIER EXTENDS_LIST '{' MAYBE_IDECLARATION_LIST '}' PARAMS: {$$=empty_token();} PARAMS: PARAM_LIST {$$=$1;} @@ -496,7 +941,7 @@ MODIFIERS : {$$=empty_token();} MODIFIERS : MODIFIER_LIST {$$=$1} MODIFIER_LIST : MODIFIER MODIFIER_LIST {extend($2,$1);$$=$2;} MODIFIER_LIST : MODIFIER {$$=empty_token();extend($$,$1);} -MODIFIER : T_PUBLIC | T_PRIVATE | T_PROTECTED | T_STATIC | T_DYNAMIC | T_FINAL | T_OVERRIDE | T_NATIVE | T_INTERNAL +MODIFIER : KW_PUBLIC | KW_PRIVATE | KW_PROTECTED | KW_STATIC | KW_DYNAMIC | KW_FINAL | KW_OVERRIDE | KW_NATIVE | KW_INTERNAL DECLARATION : VARIABLE_DECLARATION DECLARATION : FUNCTION_DECLARATION @@ -504,23 +949,28 @@ DECLARATION : FUNCTION_DECLARATION IDECLARATION : VARIABLE_DECLARATION IDECLARATION : FUNCTION_DECLARATION -IMPLEMENTS_LIST : {$$=empty_token();} -IMPLEMENTS_LIST : T_IMPLEMENTS MIDENTIFIER_LIST {$$=$2;} +IMPLEMENTS_LIST : {$$=list_new();} +IMPLEMENTS_LIST : KW_IMPLEMENTS PACKAGEANDCLASS_LIST {$$=$2;} -EXTENDS : {$$=empty_token();} -EXTENDS : T_EXTENDS MULTILEVELIDENTIFIER {$$=$2;} +EXTENDS : {$$=registry_getobjectclass();} +EXTENDS : KW_EXTENDS PACKAGEANDCLASS {$$=$2;} -EXTENDS_LIST : {$$=empty_token();} -EXTENDS_LIST : T_EXTENDS MIDENTIFIER_LIST {$$=$2;} +EXTENDS_LIST : {$$=list_new();} +EXTENDS_LIST : KW_EXTENDS PACKAGEANDCLASS_LIST {$$=$2;} //IDENTIFIER_LIST : T_IDENTIFIER ',' IDENTIFIER_LIST {extend($3,$1);$$=$3;} //IDENTIFIER_LIST : T_IDENTIFIER {$$=empty_token();extend($$,$1);} -MULTILEVELIDENTIFIER : T_IDENTIFIER {$$=empty_token();extend($$,$1);} -MULTILEVELIDENTIFIER : MULTILEVELIDENTIFIER '.' X_IDENTIFIER {extend_s($1,".",$3);$$=$1;} +PACKAGEANDCLASS : T_IDENTIFIER {$$ = registry_findclass(state->package, $1->text);} +PACKAGEANDCLASS : PACKAGE '.' T_IDENTIFIER {$$ = registry_findclass($1->text, $3->text);} +PACKAGE : X_IDENTIFIER +PACKAGE : PACKAGE '.' X_IDENTIFIER {$$=$1;extend_s($$,".",$3);} + +MULTILEVELIDENTIFIER : MULTILEVELIDENTIFIER '.' X_IDENTIFIER {$$=$1;extend_s($$, ".", $3)} +MULTILEVELIDENTIFIER : T_IDENTIFIER {$$=$1;extend($$,$1)}; -MIDENTIFIER_LIST : MULTILEVELIDENTIFIER {$$=empty_token();extend($$,$1);} -MIDENTIFIER_LIST : MIDENTIFIER_LIST ',' MULTILEVELIDENTIFIER {extend($1,$3);$$=$1;} +PACKAGEANDCLASS_LIST : PACKAGEANDCLASS {$$=list_new();list_append($$, $1);} +PACKAGEANDCLASS_LIST : PACKAGEANDCLASS_LIST ',' PACKAGEANDCLASS {$$=$1;list_append($$,$3);} MAYBE_DECLARATION_LIST : MAYBE_DECLARATION_LIST : DECLARATION_LIST @@ -532,76 +982,7 @@ MAYBE_IDECLARATION_LIST : IDECLARATION_LIST IDECLARATION_LIST : IDECLARATION IDECLARATION_LIST : IDECLARATION_LIST FUNCTION_HEADER +// chapter 14 // keywords: as break case catch class const continue default delete do else extends false finally for function if implements import in instanceof interface internal is native new null package private protected public return super switch this throw to true try typeof use var void while with // syntactic keywords: each get set namespace include dynamic final native override static -// chapter 14 - -%% - -#ifdef MAIN - -#include -#include -#include -#include - -void test_lexer() -{ - while(1) { - int token = yylex(); - if(token==T_EOF) - break; - if(token>=32 && token<256) { - printf("'%c'\n", token); - } else { - printf("%s\n", token2string(avm2_lval)); - } - } -} - -int main(int argn, char*argv[]) -{ - //FILE*fi = fopen("/home/kramm/c/flex/text.as", "rb"); - char*filename = "include.as"; - char buf[512]; - if(argn>1) - filename=argv[1]; - - add_include_dir(getcwd(buf, 512)); - char*fullfilename = enter_file(filename, 0); - - FILE*fi = fopen(fullfilename, "rb"); - if(!fi) { - perror(fullfilename); - return 1; - } - initialize_state(); - avm2_set_in(fi); - - if(argn>2 && !strcmp(argv[2], "-lex")) { - test_lexer(); - return 0; - } - avm2_parse(); - - finalize_state(); - - SWF swf; - memset(&swf, 0, sizeof(swf)); - swf.fileVersion = 9; - swf.frameRate = 0x2500; - swf.movieSize.xmin = swf.movieSize.ymin = 0; - swf.movieSize.xmax = 1024*20; - swf.movieSize.ymax = 768*20; - TAG*tag = swf.firstTag = swf_InsertTag(0, ST_DOABC); - swf_WriteABC(tag, state->file); - swf_InsertTag(tag, ST_END); - - int f = open("abc.swf",O_RDWR|O_CREAT|O_TRUNC|O_BINARY,0644); - swf_WriteSWF(f,&swf); - close(f); - - return 0; -} -#endif