This shows you the differences between two versions of the page.
|
alf:teme:tema4_en [2020/04/21 17:56] alexandru.radovici |
alf:teme:tema4_en [2020/04/25 12:15] (current) alexandru.radovici |
||
|---|---|---|---|
| Line 54: | Line 54: | ||
| <code javascript> | <code javascript> | ||
| { | { | ||
| - | symbol_table: [...], // the symbol_table | + | symbol_table: {...}, // the symbol_table |
| - | ast: {...}, // the ast with the type for every node that returns a value | + | ast: [...], // the ast with the type for every node that returns a value |
| - | error_list: [] // the error list | + | errors: [] // the error list |
| } | } | ||
| </code> | </code> | ||
| Line 62: | Line 62: | ||
| ===== Symbol table ===== | ===== Symbol table ===== | ||
| - | The symbol table is an array of context objects. | + | The symbol table is represented by a JavaScript object, where each property is the name of a context. In the example below you |
| + | can see there are two contexts: | ||
| + | * //script// - the context for the main script | ||
| + | * //function_sum// - the context generated by the `sum` function | ||
| <code javascript> | <code javascript> | ||
| - | [ | + | { |
| - | // context object id 0 - the context of the main script | + | "script": { |
| - | { | + | "type": "script", |
| - | ... | + | "variables": {}, |
| - | }, | + | "functions": { |
| - | // context object id 1 - the context object of a function | + | "sum": { |
| - | { | + | "type": "int", |
| - | ... | + | "parameters": [ |
| - | }, | + | { |
| - | ... | + | "type": "int", |
| - | ] | + | "title": "n1", |
| + | "line": 4 | ||
| + | }, | ||
| + | { | ||
| + | "type": "int", | ||
| + | "title": "n2", | ||
| + | "line": 4 | ||
| + | } | ||
| + | ], | ||
| + | "line": 4 | ||
| + | } | ||
| + | }, | ||
| + | "types": {} | ||
| + | }, | ||
| + | "function_sum": { | ||
| + | "title": "sum", | ||
| + | "type": "function", | ||
| + | "parent": "script", | ||
| + | "variables": { | ||
| + | "n1": { | ||
| + | "type": "int", | ||
| + | "parameter": true, | ||
| + | "index": 0 | ||
| + | }, | ||
| + | "n2": { | ||
| + | "type": "int", | ||
| + | "parameter": true, | ||
| + | "index": 1 | ||
| + | } | ||
| + | }, | ||
| + | "functions": {}, | ||
| + | "types": {} | ||
| + | } | ||
| + | } | ||
| </code> | </code> | ||
| - | While determining the symbol table, add to each AST node a parameter //symbol// with the value of the its context id. | + | |
| + | While determining the symbol table, add to each AST node a parameter //symbol_table// with the name of the symbol table in which it | ||
| + | has its variables, functions and types. | ||
| ==== Context Object ==== | ==== Context Object ==== | ||
| Line 84: | Line 122: | ||
| * the variable declared in that context | * the variable declared in that context | ||
| * the function declared in that context | * the function declared in that context | ||
| - | * the struct declared in that context | + | * the types (array, struct) declared in that context |
| - | * the parent context id (position in the symbol_table array) | + | * the parent context name |
| - | * the type of the context (module or message) | + | * the type of the context (`script`, `statements` or `function`) |
| - | * the name of the function whose context it is (unless this is not the module) | + | * the title of the function whose context it is (if the context type is `function`) |
| - | * the name of the struct which context it is (unless this is not the module) | + | |
| - | * the type of the return value of the function which context it is (unless this is not the script) | + | |
| <note> | <note> | ||
| Line 95: | Line 131: | ||
| * the main module | * the main module | ||
| * a function definition | * a function definition | ||
| - | * a struct | + | * an if definition |
| + | * a for definition | ||
| + | * a loop when and loop go definition | ||
| </note> | </note> | ||
| Line 105: | Line 143: | ||
| "type": // type of the variable | "type": // type of the variable | ||
| "line": // the line where the variable was declared | "line": // the line where the variable was declared | ||
| + | "parameter": //true if this is a function parameter, false otherwise | ||
| "value": // the expression that the variable initially has (optional, if the define was with an assignment) | "value": // the expression that the variable initially has (optional, if the define was with an assignment) | ||
| } | } | ||
| }, | }, | ||
| "functions": { // a dictionary of functions | "functions": { // a dictionary of functions | ||
| - | "function_name": { | + | "function_title": { |
| "type": // the return type of the function | "type": // the return type of the function | ||
| "parameters": [] // the list of parameters the function takes (the parameters node from the AST) | "parameters": [] // the list of parameters the function takes (the parameters node from the AST) | ||
| "line": // the line where the function was declared | "line": // the line where the function was declared | ||
| - | "symbol": // the context object id that the function creates | ||
| } | } | ||
| Line 119: | Line 157: | ||
| "types": { // a dictionary of types | "types": { // a dictionary of types | ||
| "type": { | "type": { | ||
| - | "type": // the type of the new type class or array | + | "type": // the type of the new type struct or array |
| "line": // the line where the type was declared | "line": // the line where the type was declared | ||
| // for array | // for array | ||
| "elements_type": // the type of each array element | "elements_type": // the type of each array element | ||
| - | "from": // the first index | + | "first": // the first index |
| - | "to": // the last index | + | "length": // the number of elements in the array |
| // for struct | // for struct | ||
| - | "elements": [ // a list of array elements (the node from the AST) | + | "properties": [ // a list of array elements (the node from the AST) |
| { | { | ||
| "type": | "type": | ||
| - | "id": | + | "title": |
| + | "value": // the expression that the variable initially has (optional, if the define was with an assignment) | ||
| "line": | "line": | ||
| + | "symbol_table": // the context title where the structure was defined | ||
| }, | }, | ||
| ... | ... | ||
| Line 136: | Line 176: | ||
| } | } | ||
| }, | }, | ||
| - | "parent": 0, // the parent context position in the symbol_table (except of the main script that has no parent), usually 0, | + | "parent": // the parent context name in the symbol_table (except for the main script, which has no parent) |
| - | "type": // the type of the | + | "type": // the type of the context (script, function or statements) |
| - | "function": // the function name if this is a function context | + | |
| - | "struct": // the struct name if the context is in a function that is in a struct | + | |
| - | "return_value": // the return type of the function if this is a function context | + | |
| } | } | ||
| </code> | </code> | ||
| - | === Exemple === | + | |
| + | ==== Context names ==== | ||
| + | * ''script'' - script | ||
| + | * ''function'' - function_''title'' | ||
| + | * ''if_then'' - if_''line_where_the_if_then_was_defined'' | ||
| + | * ''loop_when'' - do_while_''line_where_the_loop_when_was_defined'' | ||
| + | * ''loop_go'' - while_''line_where_the_loop_go_was_defined'' | ||
| + | |||
| + | ===== The new AST ===== | ||
| + | The AST from the parser has to be transformed so that it does not contain any variable, function or type definitions. | ||
| + | |||
| + | The new AST is a list of objects, each object being either the script or a function. | ||
| <code javascript> | <code javascript> | ||
| - | { | + | [ |
| - | "variables": { | + | // the script |
| - | "s": { | + | "script": { |
| - | "type": "school", | + | statements: [ |
| - | "line": 8 | + | ... |
| - | } | + | ] |
| - | }, | + | }, |
| - | "functions": {}, | + | // a function |
| - | "types": { | + | "function_title": { |
| - | "school": { | + | statements: [ |
| - | "type": "struct", | + | ... |
| - | "line": 6, | + | ] |
| - | "elements": [ | + | } |
| - | { | + | ] |
| - | "type": "int", | + | |
| - | "id": "type", | + | |
| - | "line": 5 | + | |
| - | }, | + | |
| - | { | + | |
| - | "type": "bool", | + | |
| - | "id": "private", | + | |
| - | "line": 4 | + | |
| - | }, | + | |
| - | { | + | |
| - | "type": "string", | + | |
| - | "id": "name", | + | |
| - | "line": 3 | + | |
| - | } | + | |
| - | ] | + | |
| - | } | + | |
| - | } | + | |
| - | } | + | |
| </code> | </code> | ||
| + | |||
| + | ==== Variable definitions ==== | ||
| + | The variable definitions will be written to the symbol table. The definition will be deleted from the AST (it will not be placed in the | ||
| + | statements, as it has no actual action). If the definition is with an attribution ''@var x:int <- 7;'', it will be replaced with | ||
| + | an attribution node equivalent to ''x <- 7;''. | ||
| + | |||
| + | ==== Type definitions ==== | ||
| + | Structs and vectors are type definitions. These will be written to the ''types'' part in the symbol table. | ||
| + | |||
| + | For structs, if the properties have default values, every struct variable declaration will be replaced with attributions for | ||
| + | all the properties. There is an [[https://github.com/UPB-FILS/alf/blob/master/Devoir/semantic/verify/semantic/4_struct/definition_with_values_and_variable.alf|example]] in the repository. | ||
| ===== Verify Types in the AST ===== | ===== Verify Types in the AST ===== | ||
| Line 188: | Line 230: | ||
| * return | * return | ||
| * element_of_vector | * element_of_vector | ||
| - | * prop | + | * property |
| - | * dispatch | + | * function_call |
| + | |||
| + | All the other elements have the return type ''none''. If there is a type error (e.g. float * string), it will be ''error''. | ||
| Set the type by adding a parameter type in the node. | Set the type by adding a parameter type in the node. | ||
| Line 195: | Line 239: | ||
| <note> | <note> | ||
| When searching for a variable, the algorithm is: | When searching for a variable, the algorithm is: | ||
| - | * if it is a function context, search the local variables | + | * search the local context |
| - | * if not found, search the parameters | + | * if not found, search the parent context |
| - | * if not found, search the struct context local variables | + | |
| - | + | ||
| - | * if it is the module context, search the global variables | + | |
| </note> | </note> | ||
| === Example === | === Example === | ||
| <code javascript> | <code javascript> | ||
| - | { | + | { |
| - | "id": "expr", | + | "id": "expr", |
| - | "op": "=", | + | "op": "+", |
| - | "left": { | + | "left": { |
| - | "id": "expr", | + | "id": "value", |
| - | "op": "mod", | + | "type": "int", |
| - | "left": { | + | "value": 2, |
| - | "id": "identifier", | + | "line": 3, |
| - | "value": "n", | + | "symbol_table": "script" |
| - | "line": 8, | + | }, |
| - | "symbol": 1, | + | "right": { |
| - | "type": "int" | + | "id": "value", |
| - | }, | + | "type": "int", |
| - | "right": { | + | "value": 3, |
| - | "id": "identifier", | + | "line": 3, |
| - | "value": "i", | + | "symbol_table": "script" |
| - | "line": 8, | + | }, |
| - | "symbol": 1, | + | "line": 3, |
| - | "type": "int" | + | "symbol_table": "script", |
| - | }, | + | "type": "int" |
| - | "line": 8, | + | |
| - | "symbol": 1, | + | |
| - | "t": "int" | + | |
| - | }, | + | |
| - | "right": { | + | |
| - | "id": "value", | + | |
| - | "type": "int", | + | |
| - | "value": 0, | + | |
| - | "line": 8, | + | |
| - | "symbol": 1 | + | |
| - | }, | + | |
| - | "line": 8, | + | |
| - | "symbol": 1, | + | |
| - | "type": "bool" | + | |
| } | } | ||
| </code> | </code> | ||
| Line 271: | Line 298: | ||
| { | { | ||
| type: // string with the error type | type: // string with the error type | ||
| - | line: // the line number in the source (starting at 1) | + | elements: { |
| - | elements: // items for the error, each type of error has different items | + | // items for the error, each type of error has different items |
| + | line: // the line where the error is | ||
| + | }, | ||
| text: // the error text message | text: // the error text message | ||
| } | } | ||
| </code> | </code> | ||
| + | |||
| ==== Error type ==== | ==== Error type ==== | ||
| Line 286: | Line 316: | ||
| <code javascript> | <code javascript> | ||
| { | { | ||
| - | variable: // variable name | + | variable: // variable name, |
| } | } | ||
| </code> | </code> | ||
| Line 310: | Line 340: | ||
| </code> | </code> | ||
| - | === STRUCT_ELEMENT_ALREADY_DEFINED === | + | === STRUCT_PROPERTY_ALREADY_DEFINED === |
| The error occurs when a struct element definition is repeated. | The error occurs when a struct element definition is repeated. | ||
| == Elements == | == Elements == | ||
| { | { | ||
| - | struct: // struct type name | + | type: // struct type title |
| - | element: // element name | + | title: // property title |
| } | } | ||
| Line 325: | Line 355: | ||
| <code javascript> | <code javascript> | ||
| { | { | ||
| - | vector: // array type name | + | array: // array type name |
| - | low_index: // the lower index value | + | length: // the negative length |
| - | high_index: // the higher index value | + | |
| } | } | ||
| </code> | </code> | ||
| Line 340: | Line 369: | ||
| variable: // the name of the variable with the unresolved type | variable: // the name of the variable with the unresolved type | ||
| } | } | ||
| - | // struct element | + | // struct property |
| { | { | ||
| struct: // name of struct type | struct: // name of struct type | ||
| - | element: // name of struct element with the unresolved type | + | property: // name of struct element with the unresolved type |
| } | } | ||
| </code> | </code> | ||
| - | === UNDEFINED_MESSAGE === | + | === UNDEFINED_FUNCTION === |
| - | The error occurs when a function call is made to a function that is not defned. | + | The error occurs when a function call is made to a function that is not defined. |
| == Elements == | == Elements == | ||
| <code javascript> | <code javascript> | ||
| { | { | ||
| - | id: // message name | + | title: // function title |
| } | } | ||
| </code> | </code> | ||
| Line 364: | Line 393: | ||
| <code javascript> | <code javascript> | ||
| { | { | ||
| - | variable: // variable name | + | variable: // variable title |
| } | } | ||
| </code> | </code> | ||
| Line 373: | Line 402: | ||
| == Elements == | == Elements == | ||
| { | { | ||
| - | variable: // the variable that has that type | + | value: // the type that is undefined |
| - | type: // the type that is undefined | + | |
| } | } | ||
| Line 383: | Line 411: | ||
| <code javascript> | <code javascript> | ||
| { | { | ||
| - | struct: // struct name | + | type: // struct title |
| - | property: // element name | + | title: // property title |
| } | } | ||
| </code> | </code> | ||
| Line 408: | Line 436: | ||
| </code> | </code> | ||
| === ARRAY_INDEX_TYPE === | === ARRAY_INDEX_TYPE === | ||
| - | The error occurs when an index for an array is not a number or symbol | + | The error occurs when an index for an array is not an int |
| == Elements == | == Elements == | ||
| <code javascript> | <code javascript> | ||
| { | { | ||
| - | vector: // array type | + | type: // the index type |
| - | index: // supplied index type | + | |
| } | } | ||
| </code> | </code> | ||
| Line 449: | Line 476: | ||
| op: // if, while, repeat | op: // if, while, repeat | ||
| } | } | ||
| - | // for | + | // attribution (including for variable) |
| { | { | ||
| - | exp: // expression type | + | to: // to type, |
| - | op: "for" | + | op: "<-", |
| - | element: // variable, from, to or step | + | from: // from type |
| } | } | ||
| - | // value_of_function | + | // return |
| { | { | ||
| - | op: "value" | + | op: "return" |
| to: // return type | to: // return type | ||
| from: // provided type | from: // provided type | ||
| } | } | ||
| - | // is | + | // iteration (for i in exp go) |
| { | { | ||
| - | op: "is" | + | op: "iteration" |
| - | to: // to type | + | value: // the exp type |
| - | from: // from type | + | |
| } | } | ||
| - | // struct element type is undefined | + | // typecast |
| { | { | ||
| - | struct: // struct type, | + | op: "typecast", |
| - | element: // name of struct element | + | to: // to type, |
| + | from: // from type | ||
| } | } | ||
| - | // variable type is undefined | ||
| - | { | ||
| - | variable: // name of the variable | ||
| - | } | ||
| </code> | </code> | ||
| === LEXICAL === | === LEXICAL === | ||