X-Git-Url: https://code.kerkeslager.com/?p=fur;a=blobdiff_plain;f=transformation.py;h=7d47ed494100f2f8673f3b11e261b2418fd206ba;hp=67fd73cca88355a8db4dd94f6ce63e1fee0c0a2a;hb=b47a0017d1dbfda8e8bae7989fff9ccb31897a28;hpb=e0873511cc1425343bb70545571406b25b9cf5d9 diff --git a/transformation.py b/transformation.py index 67fd73c..7d47ed4 100644 --- a/transformation.py +++ b/transformation.py @@ -1,6 +1,7 @@ import collections -import parsing +import normalization +import parsing # TODO Remove this import, as we should be normalizing everything before it gets here CIntegerLiteral = collections.namedtuple( 'CIntegerLiteral', @@ -12,14 +13,15 @@ CIntegerLiteral = collections.namedtuple( CStringLiteral = collections.namedtuple( 'CStringLiteral', [ + 'index', 'value', ], ) -CConstantExpression = collections.namedtuple( - 'CConstantExpression', +CVariableExpression = collections.namedtuple( + 'CVariableExpression', [ - 'value' + 'variable', ], ) @@ -31,6 +33,24 @@ CSymbolExpression = collections.namedtuple( ], ) +CStructureLiteralExpression = collections.namedtuple( + 'CStructureLiteralExpression', + [ + 'field_count', + 'symbol_list_variable', + 'value_list_variable', + ], +) + +CDotExpression = collections.namedtuple( + 'CDotExpression', + [ + 'instance', + 'symbol', + 'symbol_list_index', + ], +) + CNegationExpression = collections.namedtuple( 'CNegationExpression', [ @@ -41,22 +61,29 @@ CNegationExpression = collections.namedtuple( CFunctionCallForFurInfixOperator = collections.namedtuple( 'CFunctionCallForFurInfixOperator', [ + 'metadata', 'name', - 'left', - 'right', ], ) +CPushStatement = collections.namedtuple( + 'CPushStatement', + ( + 'expression', + ), +) + CFunctionCallExpression = collections.namedtuple( 'CFunctionCallExpression', [ - 'name', - 'arguments', + 'function_expression', + 'argument_count', ], ) -CAssignmentStatement = collections.namedtuple( - 'CAssignmentStatement', +# TODO We are currently not changing variables, just preventing them from being accessed. +CSymbolAssignmentStatement = collections.namedtuple( + 'CSymbolAssignmentStatement', [ 'target', 'target_symbol_list_index', @@ -64,155 +91,360 @@ CAssignmentStatement = collections.namedtuple( ], ) +CArrayVariableInitializationStatement = collections.namedtuple( + 'CArrayVariableInitializationStatement', + [ + 'variable', + 'items', + ], +) + +CSymbolArrayVariableInitializationStatement = collections.namedtuple( + 'CSymbolArrayVariableInitializationStatement', + [ + 'variable', + 'symbol_list', + 'symbol_list_indices', + ], +) + +CVariableInitializationStatement = collections.namedtuple( + 'CVariableInitializationStatement', + [ + 'variable', + 'expression', + ], +) + +CVariableReassignmentStatement = collections.namedtuple( + 'CVariableReassignmentStatement', + [ + 'variable', + 'expression', + ], +) + +CExpressionStatement = collections.namedtuple( + 'CExpressionStatement', + [ + 'expression', + ], +) + +CIfElseStatement = collections.namedtuple( + 'CIfElseStatement', + [ + 'condition_expression', + 'if_statement_list', + 'else_statement_list', + ], +) + +CFunctionDeclaration = collections.namedtuple( + 'CFunctionDeclaration', + [ + 'name', + ], +) + +# TODO If a function definition doesn't end with an expression, we have issues currently because we try to return statement. +# TODO Closures currently wrap entire defining environment, even symbols that are not used, which makes garbage collection ineffective. +CFunctionDefinition = collections.namedtuple( + 'CFunctionDefinition', + [ + 'name', + 'argument_name_list', + 'statement_list', + ], +) + CProgram = collections.namedtuple( 'CProgram', [ 'builtin_set', + 'function_definition_list', + 'operator_declarations', 'statements', 'standard_libraries', + 'string_literal_list', 'symbol_list', ], ) -EQUALITY_LEVEL_OPERATOR_TO_FUNCTION_NAME_MAPPING = { - '==': 'equals', - '!=': 'notEquals', - '<=': 'lessThanOrEqual', - '>=': 'greaterThanOrEqual', - '<': 'lessThan', - '>': 'greaterThan', +BUILTINS = { + 'concatenate': [], + 'false': [], + 'pow': ['math.h'], + 'print': ['stdio.h'], + 'true': [], } -def transform_equality_level_expression(accumulators, expression): - # Transform expressions like 1 < 2 < 3 into expressions like 1 < 2 && 2 < 3 - if isinstance(expression.left, parsing.FurInfixExpression) and expression.left.order == 'equality_level': - left = transform_equality_level_expression( - accumulators, - expression.left - ) +def transform_variable_expression(accumulators, expression): + assert isinstance(expression, normalization.NormalVariableExpression) + return CVariableExpression(variable=expression.variable) - middle = left.right +def transform_string_literal_expression(accumulators, expression): + value = expression.string - right = transform_expression( - accumulators, - expression.right, - ) - - # TODO Don't evaluate the middle expression twice - return CFunctionCallForFurInfixOperator( - name='and', - left=left, - right=CFunctionCallForFurInfixOperator( - name=EQUALITY_LEVEL_OPERATOR_TO_FUNCTION_NAME_MAPPING[expression.operator], - left=middle, - right=right, - ), - ) + try: + index = accumulators.string_literal_list.index(value) + except ValueError: + index = len(accumulators.string_literal_list) + accumulators.string_literal_list.append(value) - return CFunctionCallForFurInfixOperator( - name=EQUALITY_LEVEL_OPERATOR_TO_FUNCTION_NAME_MAPPING[expression.operator], - left=transform_expression(accumulators, expression.left), - right=transform_expression(accumulators, expression.right), + return CStringLiteral(index=index, value=value) + +def transform_symbol_expression(accumulators, expression): + if expression.symbol in BUILTINS: + accumulators.builtin_set.add(expression.symbol) + + try: + symbol_list_index = accumulators.symbol_list.index(expression.symbol) + except ValueError: + symbol_list_index = len(accumulators.symbol_list) + accumulators.symbol_list.append(expression.symbol) + + return CSymbolExpression( + symbol=expression.symbol, + symbol_list_index=symbol_list_index, ) -BUILTINS = { - 'false': [], - 'pow': ['math.h'], - 'print': ['stdio.h'], - 'true': [], +CInfixDeclaration = collections.namedtuple( + 'CInfixDeclaration', + [ + 'name', + 'in_type', + 'out_type', + 'operator', + ], +) + +FUR_INFIX_OPERATOR_TO_C_FUNCTION = { + '++': 'concatenate', } +FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR = { + '+': CInfixDeclaration(name='add', in_type='integer', out_type='integer', operator='+'), + '-': CInfixDeclaration(name='subtract', in_type='integer', out_type='integer', operator='-'), + '*': CInfixDeclaration(name='multiply', in_type='integer', out_type='integer', operator='*'), + '//': CInfixDeclaration(name='integerDivide', in_type='integer', out_type='integer', operator='/'), + '%': CInfixDeclaration(name='modularDivide', in_type='integer', out_type='integer', operator='%'), + 'and': CInfixDeclaration(name='and', in_type='boolean', out_type='boolean', operator='&&'), + 'or': CInfixDeclaration(name='or', in_type='boolean', out_type='boolean', operator='||'), + '==': CInfixDeclaration(name='equals', in_type='integer', out_type='boolean', operator='=='), + '!=': CInfixDeclaration(name='notEquals', in_type='integer', out_type='boolean', operator='!='), + '<=': CInfixDeclaration(name='lessThanOrEqual', in_type='integer', out_type='boolean', operator='<='), + '>=': CInfixDeclaration(name='greaterThanOrEqual', in_type='integer', out_type='boolean', operator='>='), + '<': CInfixDeclaration(name='lessThan', in_type='integer', out_type='boolean', operator='<'), + '>': CInfixDeclaration(name='greaterThan', in_type='integer', out_type='boolean', operator='>'), +} + +def transform_infix_operator_without_c_equivalent(accumulators, expression): + return CFunctionCallForFurInfixOperator( + metadata=expression.metadata, + name='concatenate', + ) + +def transform_infix_expression(accumulators, expression): + if expression.operator in FUR_INFIX_OPERATOR_TO_C_FUNCTION: + return transform_infix_operator_without_c_equivalent(accumulators, expression) + + accumulators.operator_set.add(FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR[expression.operator]) + + return CFunctionCallForFurInfixOperator( + metadata=expression.metadata, + name=FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR[expression.operator].name, + ) + +def transform_integer_literal_expression(accumulators, expression): + return CIntegerLiteral(value=expression.integer) + +def transform_negation_expression(accumulators, expression): + return CNegationExpression( + value=transform_expression(accumulators, expression.internal_expression), + ) + +CListConstructExpression = collections.namedtuple( + 'CListConstructExpression', + [ + 'allocate', + ], +) + +CListAppendStatement = collections.namedtuple( + 'CListAppendStatement', + [ + 'list_expression', + 'item_expression', + ], +) + +CListGetExpression = collections.namedtuple( + 'CListGetExpression', + [ + 'list_expression', + 'index_expression', + ], +) + +def transform_structure_literal_expression(accumulators, expression): + return CStructureLiteralExpression( + field_count=expression.field_count, + symbol_list_variable=expression.symbol_list_variable, + value_list_variable=expression.value_list_variable, + ) + +def transform_dot_expression(accumulators, expression): + try: + symbol_list_index = accumulators.symbol_list.index(expression.field) + + except ValueError: + symbol_list_index = len(accumulators.symbol_list) + accumulators.symbol_list.append(expression.field) + + return CDotExpression( + instance=transform_variable_expression(accumulators, expression.instance), + symbol=expression.field, + symbol_list_index=symbol_list_index, + ) + +def transform_list_construct_expression(accumulators, expression): + return CListConstructExpression(allocate=expression.allocate) + +def transform_list_get_expression(accumulators, expression): + return CListGetExpression( + list_expression=transform_expression(accumulators, expression.list_expression), + index_expression=transform_expression(accumulators, expression.index_expression), + ) + +def transform_list_append_statement(accumulators, expression): + return CListAppendStatement( + list_expression=transform_expression(accumulators, expression.list_expression), + item_expression=transform_expression(accumulators, expression.item_expression), + ) + def transform_expression(accumulators, expression): - if isinstance(expression, parsing.FurParenthesizedExpression): - # Parentheses can be removed because everything in the C output is explicitly parenthesized - return transform_expression(accumulators, expression.internal) - - if isinstance(expression, parsing.FurNegationExpression): - return transform_negation_expression(accumulators, expression) - - if isinstance(expression, parsing.FurFunctionCallExpression): - return transform_function_call_expression(accumulators, expression) - - if isinstance(expression, parsing.FurSymbolExpression): - if expression.value in ['true', 'false']: - return CConstantExpression(value=expression.value) - - if expression.value not in accumulators.symbol_list: - symbol_list.append(expression.value) - - return CSymbolExpression( - symbol=expression.value, - symbol_list_index=accumulators.symbol_list.index(expression.value), - ) - - LITERAL_TYPE_MAPPING = { - parsing.FurIntegerLiteralExpression: CIntegerLiteral, - parsing.FurStringLiteralExpression: CStringLiteral, - } - - if type(expression) in LITERAL_TYPE_MAPPING: - return LITERAL_TYPE_MAPPING[type(expression)](value=expression.value) - - if isinstance(expression, parsing.FurInfixExpression): - if expression.order == 'equality_level': - return transform_equality_level_expression(accumulators, expression) - - INFIX_OPERATOR_TO_FUNCTION_NAME = { - '+': 'add', - '-': 'subtract', - '*': 'multiply', - '//': 'integerDivide', - '%': 'modularDivide', - 'and': 'and', - 'or': 'or', - } - - return CFunctionCallForFurInfixOperator( - name=INFIX_OPERATOR_TO_FUNCTION_NAME[expression.operator], - left=transform_expression(accumulators, expression.left), - right=transform_expression(accumulators, expression.right), - ) - - raise Exception('Could not transform expression "{}"'.format(expression)) - -def transform_assignment_statement(accumulators, assignment_statement): + # TODO Clean up handlers for parsing expressions + return { + parsing.FurInfixExpression: transform_infix_expression, + parsing.FurIntegerLiteralExpression: transform_integer_literal_expression, + parsing.FurNegationExpression: transform_negation_expression, + parsing.FurStringLiteralExpression: transform_string_literal_expression, + normalization.NormalDotExpression: transform_dot_expression, + normalization.NormalFunctionCallExpression: transform_function_call_expression, + normalization.NormalInfixExpression: transform_infix_expression, + normalization.NormalIntegerLiteralExpression: transform_integer_literal_expression, + normalization.NormalListConstructExpression: transform_list_construct_expression, + normalization.NormalListGetExpression: transform_list_get_expression, + normalization.NormalNegationExpression: transform_negation_expression, + normalization.NormalStructureLiteralExpression: transform_structure_literal_expression, + normalization.NormalStringLiteralExpression: transform_string_literal_expression, + normalization.NormalSymbolExpression: transform_symbol_expression, + normalization.NormalVariableExpression: transform_variable_expression, + }[type(expression)](accumulators, expression) + +def transform_symbol_assignment_statement(accumulators, assignment_statement): # TODO Check that target is not a builtin - if assignment_statement.target not in accumulators.symbol_list: + try: + symbol_list_index = accumulators.symbol_list.index(assignment_statement.target) + except ValueError: + symbol_list_index = len(accumulators.symbol_list) accumulators.symbol_list.append(assignment_statement.target) - return CAssignmentStatement( + return CSymbolAssignmentStatement( target=assignment_statement.target, - target_symbol_list_index=accumulators.symbol_list.index(assignment_statement.target), + target_symbol_list_index=symbol_list_index, expression=transform_expression( accumulators, assignment_statement.expression, ), ) -def transform_negation_expression(accumulators, negation_expression): - return CNegationExpression( - value=transform_expression(accumulators, negation_expression.value), +def transform_function_call_expression(accumulators, function_call): + # TODO Use the symbol from SYMBOL LIST + return CFunctionCallExpression( + function_expression=transform_expression(accumulators, function_call.function_expression), + argument_count=function_call.argument_count, ) -def transform_function_call_expression(accumulators, function_call): - if function_call.function.value in BUILTINS.keys(): - # TODO Check that the builtin is actually callable - accumulators.builtin_set.add(function_call.function.value) +def transform_expression_statement(accumulators, statement): + return CExpressionStatement( + expression=transform_expression(accumulators, statement.expression), + ) + +def transform_if_else_statement(accumulators, statement): + return CIfElseStatement( + condition_expression=transform_expression(accumulators, statement.condition_expression), + if_statement_list=tuple(transform_statement(accumulators, s) for s in statement.if_statement_list), + else_statement_list=tuple(transform_statement(accumulators, s) for s in statement.else_statement_list), + ) + +def transform_array_variable_initialization_statement(accumulators, statement): + return CArrayVariableInitializationStatement( + variable=statement.variable, + items=tuple(transform_expression(accumulators, i) for i in statement.items), + ) + +def transform_symbol_array_variable_initialization_statement(accumulators, statement): + symbol_list_indices = [] + + for symbol in statement.symbol_list: + try: + symbol_list_index = accumulators.symbol_list.index(symbol) + except ValueError: + symbol_list_index = len(accumulators.symbol_list) + accumulators.symbol_list.append(symbol) + + symbol_list_indices.append(symbol_list_index) + + return CSymbolArrayVariableInitializationStatement( + variable=statement.variable, + symbol_list=statement.symbol_list, + symbol_list_indices=tuple(symbol_list_indices), + ) + +def transform_variable_initialization_statement(accumulators, statement): + return CVariableInitializationStatement( + variable=statement.variable, + expression=transform_expression(accumulators, statement.expression), + ) + +def transform_variable_reassignment_statement(accumulators, statement): + return CVariableReassignmentStatement( + variable=statement.variable, + expression=transform_expression(accumulators, statement.expression), + ) + +def transform_function_definition_statement(accumulators, statement): + # TODO Allow defining the same function in different contexts + if any(fd.name == statement.name for fd in accumulators.function_definition_list): + raise Exception('A function with name "{}" already exists'.format(statement.name)) + + # TODO Add argument names to the symbol table + accumulators.function_definition_list.append(CFunctionDefinition( + name=statement.name, + argument_name_list=statement.argument_name_list, + statement_list=tuple(transform_statement(accumulators, s) for s in statement.statement_list) + )) - return CFunctionCallExpression( - name='builtin$' + function_call.function.value, - arguments=tuple( - transform_expression(accumulators, arg) - for arg in function_call.arguments - ), - ) + return CFunctionDeclaration(name=statement.name) - raise Exception() +def transform_push_statement(accumulators, statement): + return CPushStatement(expression=transform_expression(accumulators, statement.expression)) def transform_statement(accumulators, statement): return { - parsing.FurAssignmentStatement: transform_assignment_statement, - parsing.FurFunctionCallExpression: transform_function_call_expression, + parsing.FurExpressionStatement: transform_expression_statement, + normalization.NormalArrayVariableInitializationStatement: transform_array_variable_initialization_statement, + normalization.NormalAssignmentStatement: transform_symbol_assignment_statement, + normalization.NormalExpressionStatement: transform_expression_statement, + normalization.NormalFunctionDefinitionStatement: transform_function_definition_statement, + normalization.NormalIfElseStatement: transform_if_else_statement, + normalization.NormalListAppendStatement: transform_list_append_statement, + normalization.NormalPushStatement: transform_push_statement, + normalization.NormalSymbolArrayVariableInitializationStatement: transform_symbol_array_variable_initialization_statement, + normalization.NormalVariableInitializationStatement: transform_variable_initialization_statement, + normalization.NormalVariableReassignmentStatement: transform_variable_reassignment_statement, }[type(statement)](accumulators, statement) @@ -220,29 +452,38 @@ Accumulators = collections.namedtuple( 'Accumulators', [ 'builtin_set', + 'function_definition_list', + 'operator_set', 'symbol_list', + 'string_literal_list', ], ) def transform(program): accumulators = Accumulators( builtin_set=set(), - symbol_list = [], + function_definition_list=[], + operator_set=set(), + symbol_list=[], + string_literal_list=[], ) - c_statements = [ + statement_list = [ transform_statement(accumulators, statement) for statement in program.statement_list ] - standard_libraries = set() + standard_library_set = set() for builtin in accumulators.builtin_set: for standard_library in BUILTINS[builtin]: - standard_libraries.add(standard_library) + standard_library_set.add(standard_library) return CProgram( builtin_set=accumulators.builtin_set, - statements=c_statements, - standard_libraries=standard_libraries, + function_definition_list=accumulators.function_definition_list, + operator_declarations=tuple(sorted(accumulators.operator_set)), + statements=statement_list, + standard_libraries=standard_library_set, + string_literal_list=accumulators.string_literal_list, symbol_list=accumulators.symbol_list, )