"""Transform CPS* nodes from the ``conversion`` module into C* tuples.

Each ``transform_*`` function takes the shared ``Accumulators`` instance and
one ``conversion`` node, and returns the matching ``C*`` namedtuple defined in
this module.  ``transform`` is the entry point for a whole program.
"""

import collections

import conversion

CIntegerLiteral = collections.namedtuple(
    'CIntegerLiteral',
    [
        'value',
    ],
)

CStringLiteral = collections.namedtuple(
    'CStringLiteral',
    [
        'index',
        'value',
    ],
)

CVariableExpression = collections.namedtuple(
    'CVariableExpression',
    [
        'variable',
    ],
)

CSymbolExpression = collections.namedtuple(
    'CSymbolExpression',
    [
        'symbol',
        'symbol_list_index',
    ],
)

CStructureLiteralExpression = collections.namedtuple(
    'CStructureLiteralExpression',
    [
        'field_count',
        'symbol_list_variable',
        'value_list_variable',
    ],
)

CPushStatement = collections.namedtuple(
    'CPushStatement',
    (
        'expression',
    ),
)

CFunctionCallExpression = collections.namedtuple(
    'CFunctionCallExpression',
    (
        'metadata',
        'function_expression',
        'argument_count',
    ),
)

# TODO We are currently not changing variables, just preventing them from being accessed.
CSymbolAssignmentStatement = collections.namedtuple(
    'CSymbolAssignmentStatement',
    [
        'target',
        'target_symbol_list_index',
        'expression',
    ],
)

CArrayVariableInitializationStatement = collections.namedtuple(
    'CArrayVariableInitializationStatement',
    [
        'variable',
        'items',
    ],
)

CSymbolArrayVariableInitializationStatement = collections.namedtuple(
    'CSymbolArrayVariableInitializationStatement',
    [
        'variable',
        'symbol_list',
        'symbol_list_indices',
    ],
)

CVariableInitializationStatement = collections.namedtuple(
    'CVariableInitializationStatement',
    [
        'variable',
        'expression',
    ],
)

CVariableReassignmentStatement = collections.namedtuple(
    'CVariableReassignmentStatement',
    [
        'variable',
        'expression',
    ],
)

CExpressionStatement = collections.namedtuple(
    'CExpressionStatement',
    [
        'expression',
    ],
)

CIfElseStatement = collections.namedtuple(
    'CIfElseStatement',
    [
        'condition_expression',
        'if_statement_list',
        'else_statement_list',
    ],
)

# TODO If a function definition doesn't end with an expression, we have issues currently because we try to return statement.
# TODO Closures currently wrap entire defining environment, even symbols that are not used, which makes garbage collection ineffective.
CFunctionDefinition = collections.namedtuple(
    'CFunctionDefinition',
    [
        'name',
        'index',
        'argument_name_list',
        'statement_list',
    ],
)

CProgram = collections.namedtuple(
    'CProgram',
    [
        'builtin_set',
        'function_definition_list',
        'operator_declarations',
        'statements',
        'standard_libraries',
        'string_literal_list',
        'symbol_list',
    ],
)

# Maps each builtin symbol to the standard libraries (e.g. 'math.h') that
# `transform` reports in `CProgram.standard_libraries` when the builtin is used.
BUILTINS = {
    'concatenate': [],
    'false': [],
    'pow': ['math.h'],
    'print': ['stdio.h'],
    'true': [],
}


def _intern(table, value):
    """Return the index of `value` in the list `table`, appending it if absent.

    Shared by the string-literal and symbol tables so that equal values
    always map to the same index and new values get the next free index.
    """
    try:
        return table.index(value)
    except ValueError:
        table.append(value)
        return len(table) - 1


def transform_variable_expression(accumulators, expression):
    """Wrap the node's `variable` in a `CVariableExpression`."""
    assert isinstance(expression, conversion.CPSVariableExpression)
    return CVariableExpression(variable=expression.variable)


def transform_string_literal_expression(accumulators, expression):
    """Intern `expression.string` in the string table and return a `CStringLiteral`."""
    value = expression.string
    index = _intern(accumulators.string_literal_list, value)
    return CStringLiteral(index=index, value=value)


def transform_symbol_expression(accumulators, expression):
    """Intern `expression.symbol` and return a `CSymbolExpression`.

    A symbol that is a key of `BUILTINS` is also recorded in
    `accumulators.builtin_set`.
    """
    symbol = expression.symbol

    if symbol in BUILTINS:
        accumulators.builtin_set.add(symbol)

    return CSymbolExpression(
        symbol=symbol,
        symbol_list_index=_intern(accumulators.symbol_list, symbol),
    )


def transform_integer_literal_expression(accumulators, expression):
    """Wrap the node's `integer` in a `CIntegerLiteral`."""
    return CIntegerLiteral(value=expression.integer)


CListConstructExpression = collections.namedtuple(
    'CListConstructExpression',
    (
        'allocate',
    ),
)

CLambdaExpression = collections.namedtuple(
    'CLambdaExpression',
    (
        'name',
        'index',
    ),
)

CListAppendStatement = collections.namedtuple(
    'CListAppendStatement',
    (
        'list_expression',
        'item_expression',
    ),
)


def transform_structure_literal_expression(accumulators, expression):
    """Copy the node's three fields into a `CStructureLiteralExpression`."""
    return CStructureLiteralExpression(
        field_count=expression.field_count,
        symbol_list_variable=expression.symbol_list_variable,
        value_list_variable=expression.value_list_variable,
    )


def transform_lambda_expression(accumulators, expression):
    """Register a `CFunctionDefinition` for the lambda and return a reference to it.

    Unnamed lambdas are registered under the name '__lambda'.  Each name has
    its own counter in `accumulators.function_name_iterators`, and the
    (name, index) pair is what the returned `CLambdaExpression` carries.
    """
    name = '__lambda' if expression.name is None else expression.name

    # Reserve this definition's index before transforming the body, so any
    # same-named lambdas nested inside the body receive later indices.
    index = accumulators.function_name_iterators.get(name, 0)
    accumulators.function_name_iterators[name] = index + 1

    # Transforming the body may itself append nested definitions; those are
    # therefore appended before this enclosing definition.
    statement_list = tuple(
        transform_statement(accumulators, s) for s in expression.statement_list
    )

    accumulators.function_definition_list.append(CFunctionDefinition(
        name=name,
        index=index,
        argument_name_list=expression.argument_name_list,
        statement_list=statement_list,
    ))

    return CLambdaExpression(
        name=name,
        index=index,
    )


def transform_list_construct_expression(accumulators, expression):
    """Wrap the node's `allocate` in a `CListConstructExpression`."""
    return CListConstructExpression(allocate=expression.allocate)


def transform_list_append_statement(accumulators, expression):
    """Transform both sub-expressions of a list-append node."""
    return CListAppendStatement(
        list_expression=transform_expression(accumulators, expression.list_expression),
        item_expression=transform_expression(accumulators, expression.item_expression),
    )


def transform_expression(accumulators, expression):
    """Dispatch on the exact type of `expression` to its transform function.

    Raises:
        KeyError: if `type(expression)` is not one of the types listed below.
    """
    return {
        conversion.CPSFunctionCallExpression: transform_function_call_expression,
        conversion.CPSIntegerLiteralExpression: transform_integer_literal_expression,
        conversion.CPSLambdaExpression: transform_lambda_expression,
        conversion.CPSListConstructExpression: transform_list_construct_expression,
        conversion.CPSStructureLiteralExpression: transform_structure_literal_expression,
        conversion.CPSStringLiteralExpression: transform_string_literal_expression,
        conversion.CPSSymbolExpression: transform_symbol_expression,
        conversion.CPSVariableExpression: transform_variable_expression,
    }[type(expression)](accumulators, expression)


def transform_symbol_assignment_statement(accumulators, assignment_statement):
    """Intern the assignment target and transform the assigned expression."""
    # TODO Check that target is not a builtin
    target = assignment_statement.target

    # The target is interned before the expression is transformed, so it
    # gets its index ahead of any new symbols the expression introduces.
    symbol_list_index = _intern(accumulators.symbol_list, target)

    return CSymbolAssignmentStatement(
        target=target,
        target_symbol_list_index=symbol_list_index,
        expression=transform_expression(
            accumulators,
            assignment_statement.expression,
        ),
    )


def transform_function_call_expression(accumulators, function_call):
    """Transform the callee expression; metadata and argument count pass through."""
    # TODO Use the symbol from SYMBOL LIST
    return CFunctionCallExpression(
        metadata=function_call.metadata,
        function_expression=transform_expression(accumulators, function_call.function_expression),
        argument_count=function_call.argument_count,
    )


def transform_expression_statement(accumulators, statement):
    """Transform the expression wrapped by an expression statement."""
    return CExpressionStatement(
        expression=transform_expression(accumulators, statement.expression),
    )


def transform_if_else_statement(accumulators, statement):
    """Transform the condition and both branches of an if/else statement."""
    return CIfElseStatement(
        condition_expression=transform_expression(accumulators, statement.condition_expression),
        if_statement_list=tuple(transform_statement(accumulators, s) for s in statement.if_statement_list),
        else_statement_list=tuple(transform_statement(accumulators, s) for s in statement.else_statement_list),
    )


def transform_array_variable_initialization_statement(accumulators, statement):
    """Transform every item expression; the variable passes through unchanged."""
    return CArrayVariableInitializationStatement(
        variable=statement.variable,
        items=tuple(transform_expression(accumulators, i) for i in statement.items),
    )


def transform_symbol_array_variable_initialization_statement(accumulators, statement):
    """Intern every symbol of the statement and record the resulting indices.

    `symbol_list_indices` is a tuple parallel to `statement.symbol_list`.
    """
    symbol_list_indices = tuple(
        _intern(accumulators.symbol_list, symbol)
        for symbol in statement.symbol_list
    )

    return CSymbolArrayVariableInitializationStatement(
        variable=statement.variable,
        symbol_list=statement.symbol_list,
        symbol_list_indices=symbol_list_indices,
    )


def transform_variable_initialization_statement(accumulators, statement):
    """Transform the initializer expression; the variable passes through."""
    return CVariableInitializationStatement(
        variable=statement.variable,
        expression=transform_expression(accumulators, statement.expression),
    )


def transform_variable_reassignment_statement(accumulators, statement):
    """Transform the reassigned expression; the variable passes through."""
    return CVariableReassignmentStatement(
        variable=statement.variable,
        expression=transform_expression(accumulators, statement.expression),
    )


def transform_push_statement(accumulators, statement):
    """Transform the expression carried by a push statement."""
    return CPushStatement(expression=transform_expression(accumulators, statement.expression))


def transform_statement(accumulators, statement):
    """Dispatch on the exact type of `statement` to its transform function.

    Raises:
        KeyError: if `type(statement)` is not one of the types listed below.
    """
    return {
        conversion.CPSArrayVariableInitializationStatement: transform_array_variable_initialization_statement,
        conversion.CPSAssignmentStatement: transform_symbol_assignment_statement,
        conversion.CPSExpressionStatement: transform_expression_statement,
        conversion.CPSIfElseStatement: transform_if_else_statement,
        conversion.CPSListAppendStatement: transform_list_append_statement,
        conversion.CPSPushStatement: transform_push_statement,
        conversion.CPSSymbolArrayVariableInitializationStatement: transform_symbol_array_variable_initialization_statement,
        conversion.CPSVariableInitializationStatement: transform_variable_initialization_statement,
        conversion.CPSVariableReassignmentStatement: transform_variable_reassignment_statement,
    }[type(statement)](accumulators, statement)


# Mutable containers threaded through every transform_* call.  Note that no
# function in this module adds to `operator_set`; `transform` only reads it.
Accumulators = collections.namedtuple(
    'Accumulators',
    [
        'builtin_set',
        'function_definition_list',
        'function_name_iterators',
        'operator_set',
        'symbol_list',
        'string_literal_list',
    ],
)


def transform(program):
    """Transform `program.statement_list` and bundle the results in a `CProgram`.

    Besides the transformed statements, the result carries everything the
    accumulators collected along the way (builtins used, function
    definitions, string literals, symbols) plus the union of the
    `BUILTINS` standard libraries for the builtins that were used.
    """
    accumulators = Accumulators(
        builtin_set=set(),
        function_definition_list=[],
        function_name_iterators={},
        operator_set=set(),
        symbol_list=[],
        string_literal_list=[],
    )

    # Must run before the accumulators are read below: transforming the
    # statements is what populates them.
    statement_list = [
        transform_statement(accumulators, statement) for statement in program.statement_list
    ]

    standard_library_set = {
        standard_library
        for builtin in accumulators.builtin_set
        for standard_library in BUILTINS[builtin]
    }

    return CProgram(
        builtin_set=accumulators.builtin_set,
        function_definition_list=accumulators.function_definition_list,
        operator_declarations=tuple(sorted(accumulators.operator_set)),
        statements=statement_list,
        standard_libraries=standard_library_set,
        string_literal_list=accumulators.string_literal_list,
        symbol_list=accumulators.symbol_list,
    )