Allocate Fur stacks on the C heap
[fur] / transformation.py
index f2bd2a7..7d47ed4 100644 (file)
@@ -1,6 +1,7 @@
 import collections
 
-import parsing
+import normalization
+import parsing # TODO Remove this import, as we should be normalizing everything before it gets here
 
 CIntegerLiteral = collections.namedtuple(
     'CIntegerLiteral',
@@ -12,65 +13,478 @@ CIntegerLiteral = collections.namedtuple(
 CStringLiteral = collections.namedtuple(
     'CStringLiteral',
     [
+        'index',
         'value',
     ],
 )
 
-CFunctionCallStatement = collections.namedtuple(
-    'CFunctionCallStatement',
+CVariableExpression = collections.namedtuple(
+    'CVariableExpression',
     [
+        'variable',
+    ],
+)
+
+CSymbolExpression = collections.namedtuple(
+    'CSymbolExpression',
+    [
+        'symbol',
+        'symbol_list_index',
+    ],
+)
+
+CStructureLiteralExpression = collections.namedtuple(
+    'CStructureLiteralExpression',
+    [
+        'field_count',
+        'symbol_list_variable',
+        'value_list_variable',
+    ],
+)
+
+CDotExpression = collections.namedtuple(
+    'CDotExpression',
+    [
+        'instance',
+        'symbol',
+        'symbol_list_index',
+    ],
+)
+
+CNegationExpression = collections.namedtuple(
+    'CNegationExpression',
+    [
+        'value',
+    ],
+)
+
+CFunctionCallForFurInfixOperator = collections.namedtuple(
+    'CFunctionCallForFurInfixOperator',
+    [
+        'metadata',
         'name',
-        'arguments',
+    ],
+)
+
+CPushStatement = collections.namedtuple(
+    'CPushStatement',
+    (
+        'expression',
+    ),
+)
+
+CFunctionCallExpression = collections.namedtuple(
+    'CFunctionCallExpression',
+    [
+        'function_expression',
+        'argument_count',
+    ],
+)
+
+# TODO We are currently not changing variables, just preventing them from being accessed.
+CSymbolAssignmentStatement = collections.namedtuple(
+    'CSymbolAssignmentStatement',
+    [
+        'target',
+        'target_symbol_list_index',
+        'expression',
+    ],
+)
+
+CArrayVariableInitializationStatement = collections.namedtuple(
+    'CArrayVariableInitializationStatement',
+    [
+        'variable',
+        'items',
+    ],
+)
+
+CSymbolArrayVariableInitializationStatement = collections.namedtuple(
+    'CSymbolArrayVariableInitializationStatement',
+    [
+        'variable',
+        'symbol_list',
+        'symbol_list_indices',
+    ],
+)
+
+CVariableInitializationStatement = collections.namedtuple(
+    'CVariableInitializationStatement',
+    [
+        'variable',
+        'expression',
+    ],
+)
+
+CVariableReassignmentStatement = collections.namedtuple(
+    'CVariableReassignmentStatement',
+    [
+        'variable',
+        'expression',
+    ],
+)
+
+CExpressionStatement = collections.namedtuple(
+    'CExpressionStatement',
+    [
+        'expression',
+    ],
+)
+
+CIfElseStatement = collections.namedtuple(
+    'CIfElseStatement',
+    [
+        'condition_expression',
+        'if_statement_list',
+        'else_statement_list',
+    ],
+)
+
+CFunctionDeclaration = collections.namedtuple(
+    'CFunctionDeclaration',
+    [
+        'name',
+    ],
+)
+
+# TODO If a function definition doesn't end with an expression, we have issues currently because we try to return statement.
+# TODO Closures currently wrap entire defining environment, even symbols that are not used, which makes garbage collection ineffective.
+CFunctionDefinition = collections.namedtuple(
+    'CFunctionDefinition',
+    [
+        'name',
+        'argument_name_list',
+        'statement_list',
     ],
 )
 
 CProgram = collections.namedtuple(
     'CProgram',
     [
-        'builtins',
+        'builtin_set',
+        'function_definition_list',
+        'operator_declarations',
         'statements',
         'standard_libraries',
+        'string_literal_list',
+        'symbol_list',
     ],
 )
 
 BUILTINS = {
-    'print': ['stdio.h.'],
+    'concatenate':      [],
+    'false':            [],
+    'pow':              ['math.h'],
+    'print':            ['stdio.h'],
+    'true':             [],
+}
+
+def transform_variable_expression(accumulators, expression):
+    assert isinstance(expression, normalization.NormalVariableExpression)
+    return CVariableExpression(variable=expression.variable)
+
+def transform_string_literal_expression(accumulators, expression):
+    value = expression.string
+
+    try:
+        index = accumulators.string_literal_list.index(value)
+    except ValueError:
+        index = len(accumulators.string_literal_list)
+        accumulators.string_literal_list.append(value)
+
+    return CStringLiteral(index=index, value=value)
+
+def transform_symbol_expression(accumulators, expression):
+    if expression.symbol in BUILTINS:
+        accumulators.builtin_set.add(expression.symbol)
+
+    try:
+        symbol_list_index = accumulators.symbol_list.index(expression.symbol)
+    except ValueError:
+        symbol_list_index = len(accumulators.symbol_list)
+        accumulators.symbol_list.append(expression.symbol)
+
+    return CSymbolExpression(
+        symbol=expression.symbol,
+        symbol_list_index=symbol_list_index,
+    )
+
+CInfixDeclaration = collections.namedtuple(
+    'CInfixDeclaration',
+    [
+        'name',
+        'in_type',
+        'out_type',
+        'operator',
+    ],
+)
+
+FUR_INFIX_OPERATOR_TO_C_FUNCTION = {
+    '++':   'concatenate',
 }
 
-def transform_argument(builtin_dependencies, argument):
+FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR = {
+    '+':    CInfixDeclaration(name='add', in_type='integer', out_type='integer', operator='+'),
+    '-':    CInfixDeclaration(name='subtract', in_type='integer', out_type='integer', operator='-'),
+    '*':    CInfixDeclaration(name='multiply', in_type='integer', out_type='integer', operator='*'),
+    '//':   CInfixDeclaration(name='integerDivide', in_type='integer', out_type='integer', operator='/'),
+    '%':    CInfixDeclaration(name='modularDivide', in_type='integer', out_type='integer', operator='%'),
+    'and':  CInfixDeclaration(name='and', in_type='boolean', out_type='boolean', operator='&&'),
+    'or':   CInfixDeclaration(name='or', in_type='boolean', out_type='boolean', operator='||'),
+    '==':   CInfixDeclaration(name='equals', in_type='integer', out_type='boolean', operator='=='),
+    '!=':   CInfixDeclaration(name='notEquals', in_type='integer', out_type='boolean', operator='!='),
+    '<=':   CInfixDeclaration(name='lessThanOrEqual', in_type='integer', out_type='boolean', operator='<='),
+    '>=':   CInfixDeclaration(name='greaterThanOrEqual', in_type='integer', out_type='boolean', operator='>='),
+    '<':    CInfixDeclaration(name='lessThan', in_type='integer', out_type='boolean', operator='<'),
+    '>':    CInfixDeclaration(name='greaterThan', in_type='integer', out_type='boolean', operator='>'),
+}
+
+def transform_infix_operator_without_c_equivalent(accumulators, expression):
+    return CFunctionCallForFurInfixOperator(
+        metadata=expression.metadata,
+        name='concatenate',
+    )
+
+def transform_infix_expression(accumulators, expression):
+    if expression.operator in FUR_INFIX_OPERATOR_TO_C_FUNCTION:
+        return transform_infix_operator_without_c_equivalent(accumulators, expression)
+
+    accumulators.operator_set.add(FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR[expression.operator])
+
+    return CFunctionCallForFurInfixOperator(
+        metadata=expression.metadata,
+        name=FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR[expression.operator].name,
+    )
+
+def transform_integer_literal_expression(accumulators, expression):
+    return CIntegerLiteral(value=expression.integer)
+
+def transform_negation_expression(accumulators, expression):
+    return CNegationExpression(
+        value=transform_expression(accumulators, expression.internal_expression),
+    )
+
+CListConstructExpression = collections.namedtuple(
+    'CListConstructExpression',
+    [
+        'allocate',
+    ],
+)
+
+CListAppendStatement = collections.namedtuple(
+    'CListAppendStatement',
+    [
+        'list_expression',
+        'item_expression',
+    ],
+)
+
+CListGetExpression = collections.namedtuple(
+    'CListGetExpression',
+    [
+        'list_expression',
+        'index_expression',
+    ],
+)
+
+def transform_structure_literal_expression(accumulators, expression):
+    return CStructureLiteralExpression(
+        field_count=expression.field_count,
+        symbol_list_variable=expression.symbol_list_variable,
+        value_list_variable=expression.value_list_variable,
+    )
+
+def transform_dot_expression(accumulators, expression):
+    try:
+        symbol_list_index = accumulators.symbol_list.index(expression.field)
+
+    except ValueError:
+        symbol_list_index = len(accumulators.symbol_list)
+        accumulators.symbol_list.append(expression.field)
+
+    return CDotExpression(
+        instance=transform_variable_expression(accumulators, expression.instance),
+        symbol=expression.field,
+        symbol_list_index=symbol_list_index,
+    )
+
+def transform_list_construct_expression(accumulators, expression):
+    return CListConstructExpression(allocate=expression.allocate)
+
+def transform_list_get_expression(accumulators, expression):
+    return CListGetExpression(
+        list_expression=transform_expression(accumulators, expression.list_expression),
+        index_expression=transform_expression(accumulators, expression.index_expression),
+    )
+
+def transform_list_append_statement(accumulators, expression):
+    return CListAppendStatement(
+        list_expression=transform_expression(accumulators, expression.list_expression),
+        item_expression=transform_expression(accumulators, expression.item_expression),
+    )
+
+def transform_expression(accumulators, expression):
+    # TODO Clean up handlers for parsing expressions
     return {
-        parsing.IntegerLiteral: CIntegerLiteral,
-        parsing.StringLiteral: CStringLiteral,
-    }[type(argument)](value=argument.value)
+        parsing.FurInfixExpression: transform_infix_expression,
+        parsing.FurIntegerLiteralExpression: transform_integer_literal_expression,
+        parsing.FurNegationExpression: transform_negation_expression,
+        parsing.FurStringLiteralExpression: transform_string_literal_expression,
+        normalization.NormalDotExpression: transform_dot_expression,
+        normalization.NormalFunctionCallExpression: transform_function_call_expression,
+        normalization.NormalInfixExpression: transform_infix_expression,
+        normalization.NormalIntegerLiteralExpression: transform_integer_literal_expression,
+        normalization.NormalListConstructExpression: transform_list_construct_expression,
+        normalization.NormalListGetExpression: transform_list_get_expression,
+        normalization.NormalNegationExpression: transform_negation_expression,
+        normalization.NormalStructureLiteralExpression: transform_structure_literal_expression,
+        normalization.NormalStringLiteralExpression: transform_string_literal_expression,
+        normalization.NormalSymbolExpression: transform_symbol_expression,
+        normalization.NormalVariableExpression: transform_variable_expression,
+    }[type(expression)](accumulators, expression)
+
+def transform_symbol_assignment_statement(accumulators, assignment_statement):
+    # TODO Check that target is not a builtin
+    try:
+        symbol_list_index = accumulators.symbol_list.index(assignment_statement.target)
+    except ValueError:
+        symbol_list_index = len(accumulators.symbol_list)
+        accumulators.symbol_list.append(assignment_statement.target)
+
+    return CSymbolAssignmentStatement(
+        target=assignment_statement.target,
+        target_symbol_list_index=symbol_list_index,
+        expression=transform_expression(
+            accumulators,
+            assignment_statement.expression,
+        ),
+    )
 
-def transform_function_call_statement(builtin_dependencies, function_call):
-    if function_call.name in BUILTINS.keys():
-        builtin_dependencies.add(function_call.name)
+def transform_function_call_expression(accumulators, function_call):
+    # TODO Use the symbol from SYMBOL LIST
+    return CFunctionCallExpression(
+        function_expression=transform_expression(accumulators, function_call.function_expression),
+        argument_count=function_call.argument_count,
+    )
 
-        return CFunctionCallStatement(
-            name='builtin$' + function_call.name,
-            arguments=tuple(transform_argument(builtin_dependencies, arg) for arg in function_call.arguments),
-        )
+def transform_expression_statement(accumulators, statement):
+    return CExpressionStatement(
+        expression=transform_expression(accumulators, statement.expression),
+    )
 
-    raise Exception()
+def transform_if_else_statement(accumulators, statement):
+    return CIfElseStatement(
+        condition_expression=transform_expression(accumulators, statement.condition_expression),
+        if_statement_list=tuple(transform_statement(accumulators, s) for s in statement.if_statement_list),
+        else_statement_list=tuple(transform_statement(accumulators, s) for s in statement.else_statement_list),
+    )
 
+def transform_array_variable_initialization_statement(accumulators, statement):
+    return CArrayVariableInitializationStatement(
+        variable=statement.variable,
+        items=tuple(transform_expression(accumulators, i) for i in statement.items),
+    )
+
+def transform_symbol_array_variable_initialization_statement(accumulators, statement):
+    symbol_list_indices = []
+
+    for symbol in statement.symbol_list:
+        try:
+            symbol_list_index = accumulators.symbol_list.index(symbol)
+        except ValueError:
+            symbol_list_index = len(accumulators.symbol_list)
+            accumulators.symbol_list.append(symbol)
+
+        symbol_list_indices.append(symbol_list_index)
+
+    return CSymbolArrayVariableInitializationStatement(
+        variable=statement.variable,
+        symbol_list=statement.symbol_list,
+        symbol_list_indices=tuple(symbol_list_indices),
+    )
+
+def transform_variable_initialization_statement(accumulators, statement):
+    return CVariableInitializationStatement(
+        variable=statement.variable,
+        expression=transform_expression(accumulators, statement.expression),
+    )
+
+def transform_variable_reassignment_statement(accumulators, statement):
+    return CVariableReassignmentStatement(
+        variable=statement.variable,
+        expression=transform_expression(accumulators, statement.expression),
+    )
+
+def transform_function_definition_statement(accumulators, statement):
+    # TODO Allow defining the same function in different contexts
+    if any(fd.name == statement.name for fd in accumulators.function_definition_list):
+        raise Exception('A function with name "{}" already exists'.format(statement.name))
+
+    # TODO Add argument names to the symbol table
+    accumulators.function_definition_list.append(CFunctionDefinition(
+        name=statement.name,
+        argument_name_list=statement.argument_name_list,
+        statement_list=tuple(transform_statement(accumulators, s) for s in statement.statement_list)
+    ))
+
+    return CFunctionDeclaration(name=statement.name)
+
+def transform_push_statement(accumulators, statement):
+    return CPushStatement(expression=transform_expression(accumulators, statement.expression))
+
+def transform_statement(accumulators, statement):
+    return {
+        parsing.FurExpressionStatement: transform_expression_statement,
+        normalization.NormalArrayVariableInitializationStatement: transform_array_variable_initialization_statement,
+        normalization.NormalAssignmentStatement: transform_symbol_assignment_statement,
+        normalization.NormalExpressionStatement: transform_expression_statement,
+        normalization.NormalFunctionDefinitionStatement: transform_function_definition_statement,
+        normalization.NormalIfElseStatement: transform_if_else_statement,
+        normalization.NormalListAppendStatement: transform_list_append_statement,
+        normalization.NormalPushStatement: transform_push_statement,
+        normalization.NormalSymbolArrayVariableInitializationStatement: transform_symbol_array_variable_initialization_statement,
+        normalization.NormalVariableInitializationStatement: transform_variable_initialization_statement,
+        normalization.NormalVariableReassignmentStatement: transform_variable_reassignment_statement,
+    }[type(statement)](accumulators, statement)
+
+
+Accumulators = collections.namedtuple(
+    'Accumulators',
+    [
+        'builtin_set',
+        'function_definition_list',
+        'operator_set',
+        'symbol_list',
+        'string_literal_list',
+    ],
+)
 
 def transform(program):
-    builtins = set()
+    accumulators = Accumulators(
+        builtin_set=set(),
+        function_definition_list=[],
+        operator_set=set(),
+        symbol_list=[],
+        string_literal_list=[],
+    )
 
-    c_statements = [
-        transform_function_call_statement(builtins, statement) for statement in program.statement_list
+    statement_list = [
+        transform_statement(accumulators, statement) for statement in program.statement_list
     ]
 
-    standard_libraries = set()
-    for builtin in builtins:
+    standard_library_set = set()
+    for builtin in accumulators.builtin_set:
         for standard_library in BUILTINS[builtin]:
-            standard_libraries.add(standard_library)
+            standard_library_set.add(standard_library)
 
     return CProgram(
-        builtins=builtins,
-        statements=c_statements,
-        standard_libraries=standard_libraries,
+        builtin_set=accumulators.builtin_set,
+        function_definition_list=accumulators.function_definition_list,
+        operator_declarations=tuple(sorted(accumulators.operator_set)),
+        statements=statement_list,
+        standard_libraries=standard_library_set,
+        string_literal_list=accumulators.string_literal_list,
+        symbol_list=accumulators.symbol_list,
     )