Added lambda expressions
[fur] / transformation.py
index b75b3a0..e8ee51c 100644 (file)
@@ -1,6 +1,6 @@
 import collections
 
-import parsing
+import conversion
 
 CIntegerLiteral = collections.namedtuple(
     'CIntegerLiteral',
@@ -17,10 +17,10 @@ CStringLiteral = collections.namedtuple(
     ],
 )
 
-CConstantExpression = collections.namedtuple(
-    'CConstantExpression',
+CVariableExpression = collections.namedtuple(
+    'CVariableExpression',
     [
-        'value'
+        'variable',
     ],
 )
 
@@ -32,32 +32,34 @@ CSymbolExpression = collections.namedtuple(
     ],
 )
 
-CNegationExpression = collections.namedtuple(
-    'CNegationExpression',
+CStructureLiteralExpression = collections.namedtuple(
+    'CStructureLiteralExpression',
     [
-        'value',
+        'field_count',
+        'symbol_list_variable',
+        'value_list_variable',
     ],
 )
 
-CFunctionCallForFurInfixOperator = collections.namedtuple(
-    'CFunctionCallForFurInfixOperator',
-    [
-        'name',
-        'left',
-        'right',
-    ],
+CPushStatement = collections.namedtuple(
+    'CPushStatement',
+    (
+        'expression',
+    ),
 )
 
 CFunctionCallExpression = collections.namedtuple(
     'CFunctionCallExpression',
-    [
-        'name',
-        'arguments',
-    ],
+    (
+        'metadata',
+        'function_expression',
+        'argument_count',
+    ),
 )
 
-CAssignmentStatement = collections.namedtuple(
-    'CAssignmentStatement',
+# TODO We are currently not changing variables, just preventing them from being accessed.
+CSymbolAssignmentStatement = collections.namedtuple(
+    'CSymbolAssignmentStatement',
     [
         'target',
         'target_symbol_list_index',
@@ -65,10 +67,79 @@ CAssignmentStatement = collections.namedtuple(
     ],
 )
 
+CArrayVariableInitializationStatement = collections.namedtuple(
+    'CArrayVariableInitializationStatement',
+    [
+        'variable',
+        'items',
+    ],
+)
+
+CSymbolArrayVariableInitializationStatement = collections.namedtuple(
+    'CSymbolArrayVariableInitializationStatement',
+    [
+        'variable',
+        'symbol_list',
+        'symbol_list_indices',
+    ],
+)
+
+CVariableInitializationStatement = collections.namedtuple(
+    'CVariableInitializationStatement',
+    [
+        'variable',
+        'expression',
+    ],
+)
+
+CVariableReassignmentStatement = collections.namedtuple(
+    'CVariableReassignmentStatement',
+    [
+        'variable',
+        'expression',
+    ],
+)
+
+CExpressionStatement = collections.namedtuple(
+    'CExpressionStatement',
+    [
+        'expression',
+    ],
+)
+
+CIfElseStatement = collections.namedtuple(
+    'CIfElseStatement',
+    [
+        'condition_expression',
+        'if_statement_list',
+        'else_statement_list',
+    ],
+)
+
+CFunctionDeclaration = collections.namedtuple(
+    'CFunctionDeclaration',
+    [
+        'name',
+    ],
+)
+
+# TODO If a function definition doesn't end with an expression, we currently have issues because we try to return a statement.
+# TODO Closures currently wrap the entire defining environment, even symbols that are not used, which makes garbage collection ineffective.
+CFunctionDefinition = collections.namedtuple(
+    'CFunctionDefinition',
+    [
+        'name',
+        'argument_name_list',
+        'statement_list',
+    ],
+)
+
 CProgram = collections.namedtuple(
     'CProgram',
     [
         'builtin_set',
+        'function_definition_list',
+        'operator_declarations',
         'statements',
         'standard_libraries',
         'string_literal_list',
@@ -76,155 +147,217 @@ CProgram = collections.namedtuple(
     ],
 )
 
-EQUALITY_LEVEL_OPERATOR_TO_FUNCTION_NAME_MAPPING = {
-    '==':   'equals',
-    '!=':   'notEquals',
-    '<=':   'lessThanOrEqual',
-    '>=':   'greaterThanOrEqual',
-    '<':    'lessThan',
-    '>':    'greaterThan',
+BUILTINS = {
+    'concatenate':      [],
+    'false':            [],
+    'pow':              ['math.h'],
+    'print':            ['stdio.h'],
+    'true':             [],
 }
 
-def transform_equality_level_expression(accumulators, expression):
-    # Transform expressions like 1 < 2 < 3 into expressions like 1 < 2 && 2 < 3
-    if isinstance(expression.left, parsing.FurInfixExpression) and expression.left.order == 'equality_level':
-        left = transform_equality_level_expression(
-            accumulators,
-            expression.left
-        )
+def transform_variable_expression(accumulators, expression):
+    assert isinstance(expression, conversion.CPSVariableExpression)
+    return CVariableExpression(variable=expression.variable)
 
-        middle = left.right
+def transform_string_literal_expression(accumulators, expression):
+    value = expression.string
 
-        right = transform_expression(
-            accumulators,
-            expression.right,
-        )
-
-        # TODO Don't evaluate the middle expression twice
-        return CFunctionCallForFurInfixOperator(
-            name='and',
-            left=left,
-            right=CFunctionCallForFurInfixOperator(
-                name=EQUALITY_LEVEL_OPERATOR_TO_FUNCTION_NAME_MAPPING[expression.operator],
-                left=middle,
-                right=right,
-            ),
-        )
-
-    return CFunctionCallForFurInfixOperator(
-        name=EQUALITY_LEVEL_OPERATOR_TO_FUNCTION_NAME_MAPPING[expression.operator],
-        left=transform_expression(accumulators, expression.left),
-        right=transform_expression(accumulators, expression.right),
-    )
+    try:
+        index = accumulators.string_literal_list.index(value)
+    except ValueError:
+        index = len(accumulators.string_literal_list)
+        accumulators.string_literal_list.append(value)
 
-BUILTINS = {
-    'false':    [],
-    'pow':      ['math.h'],
-    'print':    ['stdio.h'],
-    'true':     [],
-}
+    return CStringLiteral(index=index, value=value)
 
-def transform_expression(accumulators, expression):
-    if isinstance(expression, parsing.FurParenthesizedExpression):
-        # Parentheses can be removed because everything in the C output is explicitly parenthesized
-        return transform_expression(accumulators, expression.internal)
+def transform_symbol_expression(accumulators, expression):
+    if expression.symbol in BUILTINS:
+        accumulators.builtin_set.add(expression.symbol)
 
-    if isinstance(expression, parsing.FurNegationExpression):
-        return transform_negation_expression(accumulators, expression)
+    try:
+        symbol_list_index = accumulators.symbol_list.index(expression.symbol)
+    except ValueError:
+        symbol_list_index = len(accumulators.symbol_list)
+        accumulators.symbol_list.append(expression.symbol)
 
-    if isinstance(expression, parsing.FurFunctionCallExpression):
-        return transform_function_call_expression(accumulators, expression)
+    return CSymbolExpression(
+        symbol=expression.symbol,
+        symbol_list_index=symbol_list_index,
+    )
 
-    if isinstance(expression, parsing.FurSymbolExpression):
-        if expression.value in ['true', 'false']:
-            return CConstantExpression(value=expression.value)
+def transform_integer_literal_expression(accumulators, expression):
+    return CIntegerLiteral(value=expression.integer)
 
-        if expression.value not in accumulators.symbol_list:
-            symbol_list.append(expression.value)
+CListConstructExpression = collections.namedtuple(
+    'CListConstructExpression',
+    (
+        'allocate',
+    ),
+)
 
-        return CSymbolExpression(
-            symbol=expression.value,
-            symbol_list_index=accumulators.symbol_list.index(expression.value),
-        )
+CLambdaExpression = collections.namedtuple(
+    'CLambdaExpression',
+    (
+        'name',
+    ),
+)
 
-    if isinstance(expression, parsing.FurStringLiteralExpression):
-        value = expression.value
+CListAppendStatement = collections.namedtuple(
+    'CListAppendStatement',
+    (
+        'list_expression',
+        'item_expression',
+    ),
+)
 
-        try:
-            index = accumulators.string_literal_list.index(value)
-        except ValueError:
-            index = len(accumulators.string_literal_list)
-            accumulators.string_literal_list.append(value)
+def transform_structure_literal_expression(accumulators, expression):
+    return CStructureLiteralExpression(
+        field_count=expression.field_count,
+        symbol_list_variable=expression.symbol_list_variable,
+        value_list_variable=expression.value_list_variable,
+    )
 
-        return CStringLiteral(index=index, value=value)
+def transform_lambda_expression(accumulators, expression):
+    # TODO This function feels hacky
+    if len(accumulators.lambda_number_list) == 0:
+        accumulators.lambda_number_list.append(0)
+    else:
+        accumulators.lambda_number_list.append(accumulators.lambda_number_list[-1] + 1)
 
-    LITERAL_TYPE_MAPPING = {
-        parsing.FurIntegerLiteralExpression: CIntegerLiteral,
-    }
+    name = '__lambda_{}'.format(accumulators.lambda_number_list[-1])
 
-    if type(expression) in LITERAL_TYPE_MAPPING:
-        return LITERAL_TYPE_MAPPING[type(expression)](value=expression.value)
+    accumulators.function_definition_list.append(CFunctionDefinition(
+        name=name,
+        argument_name_list=expression.argument_name_list,
+        statement_list=tuple(transform_statement(accumulators, s) for s in expression.statement_list),
+    ))
 
-    if isinstance(expression, parsing.FurInfixExpression):
-        if expression.order == 'equality_level':
-            return transform_equality_level_expression(accumulators, expression)
+    return CLambdaExpression(name=name)
 
-        INFIX_OPERATOR_TO_FUNCTION_NAME = {
-            '+':    'add',
-            '-':    'subtract',
-            '*':    'multiply',
-            '//':   'integerDivide',
-            '%':    'modularDivide',
-            'and':  'and',
-            'or':   'or',
-        }
 
-        return CFunctionCallForFurInfixOperator(
-            name=INFIX_OPERATOR_TO_FUNCTION_NAME[expression.operator],
-            left=transform_expression(accumulators, expression.left),
-            right=transform_expression(accumulators, expression.right),
-        )
+def transform_list_construct_expression(accumulators, expression):
+    return CListConstructExpression(allocate=expression.allocate)
 
-    raise Exception('Could not transform expression "{}"'.format(expression))
+def transform_list_append_statement(accumulators, expression):
+    return CListAppendStatement(
+        list_expression=transform_expression(accumulators, expression.list_expression),
+        item_expression=transform_expression(accumulators, expression.item_expression),
+    )
 
-def transform_assignment_statement(accumulators, assignment_statement):
+def transform_expression(accumulators, expression):
+    return {
+        conversion.CPSFunctionCallExpression: transform_function_call_expression,
+        conversion.CPSIntegerLiteralExpression: transform_integer_literal_expression,
+        conversion.CPSLambdaExpression: transform_lambda_expression,
+        conversion.CPSListConstructExpression: transform_list_construct_expression,
+        conversion.CPSStructureLiteralExpression: transform_structure_literal_expression,
+        conversion.CPSStringLiteralExpression: transform_string_literal_expression,
+        conversion.CPSSymbolExpression: transform_symbol_expression,
+        conversion.CPSVariableExpression: transform_variable_expression,
+    }[type(expression)](accumulators, expression)
+
+def transform_symbol_assignment_statement(accumulators, assignment_statement):
     # TODO Check that target is not a builtin
-    if assignment_statement.target not in accumulators.symbol_list:
+    try:
+        symbol_list_index = accumulators.symbol_list.index(assignment_statement.target)
+    except ValueError:
+        symbol_list_index = len(accumulators.symbol_list)
         accumulators.symbol_list.append(assignment_statement.target)
 
-    return CAssignmentStatement(
+    return CSymbolAssignmentStatement(
         target=assignment_statement.target,
-        target_symbol_list_index=accumulators.symbol_list.index(assignment_statement.target),
+        target_symbol_list_index=symbol_list_index,
         expression=transform_expression(
             accumulators,
             assignment_statement.expression,
         ),
     )
 
-def transform_negation_expression(accumulators, negation_expression):
-    return CNegationExpression(
-        value=transform_expression(accumulators, negation_expression.value),
+def transform_function_call_expression(accumulators, function_call):
+    # TODO Use the symbol from SYMBOL LIST
+    return CFunctionCallExpression(
+        metadata=function_call.metadata,
+        function_expression=transform_expression(accumulators, function_call.function_expression),
+        argument_count=function_call.argument_count,
     )
 
-def transform_function_call_expression(accumulators, function_call):
-    if function_call.function.value in BUILTINS.keys():
-        # TODO Check that the builtin is actually callable
-        accumulators.builtin_set.add(function_call.function.value)
+def transform_expression_statement(accumulators, statement):
+    return CExpressionStatement(
+        expression=transform_expression(accumulators, statement.expression),
+    )
+
+def transform_if_else_statement(accumulators, statement):
+    return CIfElseStatement(
+        condition_expression=transform_expression(accumulators, statement.condition_expression),
+        if_statement_list=tuple(transform_statement(accumulators, s) for s in statement.if_statement_list),
+        else_statement_list=tuple(transform_statement(accumulators, s) for s in statement.else_statement_list),
+    )
+
+def transform_array_variable_initialization_statement(accumulators, statement):
+    return CArrayVariableInitializationStatement(
+        variable=statement.variable,
+        items=tuple(transform_expression(accumulators, i) for i in statement.items),
+    )
+
+def transform_symbol_array_variable_initialization_statement(accumulators, statement):
+    symbol_list_indices = []
+
+    for symbol in statement.symbol_list:
+        try:
+            symbol_list_index = accumulators.symbol_list.index(symbol)
+        except ValueError:
+            symbol_list_index = len(accumulators.symbol_list)
+            accumulators.symbol_list.append(symbol)
+
+        symbol_list_indices.append(symbol_list_index)
+
+    return CSymbolArrayVariableInitializationStatement(
+        variable=statement.variable,
+        symbol_list=statement.symbol_list,
+        symbol_list_indices=tuple(symbol_list_indices),
+    )
+
+def transform_variable_initialization_statement(accumulators, statement):
+    return CVariableInitializationStatement(
+        variable=statement.variable,
+        expression=transform_expression(accumulators, statement.expression),
+    )
+
+def transform_variable_reassignment_statement(accumulators, statement):
+    return CVariableReassignmentStatement(
+        variable=statement.variable,
+        expression=transform_expression(accumulators, statement.expression),
+    )
+
+def transform_function_definition_statement(accumulators, statement):
+    # TODO Allow defining the same function in different contexts
+    if any(fd.name == statement.name for fd in accumulators.function_definition_list):
+        raise Exception('A function with name "{}" already exists'.format(statement.name))
+
+    # TODO Add argument names to the symbol table
+    accumulators.function_definition_list.append(CFunctionDefinition(
+        name=statement.name,
+        argument_name_list=statement.argument_name_list,
+        statement_list=tuple(transform_statement(accumulators, s) for s in statement.statement_list)
+    ))
 
-        return CFunctionCallExpression(
-            name='builtin$' + function_call.function.value,
-            arguments=tuple(
-                transform_expression(accumulators, arg)
-                for arg in function_call.arguments
-            ),
-        )
+    return CFunctionDeclaration(name=statement.name)
 
-    raise Exception()
+def transform_push_statement(accumulators, statement):
+    return CPushStatement(expression=transform_expression(accumulators, statement.expression))
 
 def transform_statement(accumulators, statement):
     return {
-        parsing.FurAssignmentStatement: transform_assignment_statement,
-        parsing.FurFunctionCallExpression: transform_function_call_expression,
+        conversion.CPSArrayVariableInitializationStatement: transform_array_variable_initialization_statement,
+        conversion.CPSAssignmentStatement: transform_symbol_assignment_statement,
+        conversion.CPSExpressionStatement: transform_expression_statement,
+        conversion.CPSFunctionDefinitionStatement: transform_function_definition_statement,
+        conversion.CPSIfElseStatement: transform_if_else_statement,
+        conversion.CPSListAppendStatement: transform_list_append_statement,
+        conversion.CPSPushStatement: transform_push_statement,
+        conversion.CPSSymbolArrayVariableInitializationStatement: transform_symbol_array_variable_initialization_statement,
+        conversion.CPSVariableInitializationStatement: transform_variable_initialization_statement,
+        conversion.CPSVariableReassignmentStatement: transform_variable_reassignment_statement,
     }[type(statement)](accumulators, statement)
 
 
@@ -232,6 +365,9 @@ Accumulators = collections.namedtuple(
     'Accumulators',
     [
         'builtin_set',
+        'function_definition_list',
+        'lambda_number_list',
+        'operator_set',
         'symbol_list',
         'string_literal_list',
     ],
@@ -240,23 +376,28 @@ Accumulators = collections.namedtuple(
 def transform(program):
     accumulators = Accumulators(
         builtin_set=set(),
+        function_definition_list=[],
+        lambda_number_list=[],
+        operator_set=set(),
         symbol_list=[],
         string_literal_list=[],
     )
 
-    c_statements = [
+    statement_list = [
         transform_statement(accumulators, statement) for statement in program.statement_list
     ]
 
-    standard_libraries = set()
+    standard_library_set = set()
     for builtin in accumulators.builtin_set:
         for standard_library in BUILTINS[builtin]:
-            standard_libraries.add(standard_library)
+            standard_library_set.add(standard_library)
 
     return CProgram(
         builtin_set=accumulators.builtin_set,
-        statements=c_statements,
-        standard_libraries=standard_libraries,
+        function_definition_list=accumulators.function_definition_list,
+        operator_declarations=tuple(sorted(accumulators.operator_set)),
+        statements=statement_list,
+        standard_libraries=standard_library_set,
         string_literal_list=accumulators.string_literal_list,
         symbol_list=accumulators.symbol_list,
     )