import collections
-import parsing
+import normalization
+import parsing # TODO Remove this import, as we should be normalizing everything before it gets here
CIntegerLiteral = collections.namedtuple(
'CIntegerLiteral',
CStringLiteral = collections.namedtuple(
'CStringLiteral',
[
+ 'index',
'value',
],
)
-CAdditionExpression = collections.namedtuple(
- 'CAdditionExpression',
+CVariableExpression = collections.namedtuple(
+ 'CVariableExpression',
[
- 'left',
- 'right',
+ 'variable',
],
)
-CSubtractionExpression = collections.namedtuple(
- 'CSubtractionExpression',
+CSymbolExpression = collections.namedtuple(
+ 'CSymbolExpression',
[
- 'left',
- 'right',
+ 'symbol',
+ 'symbol_list_index',
],
)
-CMultiplicationExpression = collections.namedtuple(
- 'CMultiplicationExpression',
+CStructureLiteralExpression = collections.namedtuple(
+ 'CStructureLiteralExpression',
[
- 'left',
- 'right',
+ 'field_count',
+ 'symbol_list_variable',
+ 'value_list_variable',
],
)
-CIntegerDivisionExpression = collections.namedtuple(
- 'CIntegerDivisionExpression',
+CDotExpression = collections.namedtuple(
+ 'CDotExpression',
[
- 'left',
- 'right',
+ 'instance',
+ 'symbol',
+ 'symbol_list_index',
],
)
-CModularDivisionExpression = collections.namedtuple(
- 'CModularDivisionExpression',
+CNegationExpression = collections.namedtuple(
+ 'CNegationExpression',
[
- 'left',
- 'right',
+ 'value',
],
)
-CFunctionCallStatement = collections.namedtuple(
- 'CFunctionCallStatement',
+CFunctionCallForFurInfixOperator = collections.namedtuple(
+ 'CFunctionCallForFurInfixOperator',
[
+ 'metadata',
'name',
- 'arguments',
+ ],
+)
+
+CPushStatement = collections.namedtuple(
+ 'CPushStatement',
+ (
+ 'expression',
+ ),
+)
+
+CFunctionCallExpression = collections.namedtuple(
+ 'CFunctionCallExpression',
+ [
+ 'function_expression',
+ 'argument_count',
+ ],
+)
+
+# TODO We are currently not changing variables, just preventing them from being accessed.
+CSymbolAssignmentStatement = collections.namedtuple(
+ 'CSymbolAssignmentStatement',
+ [
+ 'target',
+ 'target_symbol_list_index',
+ 'expression',
+ ],
+)
+
+CArrayVariableInitializationStatement = collections.namedtuple(
+ 'CArrayVariableInitializationStatement',
+ [
+ 'variable',
+ 'items',
+ ],
+)
+
+CSymbolArrayVariableInitializationStatement = collections.namedtuple(
+ 'CSymbolArrayVariableInitializationStatement',
+ [
+ 'variable',
+ 'symbol_list',
+ 'symbol_list_indices',
+ ],
+)
+
+CVariableInitializationStatement = collections.namedtuple(
+ 'CVariableInitializationStatement',
+ [
+ 'variable',
+ 'expression',
+ ],
+)
+
+CVariableReassignmentStatement = collections.namedtuple(
+ 'CVariableReassignmentStatement',
+ [
+ 'variable',
+ 'expression',
+ ],
+)
+
+CExpressionStatement = collections.namedtuple(
+ 'CExpressionStatement',
+ [
+ 'expression',
+ ],
+)
+
+CIfElseStatement = collections.namedtuple(
+ 'CIfElseStatement',
+ [
+ 'condition_expression',
+ 'if_statement_list',
+ 'else_statement_list',
+ ],
+)
+
+CFunctionDeclaration = collections.namedtuple(
+ 'CFunctionDeclaration',
+ [
+ 'name',
+ ],
+)
+
+# TODO If a function definition doesn't end with an expression, we currently have issues because we try to return a statement.
+# TODO Closures currently wrap the entire defining environment, even symbols that are not used, which makes garbage collection ineffective.
+CFunctionDefinition = collections.namedtuple(
+ 'CFunctionDefinition',
+ [
+ 'name',
+ 'argument_name_list',
+ 'statement_list',
],
)
CProgram = collections.namedtuple(
'CProgram',
[
- 'builtins',
+ 'builtin_set',
+ 'function_definition_list',
+ 'operator_declarations',
'statements',
'standard_libraries',
+ 'string_literal_list',
+ 'symbol_list',
],
)
BUILTINS = {
- 'print': ['stdio.h.'],
+ 'concatenate': [],
+ 'false': [],
+ 'pow': ['math.h'],
+ 'print': ['stdio.h'],
+ 'true': [],
}
-def transform_expression(builtin_dependencies, expression):
+def transform_variable_expression(accumulators, expression):
+ assert isinstance(expression, normalization.NormalVariableExpression)
+ return CVariableExpression(variable=expression.variable)
- LITERAL_TYPE_MAPPING = {
- parsing.FurIntegerLiteralExpression: CIntegerLiteral,
- parsing.FurStringLiteralExpression: CStringLiteral,
- }
+def transform_string_literal_expression(accumulators, expression):
+ value = expression.string
- if type(expression) in LITERAL_TYPE_MAPPING:
- return LITERAL_TYPE_MAPPING[type(expression)](value=expression.value)
+ try:
+ index = accumulators.string_literal_list.index(value)
+ except ValueError:
+ index = len(accumulators.string_literal_list)
+ accumulators.string_literal_list.append(value)
- INFIX_TYPE_MAPPING = {
- parsing.FurAdditionExpression: CAdditionExpression,
- parsing.FurSubtractionExpression: CSubtractionExpression,
- parsing.FurMultiplicationExpression: CMultiplicationExpression,
- parsing.FurIntegerDivisionExpression: CIntegerDivisionExpression,
- parsing.FurModularDivisionExpression: CModularDivisionExpression,
- }
+ return CStringLiteral(index=index, value=value)
- return INFIX_TYPE_MAPPING[type(expression)](
- left=transform_expression(builtin_dependencies, expression.left),
- right=transform_expression(builtin_dependencies, expression.right),
+def transform_symbol_expression(accumulators, expression):
+ if expression.symbol in BUILTINS:
+ accumulators.builtin_set.add(expression.symbol)
+
+ try:
+ symbol_list_index = accumulators.symbol_list.index(expression.symbol)
+ except ValueError:
+ symbol_list_index = len(accumulators.symbol_list)
+ accumulators.symbol_list.append(expression.symbol)
+
+ return CSymbolExpression(
+ symbol=expression.symbol,
+ symbol_list_index=symbol_list_index,
+ )
+
+CInfixDeclaration = collections.namedtuple(
+ 'CInfixDeclaration',
+ [
+ 'name',
+ 'in_type',
+ 'out_type',
+ 'operator',
+ ],
+)
+
+FUR_INFIX_OPERATOR_TO_C_FUNCTION = {
+ '++': 'concatenate',
+}
+
+FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR = {
+ '+': CInfixDeclaration(name='add', in_type='integer', out_type='integer', operator='+'),
+ '-': CInfixDeclaration(name='subtract', in_type='integer', out_type='integer', operator='-'),
+ '*': CInfixDeclaration(name='multiply', in_type='integer', out_type='integer', operator='*'),
+ '//': CInfixDeclaration(name='integerDivide', in_type='integer', out_type='integer', operator='/'),
+ '%': CInfixDeclaration(name='modularDivide', in_type='integer', out_type='integer', operator='%'),
+ 'and': CInfixDeclaration(name='and', in_type='boolean', out_type='boolean', operator='&&'),
+ 'or': CInfixDeclaration(name='or', in_type='boolean', out_type='boolean', operator='||'),
+ '==': CInfixDeclaration(name='equals', in_type='integer', out_type='boolean', operator='=='),
+ '!=': CInfixDeclaration(name='notEquals', in_type='integer', out_type='boolean', operator='!='),
+ '<=': CInfixDeclaration(name='lessThanOrEqual', in_type='integer', out_type='boolean', operator='<='),
+ '>=': CInfixDeclaration(name='greaterThanOrEqual', in_type='integer', out_type='boolean', operator='>='),
+ '<': CInfixDeclaration(name='lessThan', in_type='integer', out_type='boolean', operator='<'),
+ '>': CInfixDeclaration(name='greaterThan', in_type='integer', out_type='boolean', operator='>'),
+}
+
+def transform_infix_operator_without_c_equivalent(accumulators, expression):
+    """Transform a Fur infix operator that has no native C infix operator.
+
+    Such operators are emitted as calls to a named C function. The name is
+    looked up in FUR_INFIX_OPERATOR_TO_C_FUNCTION by the expression's
+    operator, so the mapping table stays the single source of truth.
+
+    accumulators is accepted for signature parity with the other
+    transform_* handlers; it is not read here.
+
+    Raises KeyError if expression.operator is not in
+    FUR_INFIX_OPERATOR_TO_C_FUNCTION.
+    """
+    return CFunctionCallForFurInfixOperator(
+        metadata=expression.metadata,
+        # Previously hard-coded to 'concatenate', which would have been
+        # wrong for any other operator added to the mapping.
+        name=FUR_INFIX_OPERATOR_TO_C_FUNCTION[expression.operator],
     )
-def transform_function_call_statement(builtin_dependencies, function_call):
- if function_call.name in BUILTINS.keys():
- builtin_dependencies.add(function_call.name)
+def transform_infix_expression(accumulators, expression):
+ if expression.operator in FUR_INFIX_OPERATOR_TO_C_FUNCTION:
+ return transform_infix_operator_without_c_equivalent(accumulators, expression)
- return CFunctionCallStatement(
- name='builtin$' + function_call.name,
- arguments=tuple(transform_expression(builtin_dependencies, arg) for arg in function_call.arguments),
- )
+ accumulators.operator_set.add(FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR[expression.operator])
- raise Exception()
+ return CFunctionCallForFurInfixOperator(
+ metadata=expression.metadata,
+ name=FUR_INFIX_OPERATOR_TO_C_INFIX_OPERATOR[expression.operator].name,
+ )
+
+def transform_integer_literal_expression(accumulators, expression):
+ return CIntegerLiteral(value=expression.integer)
+
+def transform_negation_expression(accumulators, expression):
+ return CNegationExpression(
+ value=transform_expression(accumulators, expression.internal_expression),
+ )
+
+CListConstructExpression = collections.namedtuple(
+ 'CListConstructExpression',
+ [
+ 'allocate',
+ ],
+)
+
+CListAppendStatement = collections.namedtuple(
+ 'CListAppendStatement',
+ [
+ 'list_expression',
+ 'item_expression',
+ ],
+)
+
+CListGetExpression = collections.namedtuple(
+ 'CListGetExpression',
+ [
+ 'list_expression',
+ 'index_expression',
+ ],
+)
+
+def transform_structure_literal_expression(accumulators, expression):
+ return CStructureLiteralExpression(
+ field_count=expression.field_count,
+ symbol_list_variable=expression.symbol_list_variable,
+ value_list_variable=expression.value_list_variable,
+ )
+
+def transform_dot_expression(accumulators, expression):
+ try:
+ symbol_list_index = accumulators.symbol_list.index(expression.field)
+
+ except ValueError:
+ symbol_list_index = len(accumulators.symbol_list)
+ accumulators.symbol_list.append(expression.field)
+
+ return CDotExpression(
+ instance=transform_variable_expression(accumulators, expression.instance),
+ symbol=expression.field,
+ symbol_list_index=symbol_list_index,
+ )
+
+def transform_list_construct_expression(accumulators, expression):
+ return CListConstructExpression(allocate=expression.allocate)
+
+def transform_list_get_expression(accumulators, expression):
+ return CListGetExpression(
+ list_expression=transform_expression(accumulators, expression.list_expression),
+ index_expression=transform_expression(accumulators, expression.index_expression),
+ )
+
+def transform_list_append_statement(accumulators, expression):
+ return CListAppendStatement(
+ list_expression=transform_expression(accumulators, expression.list_expression),
+ item_expression=transform_expression(accumulators, expression.item_expression),
+ )
+
+def transform_expression(accumulators, expression):
+ # TODO Clean up handlers for parsing expressions
+ return {
+ parsing.FurInfixExpression: transform_infix_expression,
+ parsing.FurIntegerLiteralExpression: transform_integer_literal_expression,
+ parsing.FurNegationExpression: transform_negation_expression,
+ parsing.FurStringLiteralExpression: transform_string_literal_expression,
+ normalization.NormalDotExpression: transform_dot_expression,
+ normalization.NormalFunctionCallExpression: transform_function_call_expression,
+ normalization.NormalInfixExpression: transform_infix_expression,
+ normalization.NormalIntegerLiteralExpression: transform_integer_literal_expression,
+ normalization.NormalListConstructExpression: transform_list_construct_expression,
+ normalization.NormalListGetExpression: transform_list_get_expression,
+ normalization.NormalNegationExpression: transform_negation_expression,
+ normalization.NormalStructureLiteralExpression: transform_structure_literal_expression,
+ normalization.NormalStringLiteralExpression: transform_string_literal_expression,
+ normalization.NormalSymbolExpression: transform_symbol_expression,
+ normalization.NormalVariableExpression: transform_variable_expression,
+ }[type(expression)](accumulators, expression)
+
+def transform_symbol_assignment_statement(accumulators, assignment_statement):
+ # TODO Check that target is not a builtin
+ try:
+ symbol_list_index = accumulators.symbol_list.index(assignment_statement.target)
+ except ValueError:
+ symbol_list_index = len(accumulators.symbol_list)
+ accumulators.symbol_list.append(assignment_statement.target)
+
+ return CSymbolAssignmentStatement(
+ target=assignment_statement.target,
+ target_symbol_list_index=symbol_list_index,
+ expression=transform_expression(
+ accumulators,
+ assignment_statement.expression,
+ ),
+ )
+
+def transform_function_call_expression(accumulators, function_call):
+ # TODO Use the symbol from SYMBOL LIST
+ return CFunctionCallExpression(
+ function_expression=transform_expression(accumulators, function_call.function_expression),
+ argument_count=function_call.argument_count,
+ )
+
+def transform_expression_statement(accumulators, statement):
+ return CExpressionStatement(
+ expression=transform_expression(accumulators, statement.expression),
+ )
+
+def transform_if_else_statement(accumulators, statement):
+ return CIfElseStatement(
+ condition_expression=transform_expression(accumulators, statement.condition_expression),
+ if_statement_list=tuple(transform_statement(accumulators, s) for s in statement.if_statement_list),
+ else_statement_list=tuple(transform_statement(accumulators, s) for s in statement.else_statement_list),
+ )
+
+def transform_array_variable_initialization_statement(accumulators, statement):
+ return CArrayVariableInitializationStatement(
+ variable=statement.variable,
+ items=tuple(transform_expression(accumulators, i) for i in statement.items),
+ )
+
+def transform_symbol_array_variable_initialization_statement(accumulators, statement):
+ symbol_list_indices = []
+
+ for symbol in statement.symbol_list:
+ try:
+ symbol_list_index = accumulators.symbol_list.index(symbol)
+ except ValueError:
+ symbol_list_index = len(accumulators.symbol_list)
+ accumulators.symbol_list.append(symbol)
+
+ symbol_list_indices.append(symbol_list_index)
+
+ return CSymbolArrayVariableInitializationStatement(
+ variable=statement.variable,
+ symbol_list=statement.symbol_list,
+ symbol_list_indices=tuple(symbol_list_indices),
+ )
+
+def transform_variable_initialization_statement(accumulators, statement):
+ return CVariableInitializationStatement(
+ variable=statement.variable,
+ expression=transform_expression(accumulators, statement.expression),
+ )
+
+def transform_variable_reassignment_statement(accumulators, statement):
+ return CVariableReassignmentStatement(
+ variable=statement.variable,
+ expression=transform_expression(accumulators, statement.expression),
+ )
+
+def transform_function_definition_statement(accumulators, statement):
+ # TODO Allow defining the same function in different contexts
+ if any(fd.name == statement.name for fd in accumulators.function_definition_list):
+ raise Exception('A function with name "{}" already exists'.format(statement.name))
+
+ # TODO Add argument names to the symbol table
+ accumulators.function_definition_list.append(CFunctionDefinition(
+ name=statement.name,
+ argument_name_list=statement.argument_name_list,
+ statement_list=tuple(transform_statement(accumulators, s) for s in statement.statement_list)
+ ))
+
+ return CFunctionDeclaration(name=statement.name)
+
+def transform_push_statement(accumulators, statement):
+ return CPushStatement(expression=transform_expression(accumulators, statement.expression))
+
+def transform_statement(accumulators, statement):
+ return {
+ parsing.FurExpressionStatement: transform_expression_statement,
+ normalization.NormalArrayVariableInitializationStatement: transform_array_variable_initialization_statement,
+ normalization.NormalAssignmentStatement: transform_symbol_assignment_statement,
+ normalization.NormalExpressionStatement: transform_expression_statement,
+ normalization.NormalFunctionDefinitionStatement: transform_function_definition_statement,
+ normalization.NormalIfElseStatement: transform_if_else_statement,
+ normalization.NormalListAppendStatement: transform_list_append_statement,
+ normalization.NormalPushStatement: transform_push_statement,
+ normalization.NormalSymbolArrayVariableInitializationStatement: transform_symbol_array_variable_initialization_statement,
+ normalization.NormalVariableInitializationStatement: transform_variable_initialization_statement,
+ normalization.NormalVariableReassignmentStatement: transform_variable_reassignment_statement,
+ }[type(statement)](accumulators, statement)
+
+
+Accumulators = collections.namedtuple(
+ 'Accumulators',
+ [
+ 'builtin_set',
+ 'function_definition_list',
+ 'operator_set',
+ 'symbol_list',
+ 'string_literal_list',
+ ],
+)
def transform(program):
- builtins = set()
+ accumulators = Accumulators(
+ builtin_set=set(),
+ function_definition_list=[],
+ operator_set=set(),
+ symbol_list=[],
+ string_literal_list=[],
+ )
- c_statements = [
- transform_function_call_statement(builtins, statement) for statement in program.statement_list
+ statement_list = [
+ transform_statement(accumulators, statement) for statement in program.statement_list
]
- standard_libraries = set()
- for builtin in builtins:
+ standard_library_set = set()
+ for builtin in accumulators.builtin_set:
for standard_library in BUILTINS[builtin]:
- standard_libraries.add(standard_library)
+ standard_library_set.add(standard_library)
return CProgram(
- builtins=builtins,
- statements=c_statements,
- standard_libraries=standard_libraries,
+ builtin_set=accumulators.builtin_set,
+ function_definition_list=accumulators.function_definition_list,
+ operator_declarations=tuple(sorted(accumulators.operator_set)),
+ statements=statement_list,
+ standard_libraries=standard_library_set,
+ string_literal_list=accumulators.string_literal_list,
+ symbol_list=accumulators.symbol_list,
)