Bash++
Bash++ compiler internal documentation
|
The main listener class for the Bash++ compiler. More...
#include <BashppListener.h>
Classes | |
struct | code_segment |
A struct to hold (compiled) code segments. More... | |
Public Member Functions | |
void | set_source_file (std::string source_file) |
void | set_include_paths (std::shared_ptr< std::vector< std::string >> include_paths) |
void | set_dynamic_linking (bool dynamic_linking) |
void | set_included (bool included) |
void | set_included_from (BashppListener *included_from) |
Sets the included_from pointer to the given listener. More... | |
void | set_errors () |
Sets the program_has_errors flag to true. More... | |
void | set_output_stream (std::shared_ptr< std::ostream > output_stream) |
void | set_output_file (std::string output_file) |
void | set_run_on_exit (bool run_on_exit) |
void | set_suppress_warnings (bool suppress_warnings) |
void | set_arguments (std::vector< char * > arguments) |
std::shared_ptr< bpp::bpp_program > | get_program () |
std::set< std::string > | get_included_files () |
std::stack< std::string > | get_include_stack () |
code_segment | generate_supershell_code (const std::string &code_to_run_in_supershell) |
Generates a supershell code segment for executing a bash command. More... | |
code_segment | generate_delete_code (std::shared_ptr< bpp::bpp_object > object, const std::string &object_reference_string, bool force_pointer=false) |
Generates a code segment for deleting an object. More... | |
code_segment | generate_method_call_code (const std::string &reference_code, const std::string &method_name, std::shared_ptr< bpp::bpp_class > assumed_class) |
Generates a code segment for calling a method. More... | |
code_segment | generate_dynamic_cast_code (const std::string &reference_code, const std::string &class_name) |
Generates a code segment for performing a dynamic cast. More... | |
void | enterProgram (BashppParser::ProgramContext *ctx) override |
void | exitProgram (BashppParser::ProgramContext *ctx) override |
void | enterInclude_statement (BashppParser::Include_statementContext *ctx) override |
void | exitInclude_statement (BashppParser::Include_statementContext *ctx) override |
void | enterClass_definition (BashppParser::Class_definitionContext *ctx) override |
void | exitClass_definition (BashppParser::Class_definitionContext *ctx) override |
void | enterMember_declaration (BashppParser::Member_declarationContext *ctx) override |
void | exitMember_declaration (BashppParser::Member_declarationContext *ctx) override |
void | enterObject_instantiation (BashppParser::Object_instantiationContext *ctx) override |
void | exitObject_instantiation (BashppParser::Object_instantiationContext *ctx) override |
void | enterPointer_declaration (BashppParser::Pointer_declarationContext *ctx) override |
void | exitPointer_declaration (BashppParser::Pointer_declarationContext *ctx) override |
void | enterValue_assignment (BashppParser::Value_assignmentContext *ctx) override |
void | exitValue_assignment (BashppParser::Value_assignmentContext *ctx) override |
void | enterMethod_definition (BashppParser::Method_definitionContext *ctx) override |
void | exitMethod_definition (BashppParser::Method_definitionContext *ctx) override |
void | enterConstructor_definition (BashppParser::Constructor_definitionContext *ctx) override |
void | exitConstructor_definition (BashppParser::Constructor_definitionContext *ctx) override |
void | enterDestructor_definition (BashppParser::Destructor_definitionContext *ctx) override |
void | exitDestructor_definition (BashppParser::Destructor_definitionContext *ctx) override |
void | enterSelf_reference (BashppParser::Self_referenceContext *ctx) override |
void | exitSelf_reference (BashppParser::Self_referenceContext *ctx) override |
void | enterSelf_reference_as_lvalue (BashppParser::Self_reference_as_lvalueContext *ctx) override |
void | exitSelf_reference_as_lvalue (BashppParser::Self_reference_as_lvalueContext *ctx) override |
void | enterStatement (BashppParser::StatementContext *ctx) override |
void | exitStatement (BashppParser::StatementContext *ctx) override |
void | enterClass_body_statement (BashppParser::Class_body_statementContext *ctx) override |
void | exitClass_body_statement (BashppParser::Class_body_statementContext *ctx) override |
void | enterGeneral_statement (BashppParser::General_statementContext *ctx) override |
void | exitGeneral_statement (BashppParser::General_statementContext *ctx) override |
void | enterObject_assignment (BashppParser::Object_assignmentContext *ctx) override |
void | exitObject_assignment (BashppParser::Object_assignmentContext *ctx) override |
void | enterPointer_dereference (BashppParser::Pointer_dereferenceContext *ctx) override |
void | exitPointer_dereference (BashppParser::Pointer_dereferenceContext *ctx) override |
void | enterObject_address (BashppParser::Object_addressContext *ctx) override |
void | exitObject_address (BashppParser::Object_addressContext *ctx) override |
void | enterObject_reference (BashppParser::Object_referenceContext *ctx) override |
void | exitObject_reference (BashppParser::Object_referenceContext *ctx) override |
void | enterObject_reference_as_lvalue (BashppParser::Object_reference_as_lvalueContext *ctx) override |
void | exitObject_reference_as_lvalue (BashppParser::Object_reference_as_lvalueContext *ctx) override |
void | enterNullptr_ref (BashppParser::Nullptr_refContext *ctx) override |
void | exitNullptr_ref (BashppParser::Nullptr_refContext *ctx) override |
void | enterNew_statement (BashppParser::New_statementContext *ctx) override |
void | exitNew_statement (BashppParser::New_statementContext *ctx) override |
void | enterDelete_statement (BashppParser::Delete_statementContext *ctx) override |
void | exitDelete_statement (BashppParser::Delete_statementContext *ctx) override |
void | enterDynamic_cast_statement (BashppParser::Dynamic_cast_statementContext *ctx) override |
void | exitDynamic_cast_statement (BashppParser::Dynamic_cast_statementContext *ctx) override |
void | enterSupershell (BashppParser::SupershellContext *ctx) override |
void | exitSupershell (BashppParser::SupershellContext *ctx) override |
void | enterSubshell (BashppParser::SubshellContext *ctx) override |
void | exitSubshell (BashppParser::SubshellContext *ctx) override |
void | enterDeprecated_subshell (BashppParser::Deprecated_subshellContext *ctx) override |
void | exitDeprecated_subshell (BashppParser::Deprecated_subshellContext *ctx) override |
void | enterBash_arithmetic (BashppParser::Bash_arithmeticContext *ctx) override |
void | exitBash_arithmetic (BashppParser::Bash_arithmeticContext *ctx) override |
void | enterString (BashppParser::StringContext *ctx) override |
void | exitString (BashppParser::StringContext *ctx) override |
void | enterSinglequote_string (BashppParser::Singlequote_stringContext *ctx) override |
void | exitSinglequote_string (BashppParser::Singlequote_stringContext *ctx) override |
void | enterParameter (BashppParser::ParameterContext *ctx) override |
void | exitParameter (BashppParser::ParameterContext *ctx) override |
void | enterOther_statement (BashppParser::Other_statementContext *ctx) override |
void | exitOther_statement (BashppParser::Other_statementContext *ctx) override |
void | enterRaw_rvalue (BashppParser::Raw_rvalueContext *ctx) override |
void | exitRaw_rvalue (BashppParser::Raw_rvalueContext *ctx) override |
void | enterArray_value (BashppParser::Array_valueContext *ctx) override |
void | exitArray_value (BashppParser::Array_valueContext *ctx) override |
void | enterArray_index (BashppParser::Array_indexContext *ctx) override |
void | exitArray_index (BashppParser::Array_indexContext *ctx) override |
void | enterBash_if_statement (BashppParser::Bash_if_statementContext *ctx) override |
void | exitBash_if_statement (BashppParser::Bash_if_statementContext *ctx) override |
void | enterBash_if_root_branch (BashppParser::Bash_if_root_branchContext *ctx) override |
void | exitBash_if_root_branch (BashppParser::Bash_if_root_branchContext *ctx) override |
void | enterBash_if_else_branch (BashppParser::Bash_if_else_branchContext *ctx) override |
void | exitBash_if_else_branch (BashppParser::Bash_if_else_branchContext *ctx) override |
void | enterBash_if_condition (BashppParser::Bash_if_conditionContext *ctx) override |
void | exitBash_if_condition (BashppParser::Bash_if_conditionContext *ctx) override |
void | enterBash_case_statement (BashppParser::Bash_case_statementContext *ctx) override |
void | exitBash_case_statement (BashppParser::Bash_case_statementContext *ctx) override |
void | enterBash_case_pattern (BashppParser::Bash_case_patternContext *ctx) override |
void | exitBash_case_pattern (BashppParser::Bash_case_patternContext *ctx) override |
void | enterBash_case_pattern_header (BashppParser::Bash_case_pattern_headerContext *ctx) override |
void | exitBash_case_pattern_header (BashppParser::Bash_case_pattern_headerContext *ctx) override |
void | enterBash_while_loop (BashppParser::Bash_while_loopContext *ctx) override |
void | exitBash_while_loop (BashppParser::Bash_while_loopContext *ctx) override |
void | enterBash_while_condition (BashppParser::Bash_while_conditionContext *ctx) override |
void | exitBash_while_condition (BashppParser::Bash_while_conditionContext *ctx) override |
void | enterBash_for_loop (BashppParser::Bash_for_loopContext *ctx) override |
void | exitBash_for_loop (BashppParser::Bash_for_loopContext *ctx) override |
void | enterBash_for_header (BashppParser::Bash_for_headerContext *ctx) override |
void | exitBash_for_header (BashppParser::Bash_for_headerContext *ctx) override |
void | enterHeredoc (BashppParser::HeredocContext *ctx) override |
void | exitHeredoc (BashppParser::HeredocContext *ctx) override |
void | enterHeredoc_header (BashppParser::Heredoc_headerContext *ctx) override |
void | exitHeredoc_header (BashppParser::Heredoc_headerContext *ctx) override |
void | enterExtra_statement (BashppParser::Extra_statementContext *ctx) override |
void | exitExtra_statement (BashppParser::Extra_statementContext *ctx) override |
void | enterTerminal_token (BashppParser::Terminal_tokenContext *ctx) override |
void | exitTerminal_token (BashppParser::Terminal_tokenContext *ctx) override |
Private Member Functions | |
bool | is_protected_keyword (const std::string &keyword) |
Private Attributes | |
std::string | source_file |
Path to the source file being compiled (used for error reporting) More... | |
bool | included = false |
std::shared_ptr< std::vector< std::string > > | include_paths = nullptr |
A list of paths to search for included files. More... | |
bool | dynamic_linking = false |
bool | suppress_warnings = false |
std::set< std::string > | included_files = {} |
A set of (unique) included files (used for '@include_once' directives) More... | |
BashppListener * | included_from = nullptr |
std::stack< std::string > | include_stack |
A chain of included files, from the main file to the current file (used for error reporting) More... | |
std::shared_ptr< std::ostream > | output_stream |
Pointer to the output stream to write the compiled code to. More... | |
std::string | output_file |
bool | run_on_exit = false |
std::vector< char * > | arguments = {} |
Command-line arguments to pass to the compiled program if run_on_exit is true. More... | |
std::shared_ptr< bpp::bpp_program > | program = std::make_shared<bpp::bpp_program>() |
bool | in_comment = false |
bool | in_singlequote_string = false |
bool | in_while_condition = false |
std::shared_ptr< bpp::bash_while_condition > | current_while_condition = nullptr |
std::stack< std::shared_ptr< bpp::bpp_entity > > | entity_stack |
A stack to keep track of the current entity being processed. More... | |
std::shared_ptr< bpp::bpp_class > | primitive |
bool | error_thrown = false |
antlr4::ParserRuleContext * | error_context = nullptr |
bool | program_has_errors = false |
Static Private Attributes | |
static constexpr const char * | protected_keywords [] |
The main listener class for the Bash++ compiler.
This class is the main listener for the Bash++ compiler. This is where the main logic for the compiler is implemented by walking the parse tree generated by the ANTLR parser.
The listener is responsible for generating the compiled Bash code from the parsed Bash++ code. The listener is also responsible for handling errors and warnings.
A brief run-down of how the parse tree works:
When we enter a node in the parse tree, we execute the enter* function for that node. When we exit a node in the parse tree, we execute the exit* function for that node.
|
override |
Array indices take the form: [...] Where the contents of the brackets are the array index And can be any valid sequence of statements
|
override |
Array values are rvalues in assignment operations which take the form (...) Where the contents of the parentheses are the array elements Empty arrays are written as ()
|
override |
Bash arithmetic is a series of arithmetic operations that are enclosed in $((...)) They do not run in a subshell. So, unlike with the subshell rule, We can preserve objects instantiated within the arithmetic context, etc
|
override |
|
override |
|
override |
Bash case statements take the form case (something) in pattern1) ... ;; ... esac
The code to handle each pattern will be caught by the Bash_case_pattern context These will be children of the Bash_case_statement context in the parse tree
The patterns to be matched will be caught by the Bash_case_pattern_header context These will be children of the Bash_case_pattern context in the parse tree
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
Bash if statement take the form if CONDITION; then ... elif CONDITION; then ... else ... fi
The elif/else branches will be caught by the Bash_if_root_branch and Bash_if_else_branch contexts Both of those will be children of the Bash_if_statement context in the parse tree
The only thing that we need to be careful about is this: All of the pre-code which is generated INSIDE of the if CONDITION Should be placed before the if statement altogether, not only before the condition Likewise all of the post-code for the condition should be placed after the if statement
For example, consider the following code: if [[ -f "@this.filePath" ]]; then ... elif [[ -f "@this.otherFilePath" ]]; then ... fi
Pre-code has to be generated in order to access @this.filePath and @this.otherFilePath The pre-code converts these references into ordinary variable references which we can substitute directly into the if condition As in, for example, swapping 'if [[ -f "@this.filePath" ]]' with 'if [[ -f "$filePath" ]]' Although we have better naming conventions for the variables, this is just an example
If we weren't careful, and just placed the pre-code the way we always do, we would end up with something like this: $filePath={whatever we need to do to access @this.filePath} if [[ -f "$filePath" ]]; then ... $otherFilePath={whatever we need to do to access @this.otherFilePath} elif [[ -f "$otherFilePath" ]]; then ... fi
As you can tell from the above, the $otherFilePath assignment is INSIDE the first branch of the if statement And therefore is completely useless – if the first branch is taken, the second branch will never be taken And in the event that the second branch IS taken, $otherFilePath will not be defined
So, what we have to do instead is a bit more like: $filePath={whatever we need to do to access @this.filePath} $otherFilePath={whatever we need to do to access @this.otherFilePath} if [[ -f "$filePath" ]]; then ... elif [[ -f "$otherFilePath" ]]; then ... fi
|
override |
|
override |
|
override |
|
override |
|
override |
Constructor definitions take the form @constructor { ... }
|
override |
Delete statements take the form @delete @object Where object is the name of the object to delete
This statement calls the __delete function for the object and the object's destructor if it exists If the destructor exists, it will be called first (before __delete) It then unsets the object
|
override |
|
override |
Destructor definitions take the form @destructor { ... }
|
override |
Dynamic cast statements take the form @dynamic_cast<ClassName> Object Where ClassName is the name of the class to cast to And Object is the object to cast
This statement performs a runtime check to verify the cast is valid And substitutes either the address of the cast object or the @nullptr value
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
This will either be:
|
override |
|
override |
New statements take the form @new ClassName Where ClassName is the name of the class to instantiate
This statement creates a new object of the specified class And replaces the "@new ClassName" statement with the address of the new object
|
override |
Nullptr references take the form @nullptr
This reference will be replaced with the value of the nullptr constant
|
override |
Object addresses take the form &@IDENTIFIER.IDENTIFIER... Or &@this.IDENTIFIER.IDENTIFIER...
This reference will be replaced with the memory address of the object
|
override |
|
override |
The object type will be stored in one of either IDENTIFIER_LVALUE or IDENTIFIER(0) If IDENTIFIER_LVALUE, then the object name will be in IDENTIFIER(0) If IDENTIFIER(0), then the object name will be in IDENTIFIER(1)
|
override |
Object references take the form @IDENTIFIER.IDENTIFIER.IDENTIFIER... Where each IDENTIFIER following a dot is a member of the object referenced by the preceding IDENTIFIER
This reference may resolve to either an object or a method If it's a primitive object, treat this as an rvalue and get the value of the primitive object If it's a non-primitive object, this is a method call to .toPrimitive If it's a method, call the method in a supershell and substitute the result
|
override |
Lvalue object references take the form @IDENTIFIER_LVALUE.IDENTIFIER.IDENTIFIER... Where each IDENTIFIER following a dot is a member of the object referenced by the preceding IDENTIFIER
This reference may resolve to either an object or a method If it's a primitive object, replace the reference with the address of the primitive object If it's a non-primitive object, this is a method call to .toPrimitive If it's a method, replace the reference with a call to the method There is no need to call the method in a supershell for lvalues. We can (and must) just call it directly
|
override |
|
override |
|
override |
The pointer type will be stored in one of either IDENTIFIER_LVALUE or IDENTIFIER(0) If IDENTIFIER_LVALUE, then the pointer name will be in IDENTIFIER(0) If IDENTIFIER(0), then the pointer name will be in IDENTIFIER(1)
|
override |
Pointer dereferences take the form *@IDENTIFIER.IDENTIFIER... Or *@this.IDENTIFIER.IDENTIFIER... The result should be the object pointed to by the pointer For instance, @MyClass myObject=*@myPointer Should copy the object pointed to by myPointer into myObject Or: var=*@myPointer Should store the output of the object's toPrimitive method in var
|
override |
|
override |
|
override |
Self references take the form @this.IDENTIFIER.IDENTIFIER... Where each IDENTIFIER following a dot is a member of the object referenced by the preceding IDENTIFIER
This reference may resolve to either an object or a method If it's a primitive object, treat this as an rvalue and get the value of the primitive object If it's a non-primitive object, this is a method call to .toPrimitive If it's a method, call the method in a supershell and substitute the result
|
override |
Self references take the form @this.IDENTIFIER.IDENTIFIER... Where each IDENTIFIER following a dot is a member of the object referenced by the preceding IDENTIFIER
This reference may resolve to either an object or a method If it's a primitive object, replace the reference with the address of the primitive object If it's a non-primitive object, this is a method call to .toPrimitive If it's a method, replace the reference with a call to the method There is no need to call the method in a supershell for lvalues. We can (and must) just call it directly
|
override |
|
override |
|
override |
|
override |
|
override |
Supershells take the form @(...) Where ... is a series of commands to be executed in a supershell Supershells can be nested
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
Suppose we have an 'object' with a datamember 'array' which is an array of primitives Accessing index 'i' of that array would, in Bash++, take the form: @object.array[$i] And the compiled code's version of the reference: ${bpp__objectClass__object__array[$i]}
Suppose however that 'object' has a non-primitive datamember 'inner' which has a datamember 'array' which is an array of primitives (In this case, we're nesting – the array is not a datamember of 'object', but of 'object.inner') Accessing index 'i' of that array would, in Bash++, take the form: @object.inner.array[$i] But the compiled code's version of the reference would have to take a slightly different form, Since we have to dereference the pointer to 'inner' before we can access 'array': bpp__objectClass__object__inner__array=${bpp__objectClass__object__inner}__array This "bpp__objectClass__object__inner__array" evaluates to a STRING which is the variable name where the array is actually stored We then have to evaluate that string to get the actual values stored in the array: bpp__objectClass__object__inner__arrayString="${bpp__objectClass__object__inner__array}[${i}]"
eval bpp__objectClass__object__inner__arrayIndex="\${${bpp__objectClass__object__inner__arrayString}"}"
So, we have to follow a different procedure based on whether or not we have to dereference a pointer
To make this code less disgraceful, at some point, object references should be re-worked altogether In the meantime, we can do a HACKY fix by checking the size of the IDENTIFIER list If it's greater than 2, we're guaranteed to have to dereference a pointer If it's not, we're guaranteed not to have to dereference a pointer (unless the very first identifier refers to a pointer)
TODO(@rail5): Fix this. Really just fix object references from the ground-up
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
|
override |
Value assignments will appear in the following contexts:
BashppListener::code_segment BashppListener::generate_delete_code | ( | std::shared_ptr< bpp::bpp_object > | object, |
const std::string & | object_reference_string, | ||
bool | force_pointer = false |
||
) |
Generates a code segment for deleting an object.
This function constructs a code segment to delete an object. The generated code includes:
object | The object to be deleted. |
object_reference_string | The string representing the object's reference in the compiled code. |
force_pointer | Whether to force the object to be treated as a pointer. |
BashppListener::code_segment BashppListener::generate_dynamic_cast_code | ( | const std::string & | reference_code, |
const std::string & | class_name | ||
) |
Generates a code segment for performing a dynamic cast.
This function constructs a code segment to perform a dynamic cast on an object. The generated code includes:
reference_code | The code representing the object reference |
class_name | The type to which we want to cast |
BashppListener::code_segment BashppListener::generate_method_call_code | ( | const std::string & | reference_code, |
const std::string & | method_name, | ||
std::shared_ptr< bpp::bpp_class > | assumed_class | ||
) |
Generates a code segment for calling a method.
This function constructs a code segment to call a method on an object. The generated code includes:
reference_code | The code representing the object reference. |
method_name | The name of the method to be called. |
assumed_class | The class to which the object is assumed to belong at compile-time. |
BashppListener::code_segment BashppListener::generate_supershell_code | ( | const std::string & | code_to_run_in_supershell | ) |
Generates a supershell code segment for executing a bash command.
This function constructs a code segment to run a specified command in a supershell. It creates a unique function name and output variable using a global counter. The generated code includes:
code_to_run_in_supershell | The bash command to be executed within the supershell. |
std::stack< std::string > BashppListener::get_include_stack | ( | ) |
std::set< std::string > BashppListener::get_included_files | ( | ) |
std::shared_ptr< bpp::bpp_program > BashppListener::get_program | ( | ) |
|
inlineprivate |
void BashppListener::set_arguments | ( | std::vector< char * > | arguments | ) |
void BashppListener::set_dynamic_linking | ( | bool | dynamic_linking | ) |
void BashppListener::set_errors | ( | ) |
Sets the program_has_errors flag to true.
This function is called when a syntax error is encountered during parsing.
void BashppListener::set_include_paths | ( | std::shared_ptr< std::vector< std::string >> | include_paths | ) |
void BashppListener::set_included | ( | bool | included | ) |
void BashppListener::set_included_from | ( | BashppListener * | included_from | ) |
Sets the included_from pointer to the given listener.
void BashppListener::set_output_file | ( | std::string | output_file | ) |
void BashppListener::set_output_stream | ( | std::shared_ptr< std::ostream > | output_stream | ) |
void BashppListener::set_run_on_exit | ( | bool | run_on_exit | ) |
void BashppListener::set_source_file | ( | std::string | source_file | ) |
void BashppListener::set_suppress_warnings | ( | bool | suppress_warnings | ) |
|
private |
Command-line arguments to pass to the compiled program if run_on_exit is true.
|
private |
|
private |
|
private |
A stack to keep track of the current entity being processed.
For example, when we encounter a class definition, we push the class onto the entity_stack. Then, inside that class, when we encounter a method definition, we push the method onto the entity_stack. Inside that method, when we encounter a value assignment, we push the value assignment onto the entity_stack. When we're done with the value assignment, we pop it off the entity_stack, so that the method is now at the top of the stack. When we're done with the method, we pop it off the entity_stack, so that the class is now at the top of the stack. When we're done with the class, we pop it off the entity_stack, so that the program is now at the top of the stack.
|
private |
|
private |
|
private |
|
private |
|
private |
|
private |
A list of paths to search for included files.
|
private |
A chain of included files, from the main file to the current file (used for error reporting)
|
private |
|
private |
A set of (unique) included files (used for '@include_once' directives)
|
private |
|
private |
|
private |
Pointer to the output stream to write the compiled code to.
|
private |
|
private |
|
private |
|
staticconstexprprivate |
|
private |
|
private |
Path to the source file being compiled (used for error reporting)
|
private |