// See the file "COPYING" in the toplevel directory for copyright. #include "Gen-ZAM.h" #include #include #include using namespace std; // Helper functions to convert dashes to underscores or vice versa. static char dash_to_under(char c) { return c == '-' ? '_' : c; } static char under_to_dash(char c) { return c == '_' ? '-' : c; } // Structure for binding together Zeek script types, internal names Gen-ZAM // uses to track them, mnemonics for referring to them in instruction names, // the corresponding Val accessor, and whether the type requires memory // management. struct TypeInfo { string tag; ZAM_ExprType et; string suffix; string accessor; // doesn't include "As" prefix or "()" suffix bool is_managed; }; static vector ZAM_type_info = { {"TYPE_ADDR", ZAM_EXPR_TYPE_ADDR, "A", "Addr", true}, {"TYPE_ANY", ZAM_EXPR_TYPE_ANY, "a", "Any", true}, {"TYPE_COUNT", ZAM_EXPR_TYPE_UINT, "U", "Count", false}, {"TYPE_DOUBLE", ZAM_EXPR_TYPE_DOUBLE, "D", "Double", false}, {"TYPE_FILE", ZAM_EXPR_TYPE_FILE, "f", "File", true}, {"TYPE_FUNC", ZAM_EXPR_TYPE_FUNC, "F", "Func", true}, {"TYPE_INT", ZAM_EXPR_TYPE_INT, "I", "Int", false}, {"TYPE_LIST", ZAM_EXPR_TYPE_LIST, "L", "List", true}, {"TYPE_OPAQUE", ZAM_EXPR_TYPE_OPAQUE, "O", "Opaque", true}, {"TYPE_PATTERN", ZAM_EXPR_TYPE_PATTERN, "P", "Pattern", true}, {"TYPE_RECORD", ZAM_EXPR_TYPE_RECORD, "R", "Record", true}, {"TYPE_STRING", ZAM_EXPR_TYPE_STRING, "S", "String", true}, {"TYPE_SUBNET", ZAM_EXPR_TYPE_SUBNET, "N", "SubNet", true}, {"TYPE_TABLE", ZAM_EXPR_TYPE_TABLE, "T", "Table", true}, {"TYPE_TYPE", ZAM_EXPR_TYPE_TYPE, "t", "Type", true}, {"TYPE_VECTOR", ZAM_EXPR_TYPE_VECTOR, "V", "Vector", true}, }; // Given a ZAM_ExprType, returns the corresponding TypeInfo. const TypeInfo& find_type_info(ZAM_ExprType et) { assert(et != ZAM_EXPR_TYPE_NONE); auto pred = [et](const TypeInfo& ti) -> bool { return ti.et == et; }; auto ti = std::find_if(ZAM_type_info.begin(), ZAM_type_info.end(), pred); assert(ti != ZAM_type_info.end()); return *ti; } // Given a ZAM_ExprType, return its ZVal accessor. Takes into account // some naming inconsistencies between ZVal's and Val's. string find_type_accessor(ZAM_ExprType et) { switch ( et ) { case ZAM_EXPR_TYPE_NONE: return ""; case ZAM_EXPR_TYPE_UINT: return "uint_val"; case ZAM_EXPR_TYPE_PATTERN: return "re_val"; default: { string acc = find_type_info(et).accessor; transform(acc.begin(), acc.end(), acc.begin(), ::tolower); return acc + "_val"; } } } // Maps ZAM operand types to pairs of (1) the C++ name used to declare // the operand in a method declaration, and (2) the variable name to // use for the operand. unordered_map> ArgsManager::ot_to_args = { {ZAM_OT_AUX, {"OpaqueVals*", "v"}}, {ZAM_OT_CONSTANT, {"const ConstExpr*", "c"}}, {ZAM_OT_EVENT_HANDLER, {"EventHandler*", "h"}}, {ZAM_OT_INT, {"int", "i"}}, {ZAM_OT_LIST, {"const ListExpr*", "l"}}, {ZAM_OT_RECORD_FIELD, {"const NameExpr*", "n"}}, {ZAM_OT_VAR, {"const NameExpr*", "n"}}, // The following gets special treatment. {ZAM_OT_ASSIGN_FIELD, {"const NameExpr*", "n"}}, }; ArgsManager::ArgsManager(const vector& ot, ZAM_InstClass zc) { int n = 0; bool add_field = false; for ( const auto& ot_i : ot ) { if ( ot_i == ZAM_OT_NONE ) { // it had better be the only operand type assert(ot.size() == 1); break; } if ( n++ == 0 && zc == ZIC_COND ) // Skip the conditional's nominal assignment slot. continue; // Start off the argument info using the usual case // of (1) same method parameter name as GenInst argument, // and (2) not requiring a record field. auto& arg_i = ot_to_args[ot_i]; Arg arg = {arg_i.second, arg_i.first, arg_i.second, false}; if ( ot_i == ZAM_OT_ASSIGN_FIELD ) { arg.is_field = true; if ( n == 1 ) { // special-case the parameter arg.decl_name = "flhs"; arg.decl_type = "const FieldLHSAssignExpr*"; } } args.emplace_back(move(arg)); } Differentiate(); } void ArgsManager::Differentiate() { // First, figure out which parameter names are used how often. map name_count; // how often the name apepars map usage_count; // how often the name's been used so far for ( auto& arg : args ) { auto& name = arg.param_name; if ( name_count.count(name) == 0 ) { name_count[name] = 1; usage_count[name] = 0; } else ++name_count[name]; } // Now for each name - whether appearing as an argument or in // a declaration - if it's used more than once, then differentiate // it. Note, some names only appear multiple times as arguments // when invoking methods, but not in the declarations of the methods // themselves. for ( auto& arg : args ) { auto& decl = arg.decl_name; auto& name = arg.param_name; bool decl_and_arg_same = decl == name; if ( name_count[name] == 1 ) continue; // it's unique auto n = to_string(++usage_count[name]); name += n; if ( decl_and_arg_same ) decl += n; } // Finally, build the full versions of the declaration and parameters. // Tracks how many record fields we're dealing with. int num_fields = 0; for ( auto& arg : args ) { if ( ! full_decl.empty() ) full_decl += ", "; full_decl += arg.decl_type + " " + arg.decl_name; if ( ! full_params.empty() ) full_params += ", "; full_params += arg.param_name; params.push_back(arg.param_name); if ( arg.is_field ) ++num_fields; } assert(num_fields <= 2); // Add in additional arguments/parameters for record fields. if ( num_fields == 1 ) full_params += ", field"; else if ( num_fields == 2 ) { full_decl += ", int field2"; full_params += ", field1, field2"; } } ZAM_OpTemplate::ZAM_OpTemplate(ZAMGen* _g, string _base_name) : g(_g), base_name(move(_base_name)) { // Make the base name viable in a C++ name. transform(base_name.begin(), base_name.end(), base_name.begin(), dash_to_under); cname = base_name; transform(cname.begin(), cname.end(), cname.begin(), ::toupper); } void ZAM_OpTemplate::Build() { op_loc = g->CurrLoc(); string line; while ( g->ScanLine(line) ) { if ( line.size() <= 1 ) break; auto words = g->SplitIntoWords(line); if ( words.empty() ) break; Parse(words[0], line, words); } } void ZAM_OpTemplate::Instantiate() { InstantiateOp(OperandTypes(), IncludesVectorOp()); } void ZAM_OpTemplate::UnaryInstantiate() { // First operand is always the frame slot to which this operation // assigns the result of the applying unary operator. vector ots = {ZAM_OT_VAR}; ots.resize(2); // Now build versions for a constant operand (maybe not actually // needed due to constant folding, but sometimes that gets deferred // to run-time) ... if ( ! NoConst() ) { ots[1] = ZAM_OT_CONSTANT; InstantiateOp(ots, IncludesVectorOp()); } // ... and for a variable (frame-slot) operand. ots[1] = ZAM_OT_VAR; InstantiateOp(ots, IncludesVectorOp()); } void ZAM_OpTemplate::Parse(const string& attr, const string& line, const Words& words) { int num_args = -1; // -1 = don't enforce int nwords = static_cast(words.size()); if ( attr == "type" ) { if ( nwords <= 1 ) g->Gripe("missing argument", line); num_args = 1; const char* types = words[1].c_str(); while ( *types ) { ZAM_OperandType ot = ZAM_OT_NONE; switch ( *types ) { case 'C': ot = ZAM_OT_CONSTANT; break; case 'F': ot = ZAM_OT_ASSIGN_FIELD; break; case 'H': ot = ZAM_OT_EVENT_HANDLER; break; case 'L': ot = ZAM_OT_LIST; break; case 'O': ot = ZAM_OT_AUX; break; case 'R': ot = ZAM_OT_RECORD_FIELD; break; case 'V': ot = ZAM_OT_VAR; break; case 'i': ot = ZAM_OT_INT; break; case 'X': ot = ZAM_OT_NONE; break; default: g->Gripe("bad operand type", words[1]); break; } AddOpType(ot); ++types; } } else if ( attr == "op1-read" ) { num_args = 0; SetOp1Flavor("OP1_READ"); } else if ( attr == "op1-read-write" ) { num_args = 0; SetOp1Flavor("OP1_READ_WRITE"); } else if ( attr == "op1-internal" ) { num_args = 0; SetOp1Flavor("OP1_INTERNAL"); } else if ( attr == "set-type" ) { num_args = 1; if ( nwords > 1 ) SetTypeParam(ExtractTypeParam(words[1])); } else if ( attr == "set-type2" ) { num_args = 1; if ( nwords > 1 ) SetType2Param(ExtractTypeParam(words[1])); } else if ( attr == "custom-method" ) SetCustomMethod(g->SkipWords(line, 1)); else if ( attr == "method-post" ) SetPostMethod(g->SkipWords(line, 1)); else if ( attr == "side-effects" ) { if ( nwords == 3 ) SetAssignmentLess(words[1], words[2]); else // otherwise shouldn't be any arguments num_args = 0; SetHasSideEffects(); } else if ( attr == "no-eval" ) { num_args = 0; SetNoEval(); } else if ( attr == "vector" ) { num_args = 0; SetIncludesVectorOp(); } else if ( attr == "assign-val" ) { num_args = 1; if ( words.size() > 1 ) SetAssignVal(words[1]); } else if ( attr == "eval" ) { AddEval(g->SkipWords(line, 1)); auto addl = GatherEval(); if ( ! addl.empty() ) AddEval(addl); } else if ( attr == "macro" ) g->ReadMacro(line); else g->Gripe("unknown template attribute", attr); if ( num_args >= 0 && num_args != nwords - 1 ) g->Gripe("extraneous or missing arguments", line); } string ZAM_OpTemplate::GatherEval() { string res; string l; while ( g->ScanLine(l) ) { if ( l.size() <= 1 || ! isspace(l.c_str()[0]) ) { g->PutBack(l); return res; } res += l; } return res; } int ZAM_OpTemplate::ExtractTypeParam(const string& arg) { if ( arg == "$$" ) return 1; if ( arg[0] != '$' ) g->Gripe("bad set-type parameter, should be $n", arg); int param = atoi(&arg[1]); if ( param <= 0 || param > 2 ) g->Gripe("bad set-type parameter, should be $1 or $2", arg); // Convert operand to underlying instruction element, i.e., add // one to account for the $$ assignment slot. return param + 1; } // Maps an operand type to a character mnemonic used to distinguish // it from others. unordered_map ZAM_OpTemplate::ot_to_char = { {ZAM_OT_AUX, 'O'}, {ZAM_OT_CONSTANT, 'C'}, {ZAM_OT_EVENT_HANDLER, 'H'}, {ZAM_OT_ASSIGN_FIELD, 'F'}, {ZAM_OT_INT, 'i'}, {ZAM_OT_LIST, 'L'}, {ZAM_OT_NONE, 'X'}, {ZAM_OT_RECORD_FIELD, 'R'}, {ZAM_OT_VAR, 'V'}, }; void ZAM_OpTemplate::InstantiateOp(const vector& ot, bool do_vec) { auto method = MethodName(ot); InstantiateOp(method, ot, ZIC_REGULAR); if ( IncludesFieldOp() ) InstantiateOp(method, ot, ZIC_FIELD); if ( do_vec ) InstantiateOp(method, ot, ZIC_VEC); if ( IsConditionalOp() ) InstantiateOp(method, ot, ZIC_COND); } void ZAM_OpTemplate::InstantiateOp(const string& method, const vector& ot, ZAM_InstClass zc) { string suffix = ""; if ( zc == ZIC_FIELD ) suffix = "_field"; else if ( zc == ZIC_VEC ) suffix = "_vec"; else if ( zc == ZIC_COND ) suffix = "_cond"; if ( ! IsInternalOp() ) InstantiateMethod(method, suffix, ot, zc); if ( IsAssignOp() ) InstantiateAssignOp(ot, suffix); else { InstantiateEval(ot, suffix, zc); if ( HasAssignmentLess() ) { auto op_string = "_" + OpSuffix(ot); auto op = g->GenOpCode(this, op_string); GenAssignmentlessVersion(op); } } } void ZAM_OpTemplate::GenAssignmentlessVersion(const string& op) { EmitTo(AssignFlavor); Emit("assignmentless_op[" + op + "] = " + AssignmentLessOp() + ";"); Emit("assignmentless_op_type[" + op + "] = " + AssignmentLessOpType() + ";"); } void ZAM_OpTemplate::InstantiateMethod(const string& m, const string& suffix, const vector& ot_orig, ZAM_InstClass zc) { if ( IsInternalOp() ) return; auto ot = ot_orig; if ( zc == ZIC_FIELD ) // Need to make room for the field offset. ot.emplace_back(ZAM_OT_INT); auto decls = MethodDeclare(ot, zc); EmitTo(MethodDecl); Emit("const ZAMStmt " + m + suffix + "(" + decls + ");"); EmitTo(MethodDef); Emit("const ZAMStmt ZAMCompiler::" + m + suffix + "(" + decls + ")"); BeginBlock(); InstantiateMethodCore(ot, suffix, zc); if ( HasPostMethod() ) Emit(GetPostMethod()); if ( ! HasCustomMethod() ) Emit("return AddInst(z);"); EndBlock(); NL(); } void ZAM_OpTemplate::InstantiateMethodCore(const vector& ot, const string& suffix, ZAM_InstClass zc) { if ( HasCustomMethod() ) { Emit(GetCustomMethod()); return; } assert(! ot.empty()); string full_suffix = "_" + OpSuffix(ot) + suffix; Emit("ZInstI z;"); if ( ot[0] == ZAM_OT_AUX ) { auto op = g->GenOpCode(this, full_suffix, zc); Emit("z = ZInstI(" + op + ");"); return; } if ( ot[0] == ZAM_OT_NONE ) { auto op = g->GenOpCode(this, full_suffix, zc); Emit("z = GenInst(" + op + ");"); return; } if ( ot.size() > 1 && ot[1] == ZAM_OT_AUX ) { auto op = g->GenOpCode(this, full_suffix, zc); Emit("z = ZInstI(" + op + ", Frame1Slot(n, " + op + "));"); return; } ArgsManager args(ot, zc); BuildInstruction(ot, args.Params(), full_suffix, zc); auto tp = GetTypeParam(); if ( tp > 0 ) Emit("z.SetType(" + args.NthParam(tp - 1) + "->GetType());"); auto tp2 = GetType2Param(); if ( tp2 > 0 ) Emit("z.t2 = " + args.NthParam(tp2 - 1) + "->GetType();"); } void ZAM_OpTemplate::BuildInstruction(const vector& ot, const string& params, const string& suffix, ZAM_InstClass zc) { auto op = g->GenOpCode(this, suffix, zc); Emit("z = GenInst(" + op + ", " + params + ");"); } void ZAM_OpTemplate::InstantiateEval(const vector& ot, const string& suffix, ZAM_InstClass zc) { auto eval = GetEval(); if ( ot.size() > 1 ) { // Check for use of "$1" to indicate the operand string op1; if ( ot[1] == ZAM_OT_CONSTANT ) op1 = "z.c"; else if ( ot[1] == ZAM_OT_VAR ) op1 = "frame[z.v2]"; eval = regex_replace(eval, regex("\\$1"), op1); } InstantiateEval(Eval, OpSuffix(ot) + suffix, eval, zc); } void ZAM_OpTemplate::InstantiateEval(EmitTarget et, const string& op_suffix, const string& eval, ZAM_InstClass zc) { auto op_code = g->GenOpCode(this, "_" + op_suffix, zc); EmitTo(et); Emit("case " + op_code + ":"); BeginBlock(); Emit(eval); EndBlock(); EmitUp("break;"); NL(); } void ZAM_OpTemplate::InstantiateAssignOp(const vector& ot, const string& suffix) { // First, create a generic version of the operand, which the // ZAM compiler uses to find specific-flavored versions. auto op_string = "_" + OpSuffix(ot); auto generic_op = g->GenOpCode(this, op_string); auto flavor_ind = "assignment_flavor[" + generic_op + "]"; EmitTo(AssignFlavor); Emit(flavor_ind + " = empty_map;"); auto eval = GetEval(); auto v = GetAssignVal(); for ( auto& ti : ZAM_type_info ) { auto op = g->GenOpCode(this, op_string + "_" + ti.suffix); if ( IsInternalOp() ) { EmitTo(AssignFlavor); Emit(flavor_ind + "[" + ti.tag + "] = " + op + ";"); if ( HasAssignmentLess() ) GenAssignmentlessVersion(op); } EmitTo(Eval); Emit("case " + op + ":"); BeginBlock(); GenAssignOpCore(ot, eval, ti.accessor, ti.is_managed); Emit("break;"); EndBlock(); } } void ZAM_OpTemplate::GenAssignOpCore(const vector& ot, const string& eval, const string& accessor, bool is_managed) { if ( HasAssignVal() ) { GenAssignOpValCore(eval, accessor, is_managed); return; } if ( ! eval.empty() ) g->Gripe("assign-op should not have an \"eval\"", eval); auto lhs_field = (ot[0] == ZAM_OT_ASSIGN_FIELD); auto rhs_field = lhs_field && ot.size() > 2 && (ot[2] == ZAM_OT_INT); auto constant_op = (ot[1] == ZAM_OT_CONSTANT); string rhs = constant_op ? "z.c" : "frame[z.v2]"; auto acc = ".As" + accessor + "()"; if ( accessor == "Any" && constant_op && ! rhs_field ) { // "any_val = constant" or "x$any_val = constant". // // These require special-casing, because to avoid going // through a CoerceToAny operation, we allow expressing // these directly. They don't fit with the usual assignment // paradigm since the RHS differs in type from the LHS. Emit("auto v = z.c.ToVal(z.t);"); if ( lhs_field ) { Emit("auto r = frame[z.v1].AsRecord();"); Emit("auto& f = r->RawField(z.v2);"); } else Emit("auto& f = frame[z.v1];"); Emit("zeek::Unref(f.ManagedVal());"); Emit("f = ZVal(v.release());"); } else if ( rhs_field ) { // The following is counter-intuitive, but comes from the // fact that we build out the instruction parameters as // an echo of the method parameters, and for this case that // means that the RHS field offset comes *before*, not after, // the LHS field offset. auto lhs_offset = constant_op ? 3 : 4; auto rhs_offset = lhs_offset - 1; Emit("auto v = " + rhs + ".AsRecord()->RawOptField(z.v" + to_string(rhs_offset) + "); // note, RHS field before LHS field"); Emit("if ( ! v )"); BeginBlock(); Emit("ZAM_run_time_error(z.loc, \"field value missing\");"); Emit("break;"); EndBlock(); auto slot = "z.v" + to_string(lhs_offset); Emit("auto r = frame[z.v1].AsRecord();"); Emit("auto& f = r->RawField(" + slot + "); // note, LHS field after RHS field"); if ( is_managed ) { Emit("zeek::Ref((*v)" + acc + ");"); Emit("zeek::Unref(f.ManagedVal());"); } Emit("f = *v;"); } else { if ( is_managed ) Emit("zeek::Ref(" + rhs + acc + ");"); if ( lhs_field ) { auto lhs_offset = constant_op ? 2 : 3; auto slot = "z.v" + to_string(lhs_offset); Emit("auto r = frame[z.v1].AsRecord();"); Emit("auto& f = r->RawField(" + slot + ");"); if ( is_managed ) Emit("zeek::Unref(f.ManagedVal());"); Emit("f = " + rhs + ";"); } else { if ( is_managed ) Emit("zeek::Unref(frame[z.v1].ManagedVal());"); Emit("frame[z.v1] = ZVal(" + rhs + acc + ");"); } } if ( lhs_field ) Emit("r->Modified();"); } void ZAM_OpTemplate::GenAssignOpValCore(const string& eval, const string& accessor, bool is_managed) { auto v = GetAssignVal(); Emit(eval); // Maps Zeek types to how to get the underlying value from a ValPtr. static unordered_map val_accessors = { {"Addr", "->AsAddrVal()"}, {"Any", ".get()"}, {"Count", "->AsCount()"}, {"Double", "->AsDouble()"}, {"Int", "->AsInt()"}, {"Pattern", "->AsPatternVal()"}, {"String", "->AsStringVal()"}, {"SubNet", "->AsSubNetVal()"}, {"Table", "->AsTableVal()"}, {"Vector", "->AsVectorVal()"}, {"File", "->AsFile()"}, {"Func", "->AsFunc()"}, {"List", "->AsListVal()"}, {"Opaque", "->AsOpaqueVal()"}, {"Record", "->AsRecordVal()"}, {"Type", "->AsTypeVal()"}, }; auto val_accessor = val_accessors[accessor]; string rhs; if ( IsInternalOp() ) rhs = v + val_accessor; else rhs = v + ".As" + accessor + "()"; if ( is_managed ) { Emit("auto rhs = " + rhs + ";"); Emit("zeek::Ref(rhs);"); Emit("Unref(frame[z.v1].ManagedVal());"); Emit("frame[z.v1] = ZVal(rhs);"); } else Emit("frame[z.v1] = ZVal(" + rhs + ");"); } string ZAM_OpTemplate::MethodName(const vector& ot) const { return base_name + OpSuffix(ot); } string ZAM_OpTemplate::MethodDeclare(const vector& ot, ZAM_InstClass zc) { ArgsManager args(ot, zc); return args.Decls(); } string ZAM_OpTemplate::OpSuffix(const vector& ot) const { string os; for ( auto& o : ot ) os += ot_to_char[o]; return os; } string ZAM_OpTemplate::SkipWS(const string& s) const { auto sp = s.c_str(); while ( *sp && isspace(*sp) ) ++sp; return sp; } void ZAM_OpTemplate::Emit(const string& s) { g->Emit(curr_et, s); } void ZAM_OpTemplate::EmitNoNL(const string& s) { g->SetNoNL(true); Emit(s); g->SetNoNL(false); } void ZAM_OpTemplate::IndentUp() { g->IndentUp(); } void ZAM_OpTemplate::IndentDown() { g->IndentDown(); } void ZAM_UnaryOpTemplate::Instantiate() { UnaryInstantiate(); } void ZAM_DirectUnaryOpTemplate::Instantiate() { EmitTo(DirectDef); Emit("case EXPR_" + cname + ":\treturn " + direct + "(lhs, rhs);"); } // Maps op-type mnemonics to the corresponding internal value used by Gen-ZAM. static unordered_map expr_type_names = { {'*', ZAM_EXPR_TYPE_DEFAULT}, {'A', ZAM_EXPR_TYPE_ADDR}, {'a', ZAM_EXPR_TYPE_ANY}, {'D', ZAM_EXPR_TYPE_DOUBLE}, {'f', ZAM_EXPR_TYPE_FILE}, {'F', ZAM_EXPR_TYPE_FUNC}, {'I', ZAM_EXPR_TYPE_INT}, {'L', ZAM_EXPR_TYPE_LIST}, {'X', ZAM_EXPR_TYPE_NONE}, {'O', ZAM_EXPR_TYPE_OPAQUE}, {'P', ZAM_EXPR_TYPE_PATTERN}, {'R', ZAM_EXPR_TYPE_RECORD}, {'S', ZAM_EXPR_TYPE_STRING}, {'N', ZAM_EXPR_TYPE_SUBNET}, {'T', ZAM_EXPR_TYPE_TABLE}, {'t', ZAM_EXPR_TYPE_TYPE}, {'U', ZAM_EXPR_TYPE_UINT}, {'V', ZAM_EXPR_TYPE_VECTOR}, }; // Inverse of the above. static unordered_map expr_name_types; ZAM_ExprOpTemplate::ZAM_ExprOpTemplate(ZAMGen* _g, string _base_name) : ZAM_OpTemplate(_g, std::move(_base_name)) { static bool did_map_init = false; if ( ! did_map_init ) { // Create the inverse mapping. for ( auto& tn : expr_type_names ) expr_name_types[tn.second] = tn.first; did_map_init = true; } } void ZAM_ExprOpTemplate::Parse(const string& attr, const string& line, const Words& words) { if ( attr == "op-type" ) { if ( words.size() == 1 ) g->Gripe("op-type needs arguments", line); for ( auto i = 1U; i < words.size(); ++i ) { auto& w_i = words[i]; if ( w_i.size() != 1 ) g->Gripe("bad op-type argument", w_i); auto et_c = w_i.c_str()[0]; if ( expr_type_names.count(et_c) == 0 ) g->Gripe("bad op-type argument", w_i); AddExprType(expr_type_names[et_c]); } } else if ( attr == "includes-field-op" ) { if ( words.size() != 1 ) g->Gripe("includes-field-op does not take any arguments", line); SetIncludesFieldOp(); } else if ( attr == "eval-type" ) { if ( words.size() < 3 ) g->Gripe("eval-type needs type and evaluation", line); auto& type = words[1]; if ( type.size() != 1 ) g->Gripe("bad eval-type type", type); auto type_c = type.c_str()[0]; if ( expr_type_names.count(type_c) == 0 ) g->Gripe("bad eval-type type", type); auto et = expr_type_names[type_c]; if ( expr_types.count(et) == 0 ) g->Gripe("eval-type type not present in eval-type", type); auto eval = g->SkipWords(line, 2); eval += GatherEval(); AddEvalSet(et, eval); } else if ( attr == "eval-mixed" ) { if ( words.size() < 4 ) g->Gripe("eval-mixed needs types and evaluation", line); auto& type1 = words[1]; auto& type2 = words[2]; if ( type1.size() != 1 || type2.size() != 1 ) g->Gripe("bad eval-mixed types", line); auto type_c1 = type1.c_str()[0]; auto type_c2 = type2.c_str()[0]; if ( expr_type_names.count(type_c1) == 0 || expr_type_names.count(type_c2) == 0 ) g->Gripe("bad eval-mixed types", line); auto et1 = expr_type_names[type_c1]; auto et2 = expr_type_names[type_c2]; if ( eval_set.count(et1) > 0 ) g->Gripe("eval-mixed uses type also included in op-type", line); auto eval = g->SkipWords(line, 3); eval += GatherEval(); AddEvalSet(et1, et2, eval); } else if ( attr == "eval-pre" ) { if ( words.size() < 2 ) g->Gripe("eval-pre needs evaluation", line); auto eval = g->SkipWords(line, 1); eval += GatherEval(); SetPreEval(eval); } else // Not an attribute specific to expr-op's. ZAM_OpTemplate::Parse(attr, line, words); } void ZAM_ExprOpTemplate::Instantiate() { InstantiateOp(OperandTypes(), IncludesVectorOp()); if ( op_types.size() > 1 && op_types[1] == ZAM_OT_CONSTANT ) InstantiateC1(op_types, op_types.size() - 1); if ( op_types.size() > 2 && op_types[2] == ZAM_OT_CONSTANT ) InstantiateC2(op_types, op_types.size() - 1); if ( op_types.size() > 3 && op_types[3] == ZAM_OT_CONSTANT ) InstantiateC3(op_types); bool all_var = true; for ( auto i = 1U; i < op_types.size(); ++i ) if ( op_types[i] != ZAM_OT_VAR ) all_var = false; if ( all_var ) InstantiateV(op_types); if ( op_types.size() == 3 && op_types[1] == ZAM_OT_RECORD_FIELD && op_types[2] == ZAM_OT_INT ) InstantiateV(op_types); } void ZAM_ExprOpTemplate::InstantiateC1(const vector& ots, size_t arity, bool do_vec) { string args = "lhs, r1->AsConstExpr()"; if ( arity == 1 && ots[0] == ZAM_OT_RECORD_FIELD ) args += ", rhs->AsFieldExpr()->Field()"; else if ( arity > 1 ) { args += ", "; if ( ots[2] == ZAM_OT_RECORD_FIELD ) args += "rhs->AsFieldExpr()->Field()"; else args += "r2->AsNameExpr()"; } auto m = MethodName(ots); EmitTo(C1Def); EmitNoNL("case EXPR_" + cname + ":"); if ( do_vec ) DoVectorCase(m, args); else EmitUp("return " + m + "(" + args + ");"); if ( IncludesFieldOp() ) { EmitTo(C1FieldDef); Emit("case EXPR_" + cname + ":\treturn " + m + "_field(" + args + ", field);"); } } void ZAM_ExprOpTemplate::InstantiateC2(const vector& ots, size_t arity) { string args = "lhs, r1->AsNameExpr(), r2->AsConstExpr()"; if ( arity == 3 ) args += ", r3->AsNameExpr()"; auto method = MethodName(ots); auto m = method.c_str(); EmitTo(C2Def); Emit("case EXPR_" + cname + ":\treturn " + m + "(" + args + ");"); if ( IncludesFieldOp() ) { EmitTo(C2FieldDef); Emit("case EXPR_" + cname + ":\treturn " + m + "_field(" + args + ", field);"); } } void ZAM_ExprOpTemplate::InstantiateC3(const vector& ots) { EmitTo(C3Def); Emit("case EXPR_" + cname + ":\treturn " + MethodName(ots) + "(lhs, r1->AsNameExpr(), r2->AsNameExpr(), r3->AsConstExpr());"); } void ZAM_ExprOpTemplate::InstantiateV(const vector& ots) { auto m = MethodName(ots); string args = "lhs, r1->AsNameExpr()"; if ( ots.size() >= 3 ) { if ( ots[2] == ZAM_OT_INT ) { string acc_flav = IncludesFieldOp() ? "Has" : ""; args += ", rhs->As" + acc_flav + "FieldExpr()->Field()"; } else args += ", r2->AsNameExpr()"; if ( ots.size() == 4 ) args += ", r3->AsNameExpr()"; } EmitTo(VDef); EmitNoNL("case EXPR_" + cname + ":"); if ( IncludesVectorOp() ) DoVectorCase(m, args); else EmitUp("return " + m + "(" + args + ");"); if ( IncludesFieldOp() ) { EmitTo(VFieldDef); Emit("case EXPR_" + cname + ":\treturn " + m + "_field(" + args + ", field);"); } } void ZAM_ExprOpTemplate::DoVectorCase(const string& m, const string& args) { NL(); IndentUp(); Emit("if ( rt->Tag() == TYPE_VECTOR )"); EmitUp("return " + m + "_vec(" + args + ");"); Emit("else"); EmitUp("return " + m + "(" + args + ");"); IndentDown(); } void ZAM_ExprOpTemplate::BuildInstructionCore(const string& params, const string& suffix, ZAM_InstClass zc) { Emit("auto tag = t->Tag();"); Emit("auto i_t = t->InternalType();"); int ncases = 0; for ( auto& [et1, et2_map] : eval_mixed_set ) for ( auto& [et2, eval] : et2_map ) GenMethodTest(et1, et2, params, suffix, ++ncases > 1, zc); bool do_default = false; for ( auto et : ExprTypes() ) { if ( et == ZAM_EXPR_TYPE_DEFAULT ) do_default = true; else GenMethodTest(et, et, params, suffix, ++ncases > 1, zc); } Emit("else"); if ( do_default ) { auto op = g->GenOpCode(this, suffix, zc); EmitUp("z = GenInst(" + op + ", " + params + ");"); } else EmitUp("reporter->InternalError(\"bad tag when generating method core\");"); } void ZAM_ExprOpTemplate::GenMethodTest(ZAM_ExprType et1, ZAM_ExprType et2, const string& params, const string& suffix, bool do_else, ZAM_InstClass zc) { // Maps ZAM_ExprType's to the information needed (variable name, // constant to compare it against) to identify using an "if" test // that a given AST Expr node employs the given type of operand. static map> if_tests = { {ZAM_EXPR_TYPE_ADDR, {"i_t", "TYPE_INTERNAL_ADDR"}}, {ZAM_EXPR_TYPE_ANY, {"tag", "TYPE_ANY"}}, {ZAM_EXPR_TYPE_DOUBLE, {"i_t", "TYPE_INTERNAL_DOUBLE"}}, {ZAM_EXPR_TYPE_FILE, {"tag", "TYPE_FILE"}}, {ZAM_EXPR_TYPE_FUNC, {"tag", "TYPE_FUNC"}}, {ZAM_EXPR_TYPE_INT, {"i_t", "TYPE_INTERNAL_INT"}}, {ZAM_EXPR_TYPE_LIST, {"tag", "TYPE_LIST"}}, {ZAM_EXPR_TYPE_OPAQUE, {"tag", "TYPE_OPAQUE"}}, {ZAM_EXPR_TYPE_PATTERN, {"tag", "TYPE_PATTERN"}}, {ZAM_EXPR_TYPE_RECORD, {"tag", "TYPE_RECORD"}}, {ZAM_EXPR_TYPE_STRING, {"i_t", "TYPE_INTERNAL_STRING"}}, {ZAM_EXPR_TYPE_SUBNET, {"i_t", "TYPE_INTERNAL_SUBNET"}}, {ZAM_EXPR_TYPE_TABLE, {"tag", "TYPE_TABLE"}}, {ZAM_EXPR_TYPE_TYPE, {"tag", "TYPE_TYPE"}}, {ZAM_EXPR_TYPE_UINT, {"i_t", "TYPE_INTERNAL_UNSIGNED"}}, {ZAM_EXPR_TYPE_VECTOR, {"tag", "TYPE_VECTOR"}}, }; if ( if_tests.count(et1) == 0 ) g->Gripe("bad op-type", op_loc); auto if_test = if_tests[et1]; auto if_var = if_test.first; auto if_val = if_test.second; string test = "if ( " + if_var + " == " + if_val + " )"; if ( do_else ) test = "else " + test; Emit(test); auto op_suffix = suffix + "_" + expr_name_types[et1]; if ( et2 != et1 ) op_suffix += expr_name_types[et2]; auto op = g->GenOpCode(this, op_suffix, zc); EmitUp("z = GenInst(" + op + ", " + params + ");"); } EvalInstance::EvalInstance(ZAM_ExprType _lhs_et, ZAM_ExprType _op1_et, ZAM_ExprType _op2_et, string _eval, bool _is_def) { lhs_et = _lhs_et; op1_et = _op1_et; op2_et = _op2_et; eval = move(_eval); is_def = _is_def; } string EvalInstance::LHSAccessor(bool is_ptr) const { if ( lhs_et == ZAM_EXPR_TYPE_NONE || lhs_et == ZAM_EXPR_TYPE_DEFAULT ) return ""; string deref = is_ptr ? "->" : "."; string acc = find_type_accessor(lhs_et); return deref + acc; } string EvalInstance::Accessor(ZAM_ExprType et, bool is_ptr) const { if ( et == ZAM_EXPR_TYPE_NONE || et == ZAM_EXPR_TYPE_DEFAULT ) return ""; string deref = is_ptr ? "->" : "."; return deref + "As" + find_type_info(et).accessor + "()"; } string EvalInstance::OpMarker() const { if ( op1_et == ZAM_EXPR_TYPE_DEFAULT || op1_et == ZAM_EXPR_TYPE_NONE ) return ""; if ( op1_et == op2_et ) return "_" + find_type_info(op1_et).suffix; return "_" + find_type_info(op1_et).suffix + find_type_info(op2_et).suffix; } void ZAM_ExprOpTemplate::InstantiateEval(const vector& ot_orig, const string& suffix, ZAM_InstClass zc) { if ( expr_types.empty() ) { // No operand types to expand over. ZAM_OpTemplate::InstantiateEval(ot_orig, suffix, zc); return; } auto ot = ot_orig; if ( zc == ZIC_FIELD ) // Make room for the offset. ot.emplace_back(ZAM_OT_INT); auto ot_str = OpSuffix(ot); // Some of these might not wind up being used, but no harm in // initializing them in case they are. string lhs, op1, op2; string branch_target = "z.v"; EmitTarget emit_target = Eval; if ( zc == ZIC_VEC ) { lhs = "vec1[i]"; op1 = "vec2[i]"; op2 = "vec3[i]"; emit_target = Arity() == 1 ? Vec1Eval : Vec2Eval; } else { lhs = "frame[z.v1]"; auto op1_offset = zc == ZIC_COND ? 1 : 2; auto op2_offset = op1_offset + 1; bool ot1_const = ot[1] == ZAM_OT_CONSTANT; bool ot2_const = Arity() >= 2 && ot[2] == ZAM_OT_CONSTANT; if ( ot1_const ) { op1 = "z.c"; --op2_offset; branch_target += "2"; } else { op1 = "frame[z.v" + to_string(op1_offset) + "]"; if ( Arity() > 1 && ot[2] == ZAM_OT_VAR ) branch_target += "3"; else branch_target += "2"; } if ( ot2_const ) op2 = "z.c"; else op2 = "frame[z.v" + to_string(op2_offset) + "]"; if ( zc == ZIC_FIELD ) { // Compute the slot holding the field offset. auto f = // The first slots are taken up by the // assignment slot and the operands ... Arity() + 1 + // ... and slots are numbered starting at 1. +1; if ( ot1_const || ot2_const ) // One of the operand slots won't be needed // due to the presence of a constant. // (It's never the case that both operands // are constants - those instead get folded.) --f; lhs += ".AsRecord()->RawField(z.v" + to_string(f) + ")"; } } vector eval_instances; for ( auto et : expr_types ) { auto is_def = eval_set.count(et) == 0; string eval = is_def ? GetEval() : eval_set[et]; auto lhs_et = IsConditionalOp() ? ZAM_EXPR_TYPE_INT : et; eval_instances.emplace_back(lhs_et, et, et, eval, is_def); } if ( zc != ZIC_VEC ) for ( const auto& em1 : eval_mixed_set ) { auto et1 = em1.first; for ( const auto& em2 : em1.second ) { auto et2 = em2.first; // For the LHS, either its expression type is // ignored, or if it's a conditional, so just // note it for the latter. auto lhs_et = ZAM_EXPR_TYPE_INT; eval_instances.emplace_back(lhs_et, et1, et2, em2.second, false); } } for ( auto& ei : eval_instances ) { auto lhs_accessor = ei.LHSAccessor(); if ( HasExplicitResultType() ) lhs_accessor = ""; string lhs_ei = lhs; if ( zc != ZIC_VEC ) lhs_ei += lhs_accessor; auto op1_ei = op1 + ei.Op1Accessor(zc == ZIC_VEC); auto op2_ei = op2 + ei.Op2Accessor(zc == ZIC_VEC); auto eval = SkipWS(ei.Eval()); auto has_target = eval.find("$$") != string::npos; if ( zc == ZIC_VEC ) { const char* rhs; if ( has_target ) rhs = "\\$\\$ = ([^;\n]*)"; else rhs = "^[^;\n]*"; auto replacement = VecEvalRE(has_target); eval = regex_replace(eval, regex(rhs), replacement, std::regex_constants::match_not_null); } auto is_none = ei.LHS_ET() == ZAM_EXPR_TYPE_NONE; auto is_default = ei.LHS_ET() == ZAM_EXPR_TYPE_DEFAULT; if ( ! is_none && ! is_default && find_type_info(ei.LHS_ET()).is_managed && ! HasExplicitResultType() ) { auto pre = "auto hold_lhs = " + lhs; if ( zc == ZIC_VEC ) // For vectors, we have to check for whether // the previous value is present, or a hole. pre += string(" ? ") + lhs + "->"; else pre += "."; pre += "ManagedVal()"; if ( zc == ZIC_VEC ) pre += " : nullptr"; pre += ";\n\t"; auto post = "\tUnref(hold_lhs);"; eval = pre + eval + post; } eval = regex_replace(eval, regex("\\$1"), op1_ei); eval = regex_replace(eval, regex("\\$2"), op2_ei); string pre = GetPreEval(); pre = regex_replace(pre, regex("\\$1"), op1_ei); pre = regex_replace(pre, regex("\\$2"), op2_ei); if ( has_target ) eval = regex_replace(eval, regex("\\$\\$"), lhs_ei); else if ( zc == ZIC_COND ) { // Aesthetics: get rid of trailing newlines. eval = regex_replace(eval, regex("\n"), ""); eval = "if ( ! (" + eval + ") ) " + "{ pc = " + branch_target + "; continue; }"; } else if ( ! is_none && (ei.IsDefault() || IsConditionalOp()) ) { eval = lhs_ei + " = " + eval; // Ensure a single terminating semicolon. eval = regex_replace(eval, regex(";*\n"), ";\n"); } eval = pre + eval; auto full_suffix = ot_str + suffix + ei.OpMarker(); ZAM_OpTemplate::InstantiateEval(emit_target, full_suffix, eval, zc); if ( zc == ZIC_VEC ) { string dispatch_params = "frame[z.v1].AsVectorRef(), frame[z.v2].AsVector()"; if ( Arity() == 2 ) dispatch_params += ", frame[z.v3].AsVector()"; auto op_code = g->GenOpCode(this, "_" + full_suffix); auto dispatch = "vec_exec(" + op_code + ", z.t, " + dispatch_params + ", z);"; ZAM_OpTemplate::InstantiateEval(Eval, full_suffix, dispatch, zc); } } } void ZAM_UnaryExprOpTemplate::Parse(const string& attr, const string& line, const Words& words) { if ( attr == "no-const" ) { if ( words.size() != 1 ) g->Gripe("extraneous argument to no-const", line); SetNoConst(); } else if ( attr == "explicit-result-type" ) { if ( words.size() != 1 ) g->Gripe("extraneous argument to explicit-result-type", line); SetHasExplicitResultType(); } else ZAM_ExprOpTemplate::Parse(attr, line, words); } void ZAM_UnaryExprOpTemplate::Instantiate() { UnaryInstantiate(); vector ots = {ZAM_OT_VAR, ZAM_OT_CONSTANT}; if ( ! NoConst() ) InstantiateC1(ots, 1, IncludesVectorOp()); ots[1] = ZAM_OT_VAR; InstantiateV(ots); } void ZAM_UnaryExprOpTemplate::BuildInstruction(const vector& ot, const string& params, const string& suffix, ZAM_InstClass zc) { const auto& ets = ExprTypes(); if ( ets.size() == 1 && ets.count(ZAM_EXPR_TYPE_NONE) == 1 ) { ZAM_ExprOpTemplate::BuildInstruction(ot, params, suffix, zc); return; } auto constant_op = ot[1] == ZAM_OT_CONSTANT; string type_src = constant_op ? "c" : "n2"; if ( ot[0] == ZAM_OT_ASSIGN_FIELD ) { type_src = constant_op ? "n" : "n1"; Emit("auto " + type_src + " = flhs->GetOp1()->AsNameExpr();"); Emit("auto t = flhs->GetType();"); Emit("int field = flhs->Field();"); } else { if ( IsAssignOp() ) type_src = constant_op ? "n" : "n1"; auto type_suffix = zc == ZIC_VEC ? "->Yield();" : ";"; Emit("auto t = " + type_src + "->GetType()" + type_suffix); } BuildInstructionCore(params, suffix, zc); if ( IsAssignOp() && IsFieldOp() ) // These can't take the type from the LHS variable, since // that's the enclosing record and not the field within it. Emit("z.t = t;"); else if ( zc == ZIC_VEC ) { if ( constant_op ) Emit("z.t = n->GetType();"); else Emit("z.t = n1->GetType();"); } } ZAM_AssignOpTemplate::ZAM_AssignOpTemplate(ZAMGen* _g, string _base_name) : ZAM_UnaryExprOpTemplate(_g, std::move(_base_name)) { // Assignments apply to every valid form of ExprType. for ( auto& etn : expr_type_names ) { auto et = etn.second; if ( et != ZAM_EXPR_TYPE_NONE && et != ZAM_EXPR_TYPE_DEFAULT ) AddExprType(et); } } void ZAM_AssignOpTemplate::Parse(const string& attr, const string& line, const Words& words) { if ( attr == "field-op" ) { if ( words.size() != 1 ) g->Gripe("field-op does not take any arguments", line); SetFieldOp(); } else ZAM_OpTemplate::Parse(attr, line, words); } void ZAM_AssignOpTemplate::Instantiate() { if ( op_types.size() != 1 ) g->Gripe("operation needs precisely one \"type\"", op_loc); vector ots; ots.push_back(op_types[0]); // Build constant/variable versions ... ots.push_back(ZAM_OT_CONSTANT); if ( ots[0] == ZAM_OT_RECORD_FIELD ) ots.push_back(ZAM_OT_INT); InstantiateOp(ots, false); if ( IsFieldOp() ) InstantiateC1(ots, 1); ots[1] = ZAM_OT_VAR; InstantiateOp(ots, false); // ... and for assignments to fields, additional field versions. if ( ots[0] == ZAM_OT_ASSIGN_FIELD ) { ots.push_back(ZAM_OT_INT); InstantiateOp(ots, false); ots[1] = ZAM_OT_CONSTANT; InstantiateOp(ots, false); } else if ( IsFieldOp() ) InstantiateV(ots); } void ZAM_BinaryExprOpTemplate::Instantiate() { // As usual, the first slot receives the operator's result. vector ots = {ZAM_OT_VAR}; ots.resize(3); // Build each combination for constant/variable operand, // except skip constant/constant as that is always folded. // We only include vector operations when both operands // are non-constants. ots[1] = ZAM_OT_CONSTANT; ots[2] = ZAM_OT_VAR; InstantiateOp(ots, false); if ( ! IsInternalOp() ) InstantiateC1(ots, 2, false); ots[1] = ZAM_OT_VAR; ots[2] = ZAM_OT_CONSTANT; InstantiateOp(ots, false); if ( ! IsInternalOp() ) InstantiateC2(ots, 2); ots[2] = ZAM_OT_VAR; InstantiateOp(ots, IncludesVectorOp()); if ( ! IsInternalOp() ) InstantiateV(ots); } void ZAM_BinaryExprOpTemplate::BuildInstruction(const vector& ot, const string& params, const string& suffix, ZAM_InstClass zc) { auto constant_op = ot[1] == ZAM_OT_CONSTANT; string type_src = constant_op ? "c" : "n2"; auto type_suffix = zc == ZIC_VEC ? "->Yield();" : ";"; Emit("auto t = " + type_src + "->GetType()" + type_suffix); BuildInstructionCore(params, suffix, zc); if ( zc == ZIC_VEC ) Emit("z.t = n1->GetType();"); } void ZAM_RelationalExprOpTemplate::Instantiate() { ZAM_BinaryExprOpTemplate::Instantiate(); EmitTo(Cond); Emit("case EXPR_" + cname + ":"); IndentUp(); Emit("if ( n1 && n2 )"); EmitUp("return " + cname + "VVV_cond(n1, n2);"); Emit("else if ( n1 )"); EmitUp("return " + cname + "VVC_cond(n1, c);"); Emit("else"); EmitUp("return " + cname + "VCV_cond(c, n2);"); IndentDown(); NL(); } void ZAM_RelationalExprOpTemplate::BuildInstruction(const vector& ot, const string& params, const string& suffix, ZAM_InstClass zc) { string op1; if ( zc == ZIC_COND ) { if ( ot[1] == ZAM_OT_CONSTANT ) op1 = "c"; else if ( ot[2] == ZAM_OT_CONSTANT ) op1 = "n"; else op1 = "n1"; } else op1 = "n2"; auto type_suffix = zc == ZIC_VEC ? "->Yield();" : ";"; Emit("auto t = " + op1 + "->GetType()" + type_suffix); BuildInstructionCore(params, suffix, zc); if ( zc == ZIC_VEC ) Emit("z.t = n1->GetType();"); } void ZAM_InternalBinaryOpTemplate::Parse(const string& attr, const string& line, const Words& words) { if ( attr == "op-accessor" ) { if ( words.size() != 2 ) g->Gripe("op-accessor takes one argument", line); SetOpAccessor(words[1]); } else if ( attr == "op1-accessor" ) { if ( words.size() != 2 ) g->Gripe("op-accessor1 takes one argument", line); SetOp1Accessor(words[1]); } else if ( attr == "op2-accessor" ) { if ( words.size() != 2 ) g->Gripe("op-accessor2 takes one argument", line); SetOp2Accessor(words[1]); } else ZAM_BinaryExprOpTemplate::Parse(attr, line, words); } void ZAM_InternalBinaryOpTemplate::InstantiateEval(const vector& ot, const string& suffix, ZAM_InstClass zc) { assert(ot.size() == 3); auto op1_const = ot[1] == ZAM_OT_CONSTANT; auto op2_const = ot[2] == ZAM_OT_CONSTANT; string op1 = op1_const ? "z.c" : "frame[z.v2]"; string op2 = op2_const ? "z.c" : (op1_const ? "frame[z.v2]" : "frame[z.v3]"); string prelude = "auto op1 = " + op1 + "." + op1_accessor + ";\n"; prelude += "auto op2 = " + op2 + "." + op2_accessor + ";\n"; auto eval = prelude + GetEval(); auto& ets = ExprTypes(); if ( ! ets.empty() ) { if ( ets.size() != 1 ) g->Gripe("internal-binary-op's can have at most one op-type", op_loc); for ( auto& et : ets ) { auto acc = find_type_accessor(et); auto lhs = "frame[z.v1]." + acc; eval = regex_replace(eval, regex("\\$\\$"), lhs); } } ZAM_OpTemplate::InstantiateEval(Eval, OpSuffix(ot) + suffix, eval, zc); } void ZAM_InternalOpTemplate::Parse(const string& attr, const string& line, const Words& words) { if ( attr != "num-call-args" ) { if ( attr == "indirect-call" ) { if ( words.size() != 1 ) g->Gripe("indirect-call takes one argument", line); // Note, currently only works with a *subsequent* // num-call-args, whose setting needs to be 'n'. is_indirect_call = true; } else ZAM_OpTemplate::Parse(attr, line, words); return; } if ( words.size() != 2 ) g->Gripe("num-call-args takes one argument", line); eval = "std::vector args;\n"; auto& arg = words[1]; int n = arg == "n" ? -1 : stoi(arg); auto arg_offset = HasAssignVal() ? 1 : 0; auto arg_slot = arg_offset + 1; string func = "z.func"; if ( n == 1 ) { eval += "args.push_back("; if ( op_types[arg_offset] == ZAM_OT_CONSTANT ) eval += "z.c"; else eval += "frame[z.v" + to_string(arg_slot) + "]"; eval += ".ToVal(z.t));\n"; } else if ( n != 0 ) { eval += "auto aux = z.aux;\n"; if ( n < 0 ) { if ( is_indirect_call ) { func = "func"; eval += "auto sel = z.v" + to_string(arg_slot) + ";\n"; eval += "auto func = (sel < 0) ? "; eval += "aux->id_val->GetVal()->AsFunc() : "; eval += "frame[sel].AsFunc();\n"; } eval += "auto n = aux->n;\n"; eval += "for ( auto i = 0; i < n; ++i )\n"; eval += "\targs.push_back(aux->ToVal(frame, i));\n"; } else for ( auto i = 0; i < n; ++i ) { eval += "args.push_back(aux->ToVal(frame, "; eval += to_string(i); eval += "));\n"; } } eval += "f->SetCallLoc(z.loc);\n"; if ( HasAssignVal() ) { auto av = GetAssignVal(); eval += "auto " + av + " = " + func + "->Invoke(&args, f);\n"; eval += "if ( ! " + av + " ) { ZAM_error = true; break; }\n"; } else eval += "(void) " + func + "->Invoke(&args, f);\n"; } bool TemplateInput::ScanLine(string& line) { if ( ! put_back.empty() ) { line = put_back; put_back.clear(); return true; } char buf[8192]; // Read lines, discarding comments, which have to start at the // beginning of a line. do { if ( ! fgets(buf, sizeof buf, f) ) return false; ++loc.line_num; } while ( buf[0] == '#' ); line = buf; return true; } vector TemplateInput::SplitIntoWords(const string& line) const { vector words; for ( auto start = line.c_str(); *start && *start != '\n'; ) { auto end = start + 1; while ( *end && ! isspace(*end) ) ++end; words.emplace_back(string(start, end - start)); start = end; while ( *start && isspace(*start) ) ++start; } return words; } string TemplateInput::SkipWords(const string& line, int n) const { auto s = line.c_str(); for ( int i = 0; i < n; ++i ) { // Find end of current word. while ( *s && *s != '\n' ) { if ( isspace(*s) ) break; ++s; } if ( *s == '\n' ) break; // Find start of next word. while ( *s && isspace(*s) ) ++s; } return string(s); } void TemplateInput::Gripe(const char* msg, const string& input) const { auto input_s = input.c_str(); size_t n = strlen(input_s); fprintf(stderr, "%s, line %d: %s - %s", loc.file_name, loc.line_num, msg, input_s); if ( n == 0 || input_s[n - 1] != '\n' ) fprintf(stderr, "\n"); exit(1); } void TemplateInput::Gripe(const char* msg, const InputLoc& l) const { fprintf(stderr, "%s, line %d: %s\n", l.file_name, l.line_num, msg); exit(1); } ZAMGen::ZAMGen(int argc, char** argv) { auto prog_name = argv[0]; if ( argc != 2 ) { fprintf(stderr, "usage: %s \n", prog_name); exit(1); } auto file_name = argv[1]; auto f = strcmp(file_name, "-") ? fopen(file_name, "r") : stdin; if ( ! f ) { fprintf(stderr, "%s: cannot open \"%s\"\n", prog_name, file_name); exit(1); } ti = make_unique(f, prog_name, file_name); InitEmitTargets(); while ( ParseTemplate() ) ; for ( auto& t : templates ) t->Instantiate(); GenMacros(); CloseEmitTargets(); } void ZAMGen::ReadMacro(const string& line) { vector mac; mac.emplace_back(SkipWords(line, 1)); string s; while ( ScanLine(s) ) { if ( s.size() <= 1 || ! isspace(s.c_str()[0]) ) { PutBack(s); break; } mac.push_back(s); } macros.emplace_back(move(mac)); } void ZAMGen::GenMacros() { for ( auto& m : macros ) { for ( auto i = 0U; i < m.size(); ++i ) { auto ms = m[i]; if ( i == 0 ) ms = "#define " + ms; if ( i < m.size() - 1 ) ms = regex_replace(ms, regex("\n"), " \\\n"); Emit(EvalMacros, ms); } Emit(EvalMacros, "\n"); } } string ZAMGen::GenOpCode(const ZAM_OpTemplate* ot, const string& suffix, ZAM_InstClass zc) { auto op = "OP_" + ot->CanonicalName() + suffix; static unordered_set known_opcodes; if ( known_opcodes.count(op) > 0 ) // We've already done this one, don't re-define its auxiliary // information. return op; known_opcodes.insert(op); IndentUp(); // Generate the enum defining the opcode ... Emit(OpDef, op + ","); // ... the "flavor" of how it treats its first operand ... auto op_comment = ",\t// " + op; auto op1_always_read = (zc == ZIC_FIELD || zc == ZIC_COND); auto flavor = op1_always_read ? "OP1_READ" : ot->GetOp1Flavor(); Emit(Op1Flavor, flavor + op_comment); // ... whether it has side effects ... auto se = ot->HasSideEffects() ? "true" : "false"; Emit(OpSideEffects, se + op_comment); // ... and the switch case that maps the enum to a string // representation. auto name = ot->BaseName(); transform(name.begin(), name.end(), name.begin(), ::tolower); name += suffix; transform(name.begin(), name.end(), name.begin(), under_to_dash); Emit(OpName, "case " + op + ":\treturn \"" + name + "\";"); IndentDown(); return op; } void ZAMGen::Emit(EmitTarget et, const string& s) { assert(et != None); if ( gen_files.count(et) == 0 ) { fprintf(stderr, "bad generation file type\n"); exit(1); } FILE* f = gen_files[et]; for ( auto i = indent_level; i > 0; --i ) fputs("\t", f); fputs(s.c_str(), f); if ( ! no_NL && (s.empty() || s.back() != '\n') ) fputs("\n", f); } void ZAMGen::InitEmitTargets() { // Maps an EmitTarget enum to its corresponding filename. static const unordered_map gen_file_names = { {None, nullptr}, {AssignFlavor, "ZAM-AssignFlavorsDefs.h"}, {C1Def, "ZAM-GenExprsDefsC1.h"}, {C1FieldDef, "ZAM-GenFieldsDefsC1.h"}, {C2Def, "ZAM-GenExprsDefsC2.h"}, {C2FieldDef, "ZAM-GenFieldsDefsC2.h"}, {C3Def, "ZAM-GenExprsDefsC3.h"}, {Cond, "ZAM-Conds.h"}, {DirectDef, "ZAM-DirectDefs.h"}, {Eval, "ZAM-EvalDefs.h"}, {EvalMacros, "ZAM-EvalMacros.h"}, {MethodDecl, "ZAM-MethodDecls.h"}, {MethodDef, "ZAM-MethodDefs.h"}, {Op1Flavor, "ZAM-Op1FlavorsDefs.h"}, {OpDef, "ZAM-OpsDefs.h"}, {OpName, "ZAM-OpsNamesDefs.h"}, {OpSideEffects, "ZAM-OpSideEffects.h"}, {VDef, "ZAM-GenExprsDefsV.h"}, {VFieldDef, "ZAM-GenFieldsDefsV.h"}, {Vec1Eval, "ZAM-Vec1EvalDefs.h"}, {Vec2Eval, "ZAM-Vec2EvalDefs.h"}, }; for ( auto& gfn : gen_file_names ) { auto fn = gfn.second; if ( ! fn ) continue; auto f = fopen(fn, "w"); if ( ! f ) { fprintf(stderr, "can't open generation file %s\n", fn); exit(1); } gen_files[gfn.first] = f; } InitSwitch(C1Def, "C1 assignment"); InitSwitch(C2Def, "C2 assignment"); InitSwitch(C3Def, "C3 assignment"); InitSwitch(VDef, "V assignment"); InitSwitch(C1FieldDef, "C1 field assignment"); InitSwitch(C2FieldDef, "C2 field assignment"); InitSwitch(VFieldDef, "V field assignment"); } void ZAMGen::InitSwitch(EmitTarget et, string desc) { Emit(et, "{"); Emit(et, "switch ( rhs->Tag() ) {"); switch_targets[et] = std::move(desc); } void ZAMGen::CloseEmitTargets() { FinishSwitches(); for ( auto& gf : gen_files ) fclose(gf.second); } void ZAMGen::FinishSwitches() { for ( auto& st : switch_targets ) { auto et = st.first; auto& desc = st.second; Emit(et, "default:"); IndentUp(); Emit(et, "reporter->InternalError(\"inconsistency in " + desc + ": %s\", obj_desc(rhs).c_str());"); IndentDown(); Emit(et, "}"); Emit(et, "}"); } } bool ZAMGen::ParseTemplate() { string line; if ( ! ScanLine(line) ) return false; if ( line.size() <= 1 ) // A blank line - no template to parse. return true; auto words = SplitIntoWords(line); if ( words.size() < 2 ) Gripe("too few words at start of template", line); auto op = words[0]; if ( op == "macro" ) { ReadMacro(line); return true; } auto op_name = words[1]; // We track issues with the wrong number of template arguments // up front, to avoid mis-invoking constructors, but we don't // report these until later because if the template names a // bad operation, it's better to report that as the core problem. const char* args_mismatch = nullptr; if ( op == "direct-unary-op" ) { if ( words.size() != 3 ) args_mismatch = "direct-unary-op takes 2 arguments"; } else if ( words.size() != 2 ) args_mismatch = "templates take 1 argument"; unique_ptr t; if ( op == "op" ) t = make_unique(this, op_name); else if ( op == "unary-op" ) t = make_unique(this, op_name); else if ( op == "direct-unary-op" && ! args_mismatch ) t = make_unique(this, op_name, words[2]); else if ( op == "assign-op" ) t = make_unique(this, op_name); else if ( op == "expr-op" ) t = make_unique(this, op_name); else if ( op == "unary-expr-op" ) t = make_unique(this, op_name); else if ( op == "binary-expr-op" ) t = make_unique(this, op_name); else if ( op == "rel-expr-op" ) t = make_unique(this, op_name); else if ( op == "internal-binary-op" ) t = make_unique(this, op_name); else if ( op == "internal-op" ) t = make_unique(this, op_name); else if ( op == "internal-assignment-op" ) t = make_unique(this, op_name); else Gripe("bad template name", op); if ( args_mismatch ) Gripe(args_mismatch, line); t->Build(); templates.emplace_back(move(t)); return true; } int main(int argc, char** argv) { try { ZAMGen zg(argc, argv); exit(0); } catch ( const std::regex_error& e ) { fprintf(stderr, "%s: regular expression error - %s\n", argv[0], e.what()); exit(1); } }