//==-- loop_proto_to_llvm.cpp - Protobuf-C++ conversion //---------------------==// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // Implements functions for converting between protobufs and LLVM IR. // // //===----------------------------------------------------------------------===// #include "loop_proto_to_llvm.h" #include "cxx_loop_proto.pb.h" #include "../handle-llvm/input_arrays.h" // The following is needed to convert protos in human-readable form #include #include #include namespace clang_fuzzer { // Forward decls std::string BinopToString(std::ostream &os, const BinaryOp &x); std::string StateSeqToString(std::ostream &os, const StatementSeq &x); // Counter variable to generate new LLVM IR variable names and wrapper function static std::string get_var() { static int ctr = 0; return "%var" + std::to_string(ctr++); } static bool inner_loop = false; class InnerLoop { public: InnerLoop() { inner_loop = true; } ~InnerLoop() { inner_loop = false; } }; // Proto to LLVM. std::string ConstToString(const Const &x) { return std::to_string(x.val()); } std::string VarRefToString(std::ostream &os, const VarRef &x) { std::string which_loop = inner_loop ? "inner" : "outer"; std::string arr; switch(x.arr()) { case VarRef::ARR_A: arr = "%a"; break; case VarRef::ARR_B: arr = "%b"; break; case VarRef::ARR_C: arr = "%c"; break; } std::string ptr_var = get_var(); os << ptr_var << " = getelementptr inbounds i32, i32* " << arr << ", i64 %" << which_loop << "_ct\n"; return ptr_var; } std::string RvalueToString(std::ostream &os, const Rvalue &x) { if(x.has_cons()) return ConstToString(x.cons()); if(x.has_binop()) return BinopToString(os, x.binop()); if(x.has_varref()) { std::string var_ref = VarRefToString(os, x.varref()); std::string val_var = get_var(); os << val_var << " = load i32, i32* " << var_ref << "\n"; return val_var; } return "1"; } std::string BinopToString(std::ostream &os, const BinaryOp &x) { std::string left = RvalueToString(os, x.left()); std::string right = RvalueToString(os, x.right()); std::string op; switch (x.op()) { case BinaryOp::PLUS: op = "add"; break; case BinaryOp::MINUS: op = "sub"; break; case BinaryOp::MUL: op = "mul"; break; case BinaryOp::XOR: op = "xor"; break; case BinaryOp::AND: op = "and"; break; case BinaryOp::OR: op = "or"; break; // Support for Boolean operators will be added later case BinaryOp::EQ: case BinaryOp::NE: case BinaryOp::LE: case BinaryOp::GE: case BinaryOp::LT: case BinaryOp::GT: op = "add"; break; } std::string val_var = get_var(); os << val_var << " = " << op << " i32 " << left << ", " << right << "\n"; return val_var; } std::ostream &operator<<(std::ostream &os, const AssignmentStatement &x) { std::string rvalue = RvalueToString(os, x.rvalue()); std::string var_ref = VarRefToString(os, x.varref()); return os << "store i32 " << rvalue << ", i32* " << var_ref << "\n"; } std::ostream &operator<<(std::ostream &os, const Statement &x) { return os << x.assignment(); } std::ostream &operator<<(std::ostream &os, const StatementSeq &x) { for (auto &st : x.statements()) { os << st; } return os; } void NestedLoopToString(std::ostream &os, const LoopFunction &x) { os << "target triple = \"x86_64-unknown-linux-gnu\"\n" << "define void @foo(i32* %a, i32* %b, i32* noalias %c, i64 %s) {\n" << "outer_loop_start:\n" << "%cmp = icmp sgt i64 %s, 0\n" << "br i1 %cmp, label %inner_loop_start, label %end\n" << "outer_loop:\n" << x.outer_statements() << "%o_ct_new = add i64 %outer_ct, 1\n" << "%jmp_outer = icmp eq i64 %o_ct_new, %s\n" << "br i1 %jmp_outer, label %end, label %inner_loop_start\n" << "inner_loop_start:\n" << "%outer_ct = phi i64 [%o_ct_new, %outer_loop], [0, %outer_loop_start]\n" << "br label %inner_loop\n" << "inner_loop:\n" << "%inner_ct = phi i64 [0, %inner_loop_start], [%i_ct_new, %inner_loop]\n"; { InnerLoop IL; os << x.inner_statements(); } os << "%i_ct_new = add i64 %inner_ct, 1\n" << "%jmp_inner = icmp eq i64 %i_ct_new, %s\n" << "br i1 %jmp_inner, label %outer_loop, label %inner_loop, !llvm.loop !0\n" << "end:\n" << "ret void\n" << "}\n" << "!0 = distinct !{!0, !1, !2}\n" << "!1 = !{!\"llvm.loop.vectorize.enable\", i1 true}\n" << "!2 = !{!\"llvm.loop.vectorize.width\", i32 " << kArraySize << "}\n"; } void SingleLoopToString(std::ostream &os, const LoopFunction &x) { os << "target triple = \"x86_64-unknown-linux-gnu\"\n" << "define void @foo(i32* %a, i32* %b, i32* noalias %c, i64 %s) {\n" << "%cmp = icmp sgt i64 %s, 0\n" << "br i1 %cmp, label %start, label %end\n" << "start:\n" << "br label %loop\n" << "end:\n" << "ret void\n" << "loop:\n" << "%outer_ct = phi i64 [ %ctnew, %loop ], [ 0, %start ]\n" << x.outer_statements() << "%ctnew = add i64 %outer_ct, 1\n" << "%j = icmp eq i64 %ctnew, %s\n" << "br i1 %j, label %end, label %loop, !llvm.loop !0\n}\n" << "!0 = distinct !{!0, !1, !2}\n" << "!1 = !{!\"llvm.loop.vectorize.enable\", i1 true}\n" << "!2 = !{!\"llvm.loop.vectorize.width\", i32 " << kArraySize << "}\n"; } std::ostream &operator<<(std::ostream &os, const LoopFunction &x) { if (x.has_inner_statements()) NestedLoopToString(os, x); else SingleLoopToString(os, x); return os; } // --------------------------------- std::string LoopFunctionToLLVMString(const LoopFunction &input) { std::ostringstream os; os << input; return os.str(); } std::string LoopProtoToLLVM(const uint8_t *data, size_t size) { LoopFunction message; if (!message.ParsePartialFromArray(data, size)) return "#error invalid proto\n"; return LoopFunctionToLLVMString(message); } } // namespace clang_fuzzer