Caffe2 - C++ API
A deep learning, cross-platform ML framework
python_print.cpp
1 #include <c10/util/Exception.h>
2 #include <torch/csrc/jit/attributes.h>
3 #include <torch/csrc/jit/export.h>
4 #include <torch/csrc/jit/ir.h>
5 #include <torch/csrc/jit/ir_views.h>
6 #include <torch/csrc/jit/passes/python_print.h>
7 #include <torch/csrc/jit/resource_guard.h>
8 #include <torch/csrc/jit/script/error_report.h>
9 #include <torch/csrc/jit/script/module.h>
10 
11 namespace torch {
12 namespace jit {
13 
14 // like the Unix isprint, but insensitive to locale
15 static bool isPrint(char s) {
16  return s > 0x1f && s < 0x7f;
17 }
18 
19 void printQuotedString(std::ostream& stmt, const std::string& str) {
20  stmt << "\"";
21  for (auto s : str) {
22  switch (s) {
23  case '\\':
24  stmt << "\\\\";
25  break;
26  case '\'':
27  stmt << "\\'";
28  break;
29  case '\"':
30  stmt << "\\\"";
31  break;
32  case '\a':
33  stmt << "\\a";
34  break;
35  case '\b':
36  stmt << "\\b";
37  break;
38  case '\f':
39  stmt << "\\f";
40  break;
41  case '\n':
42  stmt << "\\n";
43  break;
44  case '\r':
45  stmt << "\\r";
46  break;
47  case '\t':
48  stmt << "\\t";
49  break;
50  case '\v':
51  stmt << "\\v";
52  break;
53  default:
54  if (isPrint(s)) {
55  stmt << s;
56  } else {
57  // C++ io has stateful formatting settings. Messing with
58  // them is probably worse than doing this manually.
59  char buf[4] = "000";
60  buf[2] += s % 8;
61  s /= 8;
62  buf[1] += s % 8;
63  s /= 8;
64  buf[0] += s;
65  stmt << "\\" << buf;
66  }
67  break;
68  }
69  }
70  stmt << "\"";
71 }
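// Example (illustrative): for a non-printable byte such as char(1), the
// fallback branch above emits a three-digit octal escape, so a string
// containing that byte between 'a' and 'b' is written as "a\001b"
// (including the surrounding double quotes).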
72 
73 static bool isValidIdentifierChar(char c, size_t pos) {
74  return islower(c) || isupper(c) || c == '_' || (pos > 0 && isdigit(c));
75 }
76 
77 static bool isValidIdentifier(const std::string& name) {
78  if (name.size() == 0)
79  return false;
80  for (size_t i = 0; i < name.size(); ++i) {
81  if (!isValidIdentifierChar(name[i], i))
82  return false;
83  }
84  return true;
85 }
86 
87 // handles names of the form, e.g., self.a.b
88 // if a field is not a valid identifier, then it will print as, e.g.
89 // getattr(self, "0").b
90 struct QualifiedName;
91 using QualifiedNamePtr = c10::intrusive_ptr<QualifiedName>;
92 struct QualifiedName : c10::intrusive_ptr_target {
93  QualifiedName(QualifiedNamePtr prefix, std::string name)
94  : prefix_(std::move(prefix)), name_(std::move(name)) {}
95  QualifiedNamePtr prefix_;
96  std::string name_;
97  static QualifiedNamePtr create(QualifiedNamePtr prefix, std::string name) {
98  return c10::make_intrusive<QualifiedName>(
99  std::move(prefix), std::move(name));
100  }
101  static QualifiedNamePtr create(std::string name) {
102  return c10::make_intrusive<QualifiedName>(
103  QualifiedNamePtr(), std::move(name));
104  }
105  std::string str() const {
106  std::stringstream ss;
107  emit(ss);
108  return ss.str();
109  }
110 
111  private:
112  void emit(std::ostream& out) const {
113  if (isValidIdentifier(name_)) {
114  if (prefix_) {
115  prefix_->emit(out);
116  out << ".";
117  }
118  out << name_;
119  } else {
120  AT_ASSERT(prefix_);
121  out << "getattr(";
122  prefix_->emit(out);
123  out << ", ";
124  printQuotedString(out, name_);
125  out << ")";
126  }
127  }
128 };
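// Example (illustrative; the field names are hypothetical): a nested name
// built as create(create(create("self"), "layers"), "0") prints via str()
// as getattr(self.layers, "0"), since "0" is not a valid identifier.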
129 
130 void createTensorToParameterNameMap(
131  const script::Module& module,
132  const QualifiedNamePtr& prefix,
133  std::unordered_map<IValue*, QualifiedNamePtr>& result) {
134  for (const auto& elem : module.get_parameters()) {
135  const script::NamedIValue& param = elem.value();
136  result[param.slot()] = QualifiedName::create(prefix, param.name_);
137  }
138  for (const auto& elem : module.get_attributes()) {
139  const script::NamedIValue& param = elem.value();
140  result[param.slot()] = QualifiedName::create(prefix, param.name_);
141  }
142  for (const auto& elem : module.get_modules()) {
143  createTensorToParameterNameMap(
144  *elem->module, QualifiedName::create(prefix, elem.key()), result);
145  }
146 }
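// Example (illustrative; module and parameter names are hypothetical): for a
// module with a submodule "conv" owning a parameter "weight", the recursion
// above maps that parameter's slot to the qualified name self.conv.weight.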
147 
148 // some names are valid identifiers but off limits because
149 // they are keywords or namespaces used in the output
150 const static std::unordered_set<std::string> reserved_names = {
151  // identifiers in the environment while parsing
152  "_", // avoid the confusing unnamed _
153  "aten",
154  "attribute",
155  "CONSTANTS",
156  "fork",
157  "getattr",
158  "inf",
159  "nan",
160  "ops",
161  "self",
162  // the python keywords
163  "and",
164  "as",
165  "assert",
166  "async",
167  "await",
168  "break",
169  "class",
170  "continue",
171  "def",
172  "del",
173  "elif",
174  "else",
175  "except",
176  "False",
177  "finally",
178  "for",
179  "from",
180  "global",
181  "if",
182  "import",
183  "in",
184  "is",
185  "lambda",
186  "None",
187  "nonlocal",
188  "not",
189  "or",
190  "pass",
191  "raise",
192  "return",
193  "True",
194  "try",
195  "while",
196  "with",
197  "yield",
198 };
199 
200 struct PythonPrintPass {
201  std::ostream& out;
202 
203  // constants are written to this table, and are then given the name CONSTANTS.cN
204  // where N is the index into this table.
205  std::vector<at::Tensor>& tensor_table_;
206 
207  // Any classes used are written to this table, to be later written out as
208  // dependencies.
209  std::vector<ClassTypePtr>& class_table_;
210  // Helper to avoid duplicating class types
211  void addToClassTable(const ClassTypePtr& classType) {
212  if (std::find(class_table_.cbegin(), class_table_.cend(), classType) ==
213  class_table_.cend()) {
214  class_table_.push_back(classType);
215  }
216  }
217 
218  // When printing this node, is it safe to write it inline (i.e. without
219  // assigning a temporary variable)
220  std::unordered_set<Node*> output_inline_;
221 
222  // when we print this, should we error if the resulting output would
223  // not be able to be reparsed?
224  bool enforce_importable_;
225 
226  // what valid identifiers are in use for the current function
227  std::unordered_set<std::string> used_names_;
228 
229  // used method names
230  std::unordered_set<std::string> used_method_names_;
231 
232  // for fork,
233  // subgraphs get added to the worklist, and will be printed later
234  std::vector<std::function<void(void)>> worklist;
235 
236  // scanValue, scanNode, scanBlock:
237  // decide if it is safe to omit the output of a temporary variable,
238  // and inline the expression into its use
239  // we only do this if
240  // (1) it is a constant, or
241  // (2) the temporary is unnamed, is single output, is used once,
242  // and would appear in the same order when the expression tree is
243  // reparsed.
244  // The last case can be checked
245  // because when we emit an expression tree in the parser,
246  // we do a left-to-right postorder traversal of the expression tree (emit
247  // children, then emit op). The reverse of this is a right-to-left preorder
248  // traversal of the tree. By doing a right-to-left preorder traversal of the
249  // inputs of a node, while also scanning the list of emitted nodes backward,
250  // we can see if they line up with what would happen when we parse the node as
251  // an expression. While they line up we collapse them into an inline
252  // expression.
253 
254  // The inductive step is that the right-most input should be produced by the
255  // node immediately before the current node if it is in tree order.
256 
257  bool canInline(Value* v) {
258  Node* n = v->node();
259  // there must be only 1 value, otherwise we need an assignment to handle
260  // the multiple output values
261  if (n->outputs().size() != 1)
262  return false;
263  // if it is used more than once, then we need a variable
264  if (v->uses().size() != 1)
265  return false;
266  auto use = v->uses().at(0);
267  // if it has a name set, then it was written as a variable so preserve that
268  // unless it is being fed directly to the end of the block.
269  // in which case it is not as useful to give it a name just to return it
270  if (v->hasUniqueName() && use.user->kind() != prim::Return)
271  return false;
272  // don't try to inline control blocks
273  if (n->blocks().size() != 0)
274  return false;
275  // if it is a loop-carried input, we need a variable
276  // otherwise the condition or trip count may be emitted in the wrong order
277  // w.r.t. to it
278  if (use.user->kind() == prim::Loop && use.offset >= 2)
279  return false;
280  return true;
281  }
282 
283  // block_point is the current node in the reverse linear scan of the emitted
284  // nodes. v is the current value in the tree traversal that may match with
285  // block_point's output.
286  Node* scanValue(Node* block_point, Value* v) {
287  Node* n = v->node();
288  AT_ASSERT(n->kind() == prim::Constant || output_inline_.count(n) == 0);
289 
290  if (n == block_point &&
291  canInline(v)) { // the node must be at the expected point of the typical
292  // tree traversal
293  // recursively see if we can inline the inputs to this input
294  block_point = scanNode(block_point);
295  output_inline_.insert(n);
296  } else if (n->kind() == prim::Constant) {
297  // constant nodes can always be inlined, we will de-dup them on parsing
298  // and put them at the top of the function regardless
299  output_inline_.insert(n);
300  }
301  return block_point;
302  }
303  Node* previousNonConstant(Node* n) {
304  do {
305  n = n->prev();
306  } while (n->kind() == prim::Constant);
307  return n;
308  }
309 
310  Node* scanNode(Node* n) {
311  // don't bother to scan nodes we have already determined to be inline
312  if (output_inline_.count(n)) {
313  return n;
314  }
315  for (auto b : n->blocks()) {
316  scanBlock(b);
317  }
318  Node* block_point = previousNonConstant(n);
319  for (auto it = n->inputs().rbegin(), end = n->inputs().rend(); it != end;
320  ++it) {
321  block_point = scanValue(block_point, *it);
322  }
323  return block_point;
324  }
325 
326  void scanBlock(Block* b) {
327  scanNode(b->return_node());
328  for (auto node : b->nodes().reverse()) {
329  scanNode(node);
330  }
331  }
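// Example (illustrative): for a block like
//   %1 = aten::mul(%a, %b)
//   %2 = aten::add(%1, %c)
//   return (%2)
// the backward scan finds that %1 is single-output, used once, unnamed, and
// sits immediately before %2, so both are marked inline and the printer can
// later emit roughly: return torch.add(torch.mul(a, b), c)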
332 
333  size_t getOrAddTensorConstant(at::Tensor t) {
334  // XXX - N^2 warning. This code does the exact same thing as
335  // ConstantPool, which is also N^2 in the size of the constants,
336  // because it doesn't hash any information about the tensors.
337  // We will probably need to optimize this at some point using hashing.
338  for (size_t i = 0; i < tensor_table_.size(); ++i) {
339  if (t.type() == tensor_table_[i].type() && t.equal(tensor_table_[i])) {
340  return i;
341  }
342  }
343  AT_ASSERT(t.is_variable());
344  tensor_table_.emplace_back(std::move(t));
345  return tensor_table_.size() - 1;
346  }
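// Note (illustrative): the index returned here is the N used when the
// constant is later printed as "CONSTANTS.cN" (see printConstant below);
// the tensors collected in tensor_table_ are left for the caller to
// serialize alongside the printed source.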
347 
348  std::unordered_set<Node*> seen_constants;
349  void buildConstantList(Node* n, std::vector<Node*>& constants) {
350  for (auto input : n->inputs()) {
351  if (input->node()->kind() == prim::Constant &&
352  seen_constants.count(input->node()) == 0) {
353  constants.push_back(input->node());
354  seen_constants.insert(input->node());
355  }
356  }
357  for (auto b : n->blocks()) {
358  buildConstantList(b, constants);
359  }
360  }
361  void buildConstantList(Block* b, std::vector<Node*>& constants) {
362  for (auto n : b->nodes())
363  buildConstantList(n, constants);
364  buildConstantList(b->return_node(), constants);
365  }
366 
367  // get a new name unique across calls to uniqueName() and
368  // anything we have used.
369  std::unordered_map<std::string, size_t> next_id;
370 
371  std::string genNameImpl(
372  const std::string& candidate,
373  std::unordered_set<std::string>& used) {
374  std::string name = candidate;
375  while (used.count(name) || reserved_names.count(name)) {
376  name = candidate + std::to_string(next_id[name]++);
377  }
378  used.insert(name);
379  return name;
380  }
381  std::string genName(const std::string& candidate) {
382  return genNameImpl(candidate, used_names_);
383  }
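// Example (illustrative): genName("x") returns "x" if it is unused and not
// reserved; otherwise numeric suffixes are appended ("x0", "x1", ...) until
// a free name is found.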
384 
385  // methods self.foo are in a different namespace than
386  // global identifiers, so they have a different procedure for finding a
387  // unique name
388  std::string genMethodName(const std::string& candidate) {
389  return genNameImpl(candidate, used_method_names_);
390  }
391 
392  // unique names might not be valid identifiers,
393  // force them to be by rewriting them
394  static std::string makeValidIdentifier(const std::string& candidate) {
395  std::stringstream ss;
396  if (candidate.size() == 0 || isdigit(candidate[0]))
397  ss << "_";
398  for (char c : candidate) {
399  if (isupper(c) || islower(c) || isdigit(c) || c == '_')
400  ss << c;
401  else
402  ss << '_';
403  }
404  return ss.str();
405  }
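// Example (illustrative): makeValidIdentifier("2x.y") yields "_2x_y": a
// leading underscore because the name starts with a digit, and '_' in place
// of the '.' that is not a legal identifier character.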
406  // if we have to assign 'v' a name, what should it be?
407  // use the uniqueName if it was set, otherwise generate a name.
408  std::string genUniqueNameFor(Value* v) {
409  return genName(
410  v->hasUniqueName() ? makeValidIdentifier(v->uniqueNameBase()) : "_");
411  }
412 
413  // map from Value to how it should be printed at each use
414  std::unordered_map<Value*, std::string> value_names_;
415 
416  std::string useOf(Value* v) const {
417  return value_names_.at(v);
418  }
419  void assignValue(Value* v, const std::string& s) {
420  value_names_[v] = s;
421  }
422  void assignValue(Value* v, Value* w) {
423  assignValue(v, useOf(w));
424  }
425  void assignValuesToTheirUniqueNames(at::ArrayRef<Value*> values) {
426  for (auto v : values) {
427  assignValue(v, genUniqueNameFor(v));
428  }
429  }
430 
431  size_t level = 0;
432  // indent to the current indent level
433  std::ostream& indent() {
434  for (size_t i = 0; i < level; ++i) {
435  out << " ";
436  }
437  return out;
438  }
439 
440  ResourceGuard WithIndented() {
441  level++;
442  return ResourceGuard([this] { level--; });
443  }
444 
445  template <class T0, class T1, class F>
446  void zipWith(at::ArrayRef<T0> list_a, at::ArrayRef<T1> list_b, F action)
447  const {
448  auto it_a = list_a.begin();
449  auto it_b = list_b.begin();
450 
451  if (list_a.size() != list_b.size()) {
452  AT_ERROR("Python printer expected 2 lists of same size");
453  }
454 
455  for (; it_a != list_a.end(); ++it_a, ++it_b) {
456  action(*it_a, *it_b);
457  }
458  }
459 
460  void printValueList(
461  std::ostream& stmt,
462  at::ArrayRef<Value*> list,
463  const char* begin = "",
464  const char* end = "") {
465  stmt << begin;
466  auto delimiter = "";
467  for (auto* value : list) {
468  stmt << delimiter;
469  stmt << useOf(value);
470  delimiter = ", ";
471  }
472  stmt << end;
473  }
474 
475  void printDict(
476  std::ostream& stmt,
477  at::ArrayRef<Value*> key_value_pairs,
478  const char* begin = "{",
479  const char* end = "}") {
480  stmt << begin;
481  auto delimiter = "";
482  for (size_t i = 0; i < key_value_pairs.size(); i += 2) {
483  stmt << delimiter;
484  auto key = key_value_pairs[i];
485  auto value = key_value_pairs[i + 1];
486 
487  stmt << useOf(key) << ": " << useOf(value);
488 
489  delimiter = ", ";
490  }
491  stmt << end;
492  }
493 
494  void printAssignment(at::ArrayRef<Value*> lhs, at::ArrayRef<Value*> rhs) {
495  if (lhs.size() > 0) {
496  indent();
497  printValueList(out, lhs);
498  out << " = ";
499  printValueList(out, rhs);
500  out << "\n";
501  }
502  }
503 
504  void printIf(IfView stmt) {
505  assignValuesToTheirUniqueNames(stmt.outputs());
506  indent() << "if " << useOf(stmt.cond()) << ":\n";
507  {
508  auto guard = WithIndented();
509  // Print node contents
510  printBlock(stmt.thenBlock(), stmt.outputs().size() > 0);
511  printAssignment(stmt.outputs(), stmt.thenOutputs());
512  }
513  indent() << "else:\n";
514  {
515  auto guard = WithIndented();
516  printBlock(stmt.elseBlock(), stmt.outputs().size() > 0);
517  printAssignment(stmt.outputs(), stmt.elseOutputs());
518  }
519  }
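// Example (illustrative; variable names are hypothetical): an If node with
// one output prints roughly as
//   if cond:
//     y = <then-branch value>
//   else:
//     y = <else-branch value>
// where y is the unique name assigned to the node's output above.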
520 
521  // our way of encoding loops makes them difficult to turn back into python
522  // syntax. we have to check properties of the condition and trip count inputs
523  // to figure out which one it initially was
524  static bool shouldEmitAsForLoop(LoopView stmt) {
525  auto trip_count = toIValue(stmt.maxTripCount());
526  auto cond_input = toIValue(stmt.inputCond());
527  auto cond_next = toIValue(stmt.nextCond());
528 
529  bool condition_is_always_true =
530  cond_input && cond_input->toBool() && cond_next && cond_next->toBool();
531  bool trip_count_is_specified = !trip_count || // trip is not a constant
532  trip_count->toInt() !=
533  std::numeric_limits<int64_t>::max() || // it is a constant but not
534  // the default one
535  stmt.currentTripCount()->uses().size() >
536  0; // it is actually being used in the body.
537 
538  if (condition_is_always_true) {
539  // if the trip count was not specified this was a user-written while True:
540  return trip_count_is_specified;
541  } else {
542  // this must be a while loop, but check that there isn't _also_ a trip
543  // count
544  if (trip_count_is_specified) {
545  throw script::ErrorReport(stmt.node()->getSourceLocation())
546  << "loop cannot be printed as python "
547  << "because it has gone through an optimization "
548  << "that combined while and for loops. File a bug.";
549  }
550  return false;
551  }
552  }
553 
554  void printLoop(LoopView stmt) {
555  // Loop carried dependencies are handled by assigning their initial
556  // values to the node->outputs() before the loop,
557  // and assign node->outputs() to the new values at the end of each trip.
558 
559  bool emit_as_for_loop = shouldEmitAsForLoop(stmt);
560 
561  assignValuesToTheirUniqueNames(stmt.carriedOutputs());
562  // Add aliases for loop-carried dependencies
563  zipWith(
564  stmt.bodyCarriedInputs(), // Start at 1 to ignore trip count
565  stmt.carriedOutputs(),
566  [&](Value* block_input, Value* node_output) {
567  assignValue(block_input, node_output);
568  });
569 
570  // Print initial assignments of loop node outputs = loop node inputs
571  printAssignment(stmt.carriedOutputs(), stmt.carriedInputs());
572 
573  assignValuesToTheirUniqueNames(stmt.currentTripCount());
574  // Loop header
575  if (emit_as_for_loop) {
576  indent();
577  out << "for " << useOf(stmt.currentTripCount()) << " in range("
578  << useOf(stmt.maxTripCount()) << "):\n";
579  } else {
580  // note: trip_count_in_block is unused because this is a while loop,
581  // so we reuse the Value* as a stand-in for the loop condition
582  printAssignment(stmt.currentTripCount(), stmt.inputCond());
583  indent();
584  out << "while " << useOf(stmt.currentTripCount()) << ":\n";
585  }
586  // Loop body
587  {
588  ResourceGuard indent = WithIndented();
589  // Update block outputs to block inputs for next loop iteration
590  // skip the assignment to the new condition in for loops because
591  // the condition is always True
592  size_t offset = emit_as_for_loop ? 1 : 0;
593  auto body_block = stmt.bodyBlock();
594  ArrayRef<Value*> loop_carried_block_inputs =
595  body_block->inputs().slice(offset);
596  printBlock(body_block, loop_carried_block_inputs.size() > 0);
597  printAssignment(
598  loop_carried_block_inputs, body_block->outputs().slice(offset));
599  }
600  }
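// Example (illustrative): a Loop whose condition is constantly true prints
// as a for loop,
//   for i in range(max_trip_count):
//     ...
// while a genuine while loop prints as
//   cond = <initial condition>
//   while cond:
//     ...
//     cond = <next condition>
// with loop-carried values assigned before the loop and re-assigned at the
// end of each iteration body.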
601 
602  bool isLongLine(const std::string& str) {
603  return str.size() + level * 2 >= 40;
604  }
605 
606  bool isLongInline(Node* node) {
607  return output_inline_.count(node) && isLongLine(useOf(node->output()));
608  }
609 
610  bool isNonConstantInline(Value* input) {
611  return input->node()->kind() != prim::Constant &&
612  output_inline_.count(input->node());
613  }
614 
615  // [reordering of inlines]
616  // We inline anything that is semantically legal to inline, but sometimes
617  // we find that these lines get too long. In that case we break the lines
618  // and it is important that we un-inline all the inputs
619  // preceding the long input, e.g.:
620  // r = foo(x.add_(b), some_long + expression)
621  // wrong!
622  // _0 = some_long + expression
623  // r = foo(x.add_(b), _0) # wrong! _0 runs before mutating add_
624  // legal!
625  // _0 = x.add_(b)
626  // _1 = some_long + expression
627  // r = foo(_0, _1)
628  void splitLongInlines(at::ArrayRef<Value*> inputs) {
629  size_t long_inline_slice = 0;
630  // find the last input that is too long
631  for (size_t i = 0; i < inputs.size(); ++i) {
632  if (isLongInline(inputs[i]->node())) {
633  long_inline_slice = i + 1;
634  }
635  }
636  // un-inline everything through the last long line
637  // constants are ignored since long constants are never inlined in the
638  // first place
639  for (size_t i = 0; i < long_inline_slice; ++i) {
640  if (isNonConstantInline(inputs[i])) {
641  printOutputDefinition(inputs[i]->node(), useOf(inputs[i]));
642  }
643  }
644  }
645 
646  void printOutputDefinition(Node* node, const std::string& str) {
647  assignValuesToTheirUniqueNames(node->outputs());
648  indent();
649  // Print outputs
650  if (node->outputs().size() > 0) {
651  printValueList(out, node->outputs());
652  out << " = ";
653  }
654  out << str << "\n";
655  }
656 
657  // Recursively check contained types for any class dependencies
658  void registerClassDependencies(const TypePtr& type) {
659  if (const auto classType = type->cast<ClassType>()) {
660  addToClassTable(classType);
661  }
662  for (const auto& containedType : type->containedTypes()) {
663  registerClassDependencies(containedType);
664  }
665  }
666 
667  void printNode(Node* node, bool print_const) {
668  // Check for class dependencies. If this node inputs or outputs a class
669  // type, we need to add it to our table of dependencies.
670  for (const auto input : node->inputs()) {
671  registerClassDependencies(input->type());
672  }
673  for (const auto output : node->outputs()) {
674  registerClassDependencies(output->type());
675  }
676 
677  if (!print_const && node->kind() == prim::Constant)
678  return;
679  if (node->kind() == prim::PythonOp) {
680  auto value = static_cast<const PythonOp*>(node);
681  if (enforce_importable_ && value->ignore_on_export) {
682  // Op has been marked as ignored, so insert an error in its place
683  indent();
684  out << "ops.prim.IgnoredPythonOp()\n";
685  return;
686  }
687  }
688  splitLongInlines(node->inputs());
689  switch (node->kind()) {
690  case prim::Return:
691  if (enforce_importable_ && node->inputs().size() != 1) {
692  throw script::ErrorReport(node->getSourceLocation())
693  << "Exportable methods must have a single return value. "
694  << "Normal use of ScriptMethods should enforce this.";
695  }
696  if (node->inputs().size() > 0) {
697  indent();
698  out << "return ";
699  printValueList(out, node->inputs());
700  out << "\n";
701  }
702  break;
703  case prim::Loop:
704  printLoop(LoopView(node));
705  break;
706  case prim::If:
707  printIf(IfView(node));
708  break;
709  case prim::TupleUnpack:
710  case prim::ListUnpack:
711  assignValuesToTheirUniqueNames(node->outputs());
712  indent();
713  // TupleUnpack(unpacked) turns into an assignment op that forces
714  // the unpack to be inserted when parsed back in:
715  // a, b, = unpacked
716  // a, = unpacked # trailing comma forces an unpack to happen
717  if (node->outputs().size() > 0) {
718  printValueList(out, node->outputs(), "", ", = ");
719  }
720  out << useOf(node->input()) << "\n";
721  break;
722  case prim::SetAttr: {
723  const auto obj = node->inputs().at(0);
724  const auto newVal = node->inputs().at(1);
725  const auto type = obj->type()->expect<ClassType>();
726  const auto& attrname = node->s(attr::name);
727  indent();
728  out << useOf(obj) << "." << attrname << " = " << useOf(newVal) << "\n";
729  } break;
730  default:
731  std::stringstream ss;
732  printRHS(ss, node);
733 
734  // we prevent long constants from inlining here.
735  // it is not safe to do the same thing for non-constants here
736  // because of [reordering of inlines]
737  if (output_inline_.count(node) == 0 ||
738  (node->kind() == prim::Constant && isLongLine(ss.str()))) {
739  printOutputDefinition(node, ss.str());
740  } else {
741  // this node is safe to inline, so assign the output value
742  // to that expression directly
743  assignValue(node->output(), ss.str());
744  }
745  }
746  }
747 
748  void printMaybeAnnotatedConstantList(
749  std::ostream& stmt,
750  const char* the_type,
751  size_t list_size,
752  const IValue& the_list) {
753  if (list_size == 0) {
754  stmt << "annotate(List[" << the_type << "], [])";
755  } else {
756  stmt << the_list;
757  }
758  }
759 
760  void printConstant(std::ostream& stmt, const IValue& v) {
761  if (v.isTensor()) {
762  stmt << "CONSTANTS.c" << getOrAddTensorConstant(v.toTensor());
763  } else if (v.isString()) {
764  printQuotedString(stmt, v.toStringRef());
765  } else if (v.isDevice()) {
766  std::stringstream ss;
767  ss << v.toDevice();
768  stmt << "torch.device(";
769  printQuotedString(stmt, ss.str());
770  stmt << ")";
771  } else if (v.isTensorList()) {
772  stmt << "[";
773  const char* delim = "";
774  for (const auto& t : v.toTensorListRef()) {
775  stmt << delim << "CONSTANTS.c" << getOrAddTensorConstant(t);
776  delim = ", ";
777  }
778  stmt << "]";
779  } else if (v.isBoolList()) {
780  printMaybeAnnotatedConstantList(
781  stmt, "bool", v.toBoolListRef().size(), v);
782  } else if (v.isIntList()) {
783  printMaybeAnnotatedConstantList(stmt, "int", v.toIntListRef().size(), v);
784  } else if (v.isDoubleList()) {
785  printMaybeAnnotatedConstantList(
786  stmt, "float", v.toDoubleListRef().size(), v);
787  } else {
788  stmt << v;
789  }
790  }
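// Example (illustrative): a string constant prints as a quoted literal, a
// tensor as CONSTANTS.cN, a device as torch.device("cuda:0"), and an empty
// typed list as, e.g., annotate(List[int], []).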
791 
792  void printNone(std::ostream& stmt, const Node* node) {
793  if (node->output()->type()->isSubtypeOf(NoneType::get())) {
794  stmt << "None";
795  return;
796  }
797  // XXX - when None has an Optional[T] type, we must ensure that type
798  // can be recovered on parsing. It cannot be recovered if it will be
799  // matched to schema with free variables. If it is used only in places
800  // where there is a schema and the schema has no free variables, then we
801  // can recover it without annotation. Otherwise, we annotate None with
802  // the right optional type
803  const auto& uses = node->output()->uses();
804  bool all_usable_schema =
805  std::all_of(uses.begin(), uses.end(), [](const Use& u) {
806  if (auto schema = u.user->maybeSchema()) {
807  if (u.offset >= schema->arguments().size()) {
808  return false;
809  }
810  return !schema->arguments().at(u.offset).type()->hasFreeVariables();
811  }
812  return false;
813  });
814 
815  if (all_usable_schema) {
816  stmt << "None";
817  } else {
818  stmt << "annotate(" << node->output()->type()->python_str() << ", None)";
819  }
820  }
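// Example (illustrative): a None whose uses cannot all be matched against
// schema arguments of concrete type prints as, e.g.,
// annotate(Optional[Tensor], None) so the optional type survives re-parsing.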
821 
822  // Prints the RHS value of a Node, e.g. `aten.add(x, y)`
823  void printRHS(std::ostream& stmt, Node* node) {
824  switch (node->kind()) {
825  case PythonOp::Kind: {
826  auto value = static_cast<const PythonOp*>(node);
827  if (enforce_importable_) {
828  throw script::ErrorReport(node->getSourceLocation())
829  << "could not export python function call " << value->name()
830  << ". Remove calls to Python functions before export. "
831  << "Did you forget to add @script annotation? "
832  << "If this is a modulelist, add it to __constants__.";
833  }
834 
835  stmt << "^" << value->name();
836  value->writeScalars(stmt);
837  printValueList(stmt, node->inputs(), "(", ")");
838  } break;
839  case prim::Constant: {
840  if (node->kind() == prim::Constant && !node->mustBeNone()) {
841  IValue v = toIValue(node->output()).value();
842  printConstant(stmt, v);
843  } else {
844  printNone(stmt, node);
845  }
846  } break;
847  case prim::ImplicitTensorToNum: {
848  stmt << "annotate(" << node->output()->type()->python_str() << ", "
849  << useOf(node->input()) << ")";
850  } break;
851  case prim::Int: {
852  printValueList(stmt, node->inputs(), "int(", ")");
853  } break;
854  case prim::Float: {
855  printValueList(stmt, node->inputs(), "float(", ")");
856  } break;
857  case prim::Bool: {
858  printValueList(stmt, node->inputs(), "bool(", ")");
859  } break;
860  case prim::Print: {
861  printValueList(stmt, node->inputs(), "print(", ")");
862  } break;
863  case prim::TupleConstruct: {
864  printValueList(
865  stmt, node->inputs(), "(", node->inputs().size() == 1 ? ",)" : ")");
866  } break;
867  case prim::TupleIndex: {
868  stmt << "(" << useOf(node->input()) << ")[" << node->i(attr::index)
869  << "]";
870  } break;
871  case prim::TupleSlice: {
872  stmt << "(" << useOf(node->input()) << ")[" << node->i(attr::beg) << ":"
873  << node->i(attr::end) << "]";
874  } break;
875  case prim::ListConstruct: {
876  // when the list is empty and is not a list of tensors,
877  // we need to annotate it, otherwise it won't be possible
878  // to infer the type on import
879  if (node->inputs().size() == 0 &&
880  !node->output()->type()->isSubtypeOf(TensorType::get())) {
881  stmt << "annotate(" << node->output()->type()->python_str()
882  << ", [])";
883  } else {
884  printValueList(stmt, node->inputs(), "[", "]");
885  }
886  } break;
887  case prim::DictConstruct: {
888  auto dict_type = node->output()->type()->expect<DictType>();
889  bool is_default_type =
890  dict_type->getKeyType()->isSubtypeOf(StringType::get()) &&
891  dict_type->getValueType()->isSubtypeOf(TensorType::get());
892  if (node->inputs().size() == 0 && !is_default_type) {
893  stmt << "annotate(" << node->output()->type()->python_str()
894  << ", {})";
895  } else {
896  printDict(stmt, node->inputs());
897  }
898  } break;
899  case prim::DictIndex: {
900  stmt << "(" << useOf(node->inputs().at(0)) << ")["
901  << useOf(node->inputs().at(1)) << "]";
902  } break;
903  case prim::fork: {
904  // the subgraph gets emitted as another function
905  auto name = genMethodName("__forked_function");
906  std::shared_ptr<Graph> graph = node->g(attr::Subgraph);
907  worklist.emplace_back(
908  [graph, name, this] { printFunctionDefinition(*graph, name); });
909  // and we put a call to fork which invokes that function.
910  stmt << "fork(self." << name;
911  for (Value* v : node->inputs()) {
912  stmt << ", " << useOf(v);
913  }
914  stmt << ")";
915  } break;
916  case prim::Function: {
917  if (enforce_importable_) {
918  throw script::ErrorReport(node->getSourceLocation())
919  << "closures are not exportable";
920  }
921  auto name = genMethodName("__lambda");
922  std::shared_ptr<Graph> graph = node->g(attr::Subgraph);
923  worklist.emplace_back(
924  [graph, name, this] { printFunctionDefinition(*graph, name); });
925  stmt << "self." << name;
926  } break;
927  case prim::CreateObject: {
928  const auto classType = node->output()->type()->expect<ClassType>();
929  stmt << classType->name() << ".__new__(" << classType->name() << ")";
930  } break;
931  case prim::GetAttr: {
932  const auto obj = node->inputs().at(0);
933  const auto classType = obj->type()->expect<ClassType>();
934  const auto& field = node->s(attr::name);
935  stmt << useOf(obj) << "." << field;
936  } break;
937  default: {
938  Symbol kind = node->kind();
939  if (kind.is_aten()) {
940  // special case aten -> torch because we want to rename
941  // the aten namespace, but this change will take more time
942  // doing it here ensures we do not have to fix up archives later
943  stmt << "torch." << kind.toUnqualString() << "(";
944  } else {
945  stmt << "ops." << kind.ns().toUnqualString() << "."
946  << kind.toUnqualString() << "(";
947  }
948  const FunctionSchema& schema = node->schema();
949  for (size_t i = 0; i < node->inputs().size(); ++i) {
950  if (i > 0) {
951  stmt << ", ";
952  }
953  auto v = useOf(node->inputs().at(i));
954  // print the kwarg name if it is a kwarg only argument.
955  if (i < schema.arguments().size()) {
956  auto arg = schema.arguments().at(i);
957  if (arg.kwarg_only()) {
958  stmt << arg.name() << "=";
959  }
960  } else {
961  // vararg functions like format can have extra arguments
962  AT_ASSERT(schema.is_vararg());
963  }
964  stmt << v;
965  }
966  stmt << ")";
967  } break;
968  }
969  }
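// Example (illustrative): in the default case an aten operator prints as
// torch.<op>(inputs...), with "name=" prefixes added only for kwarg-only
// schema arguments, while operators in other namespaces print as
// ops.<namespace>.<op>(inputs...).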
970 
971  std::ostream& printBlock(Block* root, bool block_has_other_statements) {
972  // Python's weird 'pass' syntax creates a bunch of places where we have to
973  // check if this block would be empty. But not everything in a block is a
974  // node. Sometimes if, loop, and return statements will follow this block
975  // and block_has_other_statements == true.
976  if (!block_has_other_statements &&
977  root->nodes().begin() == root->nodes().end()) {
978  indent();
979  out << "pass\n";
980  }
981  for (auto* node : root->nodes()) {
982  printNode(node, /*print_const=*/false);
983  }
984  return out;
985  }
986 
987  void printDefaultValue(
988  const TypePtr& typ,
989  std::ostream& stmt,
990  const IValue& value) {
991  // xxx - many weak script modules store default values for broadcasting
992  // lists that are not actually the same type as the argument. We can only
993  // serialize default values that will implicitly convert to their declared
994  // return type. Since we do not need to serialize these built-in modules with
995  // their defaults, we just drop them for now.
996  if (typ->kind() == ListType::Kind &&
997  (value.isInt() || value.isDouble() || value.isBool())) {
998  return;
999  }
1000  stmt << "=";
1001  printConstant(stmt, value);
1002  }
1003  void printFunctionDefinition(
1004  Graph& graph,
1005  const std::string& name,
1006  bool is_class = false,
1007  const std::vector<c10::optional<IValue>>& defaults = {},
1008  const std::vector<std::string>& param_names = {}) {
1009  used_names_.clear(); // each graph can reuse local names
1010 
1011  // we always print constants at the top of the function, in the order
1012  // in which they are used.
1013  std::vector<Node*> constants;
1014  buildConstantList(graph.block(), constants);
1015 
1016  // current graph is used to de-dup names within a single graph
1017  scanBlock(graph.block());
1018 
1019  // last param_names.size() arguments to the graph are parameters and not
1020  // actual inputs; we will print these as, e.g., self.foo.bar,
1021  // while we print the true_inputs out as parameters
1022  auto true_inputs =
1023  graph.inputs().slice(0, graph.inputs().size() - param_names.size());
1024  auto param_names_it = param_names.begin();
1025  for (auto param : graph.inputs().slice(true_inputs.size())) {
1026  assignValue(param, *param_names_it++);
1027  }
1028  assignValuesToTheirUniqueNames(true_inputs);
1029  auto defaults_offset = defaults.begin();
1030 
1031  indent();
1032  out << "def " << name << "(";
1033 
1034  auto input_iter = true_inputs.begin();
1035  // Print the `self` argument
1036  if (is_class) {
1037  // If this is a class, print the self var without a type annotation,
1038  // following Python convention
1039  AT_ASSERT(true_inputs.size() > 0);
1040  out << useOf(*input_iter);
1041  ++input_iter;
1042 
1043  AT_ASSERT(!defaults_offset->has_value());
1044  ++defaults_offset;
1045  } else {
1046  // If this is not a class, then we need to insert a "self".
1047  out << "self";
1048  }
1049 
1050  // Print the rest of the arguments
1051  for (; input_iter != true_inputs.end(); ++input_iter) {
1052  auto input = *input_iter;
1053  out << ",\n " << useOf(input) << ": " << input->type()->python_str();
1054  if (defaults_offset != defaults.end()) {
1055  const c10::optional<IValue>& def = *defaults_offset++;
1056  if (def) {
1057  printDefaultValue(input->type(), out, *def);
1058  }
1059  }
1060  }
1061 
1062  // have we used all the provided defaults?
1063  AT_ASSERT(defaults_offset == defaults.end());
1064 
1065  out << ") -> " << resultType(graph)->python_str() << ":\n";
1066  {
1067  auto guard = WithIndented();
1068  // Print initial constant table (most are just inlined into their use,
1069  // but some like long strings do get emitted)
1070  for (Node* n : constants) {
1071  printNode(n, /*print_const=*/true);
1072  }
1073  // Print body
1074  printBlock(
1075  graph.block(), graph.block()->return_node()->inputs().size() > 0);
1076  printNode(graph.block()->return_node(), /*print_const=*/false);
1077  }
1078  }
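// Example (illustrative; the method name and argument types are
// hypothetical): the emitted definition looks roughly like
//   def forward(self,
//     x: Tensor,
//     scale: float=1.0) -> Tensor:
//     <long constants, then the printed body>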
1079 
1080  public:
1081  PythonPrintPass(
1082  std::ostream& out_,
1083  std::vector<at::Tensor>& tensor_table,
1084  std::vector<ClassTypePtr>& class_table,
1085  bool enforce_importable)
1086  : out(out_),
1087  tensor_table_(tensor_table),
1088  class_table_(class_table),
1089  enforce_importable_(enforce_importable) {}
1090 
1091  // TODO: we should consider forcing functions to return a single value
1092  // instead of handling this tuple logic both in the compiler and the printer
1093  TypePtr resultType(const Graph& graph) {
1094  if (graph.outputs().size() == 1) {
1095  return graph.outputs().at(0)->type();
1096  } else {
1097  return TupleType::create(
1098  fmap(graph.outputs(), [&](const Value* v) { return v->type(); }));
1099  }
1100  }
1101 
1102  void printFunction(
1103  Graph& graph,
1104  const std::string& name,
1105  bool is_class,
1106  const std::vector<c10::optional<IValue>>& defaults = {},
1107  const std::vector<std::string>& param_names = {}) {
1108  printFunctionDefinition(graph, name, is_class, defaults, param_names);
1109  while (!worklist.empty()) {
1110  out << "\n\n";
1111  auto work = worklist.back();
1112  worklist.pop_back();
1113  work();
1114  }
1115  }
1116  void printMethod(script::Method& method) {
1117  std::unordered_map<IValue*, QualifiedNamePtr> extra_ivalue_names;
1118  createTensorToParameterNameMap(
1119  method.owner(), QualifiedName::create("self"), extra_ivalue_names);
1120  printMethod(method, /*is_class=*/false, extra_ivalue_names);
1121  }
1122  void printMethod(
1123  script::Method& method,
1124  bool is_class,
1125  const std::unordered_map<IValue*, QualifiedNamePtr>& extra_ivalue_names) {
1126  std::vector<std::string> ivalue_names = fmap(
1127  method.initial_ivalues(),
1128  [&](IValue* slot) { return extra_ivalue_names.at(slot)->str(); });
1129  const std::string& name = method.name();
1130  Graph& graph = *method.graph();
1131  auto defaults = fmap(
1132  method.getSchema().arguments(),
1133  [](const Argument& arg) { return arg.default_value(); });
1134  printFunction(graph, name, is_class, defaults, ivalue_names);
1135  }
1136  void printModule(script::Module& module) {
1137  std::unordered_map<IValue*, QualifiedNamePtr> extra_ivalue_names;
1138  createTensorToParameterNameMap(
1139  module, QualifiedName::create("self"), extra_ivalue_names);
1140  for (auto& method : module.get_methods()) {
1141  const std::string& name = method.value()->name();
1142  // we skip __forked_functions because they actually get inlined into their
1143  // callers; exporting them again will lead to more code generated on each
1144  // export
1145  if (name.find("__forked_function") == 0) {
1146  continue;
1147  }
1148  printMethod(*method.value(), /*is_class=*/false, extra_ivalue_names);
1149  }
1150  }
1151 
1152  void printClass(const ClassTypePtr& classType) {
1153  out << "class " << classType->name() << ":\n";
1154  {
1155  const auto guard = WithIndented();
1156  std::unordered_map<IValue*, QualifiedNamePtr> extra_ivalue_names;
1157  for (auto& method : classType->methods()) {
1158  printMethod(*method, /*is_class=*/true, extra_ivalue_names);
1159  }
1160  }
1161  }
1162 };
1163 
1164 TORCH_API void PythonPrint(
1165  std::ostream& out,
1166  const Graph& graph,
1167  std::vector<at::Tensor>& tensor_table,
1168  std::vector<ClassTypePtr>& class_table,
1169  bool enforce_importable) {
1170  PythonPrintPass pp(out, tensor_table, class_table, enforce_importable);
1171  // NOLINTNEXTLINE(cppcoreguidelines-pro-type-const-cast)
1172  pp.printFunction(const_cast<Graph&>(graph), "graph", /*is_class=*/false);
1173 }
1174 
1175 TORCH_API void PythonPrint(
1176  std::ostream& out,
1177  const script::Method& method,
1178  std::vector<at::Tensor>& tensor_table,
1179  std::vector<ClassTypePtr>& class_table,
1180  bool enforce_importable) {
1181  PythonPrintPass pp(out, tensor_table, class_table, enforce_importable);
1182  // NOLINTNEXTLINE(cppcoreguidelines-pro-type-const-cast)
1183  pp.printMethod(const_cast<script::Method&>(method));
1184 }
1185 
1186 TORCH_API void PythonPrint(
1187  std::ostream& out,
1188  const script::Module& module,
1189  std::vector<at::Tensor>& tensor_table,
1190  std::vector<ClassTypePtr>& class_table,
1191  bool enforce_importable) {
1192  PythonPrintPass pp(out, tensor_table, class_table, enforce_importable);
1193  // NOLINTNEXTLINE(cppcoreguidelines-pro-type-const-cast)
1194  pp.printModule(const_cast<script::Module&>(module));
1195 }
1196 
1197 TORCH_API void PythonPrint(
1198  std::ostream& out,
1199  const ClassTypePtr& classType,
1200  std::vector<at::Tensor>& tensor_table,
1201  std::vector<ClassTypePtr>& class_table,
1202  bool enforce_importable) {
1203  PythonPrintPass pp(out, tensor_table, class_table, enforce_importable);
1204  pp.printClass(classType);
1205 }
1206 
1207 TORCH_API bool printerHasSpecialCaseFor(Symbol sym) {
1208  // WARNING: by adding a value to this set, you are asserting
1209  // that you have also added special handling of this symbol to
1210  // the printer above. Not adding handling will cause import and export
1211  // of modules with this new operator to fail. This is only required
1212  // for operators without schema. Prefer registering your operator with
1213  // schema to editing this list here. These cases should only be things
1214  // that require special handling because they do not fit normal schema
1215  const static std::unordered_set<Symbol> handled = {
1216  prim::Constant,
1217  prim::fork,
1218  prim::ListConstruct,
1219  prim::DictConstruct,
1220  prim::ListUnpack,
1221  prim::Print,
1222  prim::PythonOp,
1223  prim::TupleConstruct,
1224  prim::TupleIndex,
1225  prim::DictIndex,
1226  prim::TupleSlice,
1227  prim::TupleUnpack,
1228  prim::CreateObject,
1229  prim::GetAttr,
1230  prim::SetAttr,
1231  };
1232 
1233  // WARNING: by adding a value to this set, you are asserting that your
1234  // primitive is only ever added during optimization and does not need
1235  // to be correctly printed for export (a process that happens before
1236  // optimization passes run)
1237  const static std::unordered_set<Symbol> unneeded = {
1238  c10::onnx::Reshape, // only used in onnx
1239  c10::onnx::Shape, // only used in onnx
1240  prim::AutogradZero, // temporarily inserted by autograd
1241  prim::AutogradAnyNonZero, // temporarily inserted by autograd
1242  prim::AutogradAdd, // temporarily inserted by autograd
1243  prim::ConstantChunk, // optimization pass adds it
1244  prim::DifferentiableGraph, // optimization pass adds it
1245  prim::BroadcastSizes, // optimization pass (fuser) adds it
1246  prim::ChunkSizes, // optimization pass (fuser) adds it
1247  prim::Drop, // used in interpreter only
1248  prim::FusedConcat, // optimization pass adds it
1249  prim::FusionGroup, // optimization pass adds it
1250  prim::Load, // used in interpreter only
1251  prim::MMTreeReduce, // used as an optimization
1252  prim::MMBatchSide, // used as an optimization
1253  prim::Store, // used in interpreter only
1254 
1255  };
1256 
1257  return handled.count(sym) || unneeded.count(sym);
1258 }
1259 
1260 } // namespace jit
1261 } // namespace torch