@@ -29,7 +29,7 @@ bool containNonTensorOutputs(torch::jit::Node* n) {
 }
 
 // Check if the inputs and outputs of the graph are Tensor. If not, then fallback connected nodes
-void SetInputsOutputsConnectedNodes(PartitioningCtx* ctx, torch::jit::Block* block) {
+void setInputsOutputsConnectedNodes(PartitioningCtx* ctx, torch::jit::Block* block) {
   // fallback nodes that produce entire graph's nonTensor output
   for (auto i : block->outputs()) {
     if (!isTensor(i)) {
@@ -50,7 +50,7 @@ void SetInputsOutputsConnectedNodes(PartitioningCtx* ctx, torch::jit::Block* blo
 // Find and set all explicit fallback nodes (nodes that are unsupported or forced fallback)
 // we use a map to indicate the reason why it's fallback to torch
 // For any node that's not explicitly fallback, we set it to run in TensorRT for now
-void SetExplicitFallbackNodes(PartitioningCtx* ctx, torch::jit::Block* block) {
+void setExplicitFallbackNodes(PartitioningCtx* ctx, torch::jit::Block* block) {
   auto nodes = block->nodes();
   const auto to_compile_sym = c10::Symbol::attr("to_compile");
 
@@ -78,7 +78,7 @@ void SetExplicitFallbackNodes(PartitioningCtx* ctx, torch::jit::Block* block) {
 
 // For a given set of fallback nodes, check their inputs/outputs, if any inputs/outputs of them are NonTensor,
 // then the nodes that produces/consumes those values should also fallback
-void SetNonTensorConnectedNodes(PartitioningCtx* ctx, std::vector<torch::jit::Node*>& initial_fallback_nodes) {
+void setNonTensorConnectedNodes(PartitioningCtx* ctx, std::vector<torch::jit::Node*>& initial_fallback_nodes) {
   // initial_fallback_nodes are the fallback nodes that we have before we run BFS in this function
   std::queue<torch::jit::Node*> q;
   for (auto& node : initial_fallback_nodes) {
@@ -112,7 +112,7 @@ void SetNonTensorConnectedNodes(PartitioningCtx* ctx, std::vector<torch::jit::No
 }
 
 // Sub-function that traverses the entire block and check if TensorRT node sequence satisfy min_block_size
-std::vector<torch::jit::Node*> TraverseNodesForMinBlockSize(PartitioningCtx* ctx, torch::jit::Block* block) {
+std::vector<torch::jit::Node*> traverseNodesForMinBlockSize(PartitioningCtx* ctx, torch::jit::Block* block) {
   auto nodes = block->nodes();
   std::vector<torch::jit::Node*> cur_trt_nodes;
   std::vector<torch::jit::Node*> min_block_fallback_nodes;
@@ -138,19 +138,19 @@ std::vector<torch::jit::Node*> TraverseNodesForMinBlockSize(PartitioningCtx* ctx
 }
 
 // Set the nodes that fallback because of min_block_size
-void SetMinBlockFallbackNodes(PartitioningCtx* ctx, torch::jit::Block* block) {
+void setMinBlockFallbackNodes(PartitioningCtx* ctx, torch::jit::Block* block) {
   // first traverse all the nodes to find the initial nodes that don't meet the min_block_size requirement
-  auto min_block_fallback_nodes = TraverseNodesForMinBlockSize(ctx, block);
+  auto min_block_fallback_nodes = traverseNodesForMinBlockSize(ctx, block);
 
   // keep fallback until all segments meet the min_block_size requirement
   while (!min_block_fallback_nodes.empty()) {
     for (const auto i : min_block_fallback_nodes) {
       ctx->setNodeExecutorDecision(i, NodeExecutorDecision::kMIN_BLOCK_FALLBACK);
     }
     // find the fallback nodes because of dependency with min_block_size caused fallback nodes
-    SetNonTensorConnectedNodes(ctx, min_block_fallback_nodes);
+    setNonTensorConnectedNodes(ctx, min_block_fallback_nodes);
     // keep traverse the graph until there is no node fallback because of min_block_size
-    min_block_fallback_nodes = TraverseNodesForMinBlockSize(ctx, block);
+    min_block_fallback_nodes = traverseNodesForMinBlockSize(ctx, block);
   }
 }
 
@@ -173,7 +173,7 @@ bool isModifyingNodes(torch::jit::Node* node, torch::jit::Value* val) {
   return false;
 }
 
-std::vector<torch::jit::Node*> FindModifyingNodes(
+std::vector<torch::jit::Node*> findModifyingNodes(
     torch::jit::Value* val,
     const std::unordered_set<torch::jit::Node*>& seg_block_nodes) {
   std::vector<torch::jit::Node*> modifying_nodes;
@@ -190,7 +190,7 @@ std::vector<torch::jit::Node*> FindModifyingNodes(
 }
 
 // this function is only used when a TRT segment produces nonTensor values which are used by later TRT segment
-std::vector<torch::jit::Node*> GetDependencyNodes(
+std::vector<torch::jit::Node*> getDependencyNodes(
     const std::vector<torch::jit::Value*>& vals,
     const SegmentedBlock& seg_block) {
   // get all nodes in the segmentedblock
@@ -206,7 +206,7 @@ std::vector<torch::jit::Node*> GetDependencyNodes(
     auto node = cur_val->node();
     if (node->kind() != torch::jit::prim::Constant && !visited.count(node)) {
       visited.insert(node);
-      auto modifying_nodes = FindModifyingNodes(cur_val, seg_block_nodes);
+      auto modifying_nodes = findModifyingNodes(cur_val, seg_block_nodes);
       stk.insert(stk.end(), modifying_nodes.rbegin(), modifying_nodes.rend());
       stk.push_back(node);
       for (auto input : node->inputs()) {
@@ -220,7 +220,7 @@ std::vector<torch::jit::Node*> GetDependencyNodes(
   return stk;
 }
 
-void ResolveTRTNonTensorInputs(PartitioningCtx* ctx, torch::jit::Block* block) {
+void resolveTRTNonTensorInputs(PartitioningCtx* ctx, torch::jit::Block* block) {
   // if a TRT segment has nonTensor Inputs, the nodes that produce this nonTensor Inputs must in another TensorRT engine
   // because we have already found the interface between Torch and TRT in segmentation phase
   // what we do here is just find the dependency nodes of the TRT segments that have nonTensor inputs
@@ -235,7 +235,7 @@ void ResolveTRTNonTensorInputs(PartitioningCtx* ctx, torch::jit::Block* block) {
     }
     if (!inputs_to_resolve.empty()) {
      std::vector<torch::jit::Node*> dependency_nodes =
-          GetDependencyNodes(inputs_to_resolve, cur_partitioned_block[i]);
+          getDependencyNodes(inputs_to_resolve, cur_partitioned_block[i]);
      dependency_nodes.insert(
          dependency_nodes.end(),
          cur_partitioned_block[i].raw_nodes().begin(),
@@ -246,7 +246,7 @@ void ResolveTRTNonTensorInputs(PartitioningCtx* ctx, torch::jit::Block* block) {
   }
 }
 
-void RegisterSegmentsOutputs(PartitioningCtx* ctx, torch::jit::Block* block) {
+void registerSegmentsOutputs(PartitioningCtx* ctx, torch::jit::Block* block) {
   // find the corresponding raw values in original global graph for this segmented block's inputs/outputs
   PartitionedGraph& cur_partitioned_block = ctx->partitioned_blocks[block];
   auto cmp = [](torch::jit::Value* a, torch::jit::Value* b) { return a->unique() < b->unique(); };
@@ -332,32 +332,32 @@ void finalizeNewBlock(
   LOG_DEBUG(g.back());
 }
 
-void SetNodeExecutorLUT(PartitioningCtx* ctx, torch::jit::Block* block) {
+void setNodeExecutorLUT(PartitioningCtx* ctx, torch::jit::Block* block) {
   // First, find all the explicit fallback nodes that should run in Torch:
   // 1. nodes that are unsupported
   // 2. nodes that the user specifies to run in torch
   // 3. nodes that the user specifies the module containing this op to run in torch
   // At the same time, set all the rest nodes to NodeExecutorDecision::kCONVERT
-  SetExplicitFallbackNodes(ctx, block);
+  setExplicitFallbackNodes(ctx, block);
 
   // Second, check if there is nonTensor input/output for the block, if there is, then fallback the nodes that
   // consume/produce this nonTensor value
-  SetInputsOutputsConnectedNodes(ctx, block);
+  setInputsOutputsConnectedNodes(ctx, block);
 
   // Third, for fallback nodes, if it consumes any NonTensor inputs, then the nodes that produce this
   // input should also fallback. Similarly, if it produces any NonTensor outputs, then the nodes
   // that consume this output should also fallback
   auto cur_fallback_nodes = ctx->getNodesRunInTorch();
-  SetNonTensorConnectedNodes(ctx, cur_fallback_nodes);
+  setNonTensorConnectedNodes(ctx, cur_fallback_nodes);
 
   // Finally, check if all current tensorrt blocks satisfy the min_block_size requirement.
   // We need to traverse the whole graph many times here
-  SetMinBlockFallbackNodes(ctx, block);
+  setMinBlockFallbackNodes(ctx, block);
 }
 
-void SegmentGraph(PartitioningCtx* ctx, torch::jit::Block* block) {
+void segmentGraph(PartitioningCtx* ctx, torch::jit::Block* block) {
   // Find all the fallback nodes and build execution decision LUT for all nodes
-  SetNodeExecutorLUT(ctx, block);
+  setNodeExecutorLUT(ctx, block);
 
   auto nodes = block->nodes();
 
@@ -436,24 +436,24 @@ void SegmentGraph(PartitioningCtx* ctx, torch::jit::Block* block) {
   return;
 }
 
-void Partition(PartitioningCtx* ctx, ExampleIValues& example_tensor_map) {
+void partition(PartitioningCtx* ctx, ExampleIValues& example_tensor_map) {
   LOG_DEBUG(ctx->settings);
 
   // Go through all the blocks to do the partitioning
   for (torch::jit::Block* block : ctx->original_blocks) {
     // segment lowering global graph into blocks
-    SegmentGraph(ctx, block);
+    segmentGraph(ctx, block);
 
     // It's possible that some TensorRT blocks have nonTensor inputs/output because they are interleaved by Torch blocks
     // resolve nonTensor inputs/outputs
-    ResolveTRTNonTensorInputs(ctx, block);
+    resolveTRTNonTensorInputs(ctx, block);
 
     // register input/output torch::jit::Value for segmented graphs
     LOG_DEBUG("Registering input/output torch::jit::Value for segmented graphs");
-    RegisterSegmentsOutputs(ctx, block);
+    registerSegmentsOutputs(ctx, block);
 
     // run shape analysis on each segmented block
-    RunShapeAnalysis(ctx, block, example_tensor_map);
+    runShapeAnalysis(ctx, block, example_tensor_map);
   }
 }
 
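For orientation, a minimal sketch of how the renamed entry point might be invoked, using only names that appear in this diff; the wrapper runPartitioning and the way ctx and example_tensor_map are constructed are assumptions for illustration, not part of this change:

// Hypothetical call site (sketch). Construction of ctx and example_tensor_map
// is elided; it lives elsewhere in the partitioning module.
void runPartitioning(PartitioningCtx* ctx, ExampleIValues& example_tensor_map) {
  // partition() segments every block in ctx->original_blocks, resolves
  // nonTensor inputs/outputs, registers segment outputs, and runs shape
  // analysis; the segmented graphs end up in ctx->partitioned_blocks.
  partition(ctx, example_tensor_map);
}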