TBBSession.cc

1 /* Copyright 2015 The TensorFlow Authors. All Rights Reserved.
2 
3 Licensed under the Apache License, Version 2.0 (the "License");
4 you may not use this file except in compliance with the License.
5 You may obtain a copy of the License at
6 
7  http://www.apache.org/licenses/LICENSE-2.0
8 
9 Unless required by applicable law or agreed to in writing, software
10 distributed under the License is distributed on an "AS IS" BASIS,
11 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 See the License for the specific language governing permissions and
13 limitations under the License.
14 ==============================================================================*/
15 //NOTE: The memory layout of the Node class changes depending on whether NDEBUG was
16 // set when TensorFlow was compiled. The reason is that the Node class holds two
17 // EdgeSet instances, and EdgeSet gains an extra data member depending on NDEBUG.
18 
19 /*
20 This file is an adaptation of the original direct_session.cc file located at
21 https://github.com/tensorflow/tensorflow/blob/v1.3.0/tensorflow/core/common_runtime/direct_session.cc
22 to meet the demands of the software environment developed and used by the CMS collaboration.
23 
24 Changes with respect to the original code are documented in the TBBSession.h header file.
25 */
26 
27 #if !defined(NDEBUG)
28 #define NDEBUG 1
29 #endif
30 
31 #include "TBBSession.h"
32 
33 #include <atomic>
34 #include <string>
35 #include <vector>
36 
37 
38 #include "FWCore/Utilities/interface/thread_safety_macros.h"
39 
40 #include "tbb/task_group.h"
41 
42 #include "tensorflow/core/common_runtime/constant_folding.h"
43 #include "tensorflow/core/common_runtime/debugger_state_interface.h"
44 #include "tensorflow/core/common_runtime/device_factory.h"
45 #include "tensorflow/core/common_runtime/executor.h"
46 #include "tensorflow/core/common_runtime/function.h"
47 #include "tensorflow/core/common_runtime/graph_optimizer.h"
48 #include "tensorflow/core/common_runtime/memory_types.h"
49 #include "tensorflow/core/common_runtime/optimization_registry.h"
50 #include "tensorflow/core/common_runtime/simple_placer.h"
51 #include "tensorflow/core/common_runtime/step_stats_collector.h"
52 #include "tensorflow/core/framework/function.h"
53 #include "tensorflow/core/framework/graph.pb_text.h"
54 #include "tensorflow/core/framework/graph.pb.h"
55 #include "tensorflow/core/framework/graph_def_util.h"
56 #include "tensorflow/core/framework/log_memory.h"
57 #include "tensorflow/core/framework/node_def.pb.h"
58 #include "tensorflow/core/framework/tensor.h"
59 #include "tensorflow/core/framework/versions.pb.h"
60 #include "tensorflow/core/graph/algorithm.h"
61 #include "tensorflow/core/graph/graph.h"
62 #include "tensorflow/core/graph/graph_constructor.h"
63 #include "tensorflow/core/graph/graph_partition.h"
64 #include "tensorflow/core/graph/subgraph.h"
65 #include "tensorflow/core/graph/tensor_id.h"
66 #include "tensorflow/core/lib/core/errors.h"
67 #include "tensorflow/core/lib/core/notification.h"
68 #include "tensorflow/core/lib/core/refcount.h"
69 #include "tensorflow/core/lib/core/status.h"
70 #include "tensorflow/core/lib/gtl/array_slice.h"
71 #include "tensorflow/core/lib/gtl/stl_util.h"
72 #include "tensorflow/core/lib/monitoring/counter.h"
73 #include "tensorflow/core/lib/strings/numbers.h"
74 #include "tensorflow/core/lib/strings/str_util.h"
75 #include "tensorflow/core/lib/strings/strcat.h"
76 #include "tensorflow/core/platform/cpu_info.h"
77 #include "tensorflow/core/platform/logging.h"
78 #include "tensorflow/core/platform/mutex.h"
79 #include "tensorflow/core/platform/types.h"
80 #include "tensorflow/core/util/device_name_utils.h"
81 #include "tensorflow/core/util/env_var.h"
82 
83 #if GOOGLE_CUDA
84 #include "tensorflow/core/common_runtime/gpu/gpu_tracer.h"
85 #endif // GOOGLE_CUDA
86 
87 namespace tensorflow {
88 
89 namespace {
90 
91 CMS_THREAD_SAFE auto* tbb_session_runs = monitoring::Counter<0>::New(
92  "/tensorflow/core/tbb_session_runs",
93  "The number of times TBBSession::Run() has been called.");
94 
95 
96 // TODO(vrv): Figure out how to unify the many different functions
97 // that generate RendezvousKey, since many of them have to be
98 // consistent with each other.
99 string GetRendezvousKey(const string& tensor_name,
100  const DeviceAttributes& device_info,
101  const FrameAndIter& frame_iter) {
102  return strings::StrCat(device_info.name(), ";",
103  strings::FpToString(device_info.incarnation()), ";",
104  device_info.name(), ";", tensor_name, ";",
105  frame_iter.frame_id, ":", frame_iter.iter_id);
106 }
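// Illustration (not part of the original file): for a feed named "x:0" on the
// client CPU device, the key built above would look roughly like
//   /job:localhost/replica:0/task:0/cpu:0;<incarnation>;/job:localhost/replica:0/task:0/cpu:0;x:0;0:0
// i.e. source device, device incarnation, destination device, tensor name and
// frame:iteration, the layout expected by the local Rendezvous.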
107 
108 } // namespace
109 
110 class TBBSessionFactory : public SessionFactory {
111  public:
112  TBBSessionFactory() {}
113 
114  bool AcceptsOptions(const SessionOptions& options) override {
115  return options.target == "tbb";
116  }
117 
118  Session* NewSession(const SessionOptions& options) override {
119  // Must do this before the CPU allocator is created.
120  if (options.config.graph_options().build_cost_model() > 0) {
121  EnableCPUAllocatorFullStats(true);
122  }
123  std::vector<Device*> devices;
124  Status s = DeviceFactory::AddDevices(
125  options, "/job:localhost/replica:0/task:0", &devices);
126  if (!s.ok()) {
127  LOG(ERROR) << s;
128  return nullptr;
129  }
130 
131  TBBSession* session =
132  new TBBSession(options, new DeviceMgr(devices), this);
133  {
134  mutex_lock l(sessions_lock_);
135  sessions_.push_back(session);
136  }
137  return session;
138  }
139 
140  Status Reset(const SessionOptions& options,
141  const std::vector<string>& containers) override {
142  std::vector<TBBSession*> sessions_to_reset;
143  {
144  mutex_lock l(sessions_lock_);
145  // We create a copy to ensure that we don't have a deadlock when
146  // session->Close calls the TBBSessionFactory.Deregister, which
147  // acquires sessions_lock_.
148  std::swap(sessions_to_reset, sessions_);
149  }
150  Status s;
151  for (auto session : sessions_to_reset) {
152  s.Update(session->Reset(containers));
153  }
154  // TODO(suharshs): Change the Reset behavior of all SessionFactories so that
155  // it doesn't close the sessions?
156  for (auto session : sessions_to_reset) {
157  s.Update(session->Close());
158  }
159  return s;
160  }
161 
162  void Deregister(const TBBSession* session) {
163  mutex_lock l(sessions_lock_);
164  sessions_.erase(std::remove(sessions_.begin(), sessions_.end(), session),
165  sessions_.end());
166  }
167 
168  private:
169  mutex sessions_lock_;
170  std::vector<TBBSession*> sessions_ GUARDED_BY(sessions_lock_);
171 };
172 
173 class TBBSessionRegistrar {
174  public:
175  TBBSessionRegistrar() {
176  SessionFactory::Register("TBB_SESSION", new TBBSessionFactory());
177  }
178 };
179 static TBBSessionRegistrar registrar;
180 
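// Usage sketch (illustrative, not part of the original file): because the
// registrar above registers the factory under the "tbb" target, client code
// obtains this session type through the normal TensorFlow C++ API, e.g.
//
//   tensorflow::SessionOptions opts;
//   opts.target = "tbb";  // matched by TBBSessionFactory::AcceptsOptions()
//   tensorflow::Session* session = tensorflow::NewSession(opts);
//
// Any other target string falls through to a different registered factory.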
181 std::atomic_int_fast64_t TBBSession::step_id_counter_(1);
182 
183 // NOTE: On Android with a single device, there is never
184 // a risk of an OpKernel blocking indefinitely:
185 //
186 // 1) No operations do I/O that depends on other simultaneous kernels,
187 //
188 // 2) Recv nodes always complete immediately: The inputs are sent into
189 // the local rendezvous before we start the executor, so the
190 // corresponding recvs will not block.
191 //
192 // Based on these assumptions, we can use the same thread pool for
193 // both "non-blocking" and "blocking" OpKernels on Android.
194 //
195 // This may change down the road when we add support for multiple
196 // devices that run concurrently, in which case we will need to
197 // revisit this decision.
198 void TBBSession::SchedClosure(tbb::task_arena& arena, tbb::task_group& g, std::function<void()> c) {
199  arena.execute( [&g,&c] () {g.run( c ); } );
200 }
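// Standalone sketch of the arena/group pattern used by SchedClosure and by
// Run() below (illustrative only):
//
//   tbb::task_arena arena;
//   tbb::task_group group;
//   arena.execute([&] { group.run([] { /* executor closure */ }); });  // SchedClosure
//   // ... later, before the group goes out of scope:
//   arena.execute([&] { group.wait(); });
//
// Executing both run() and wait() inside the same arena keeps this work, and
// the thread that joins it, isolated from unrelated TBB tasks.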
201 
202 TBBSession::TBBSession(const SessionOptions& options,
203  const DeviceMgr* device_mgr,
204  TBBSessionFactory* const factory)
205  : options_(options),
206  device_mgr_(device_mgr),
207  factory_(factory),
208  cancellation_manager_(new CancellationManager()),
209  operation_timeout_in_ms_(options_.config.operation_timeout_in_ms()) {
210  // The default value of sync_on_finish will be flipped soon and this
211  // environment variable will be removed as well.
212  Status status =
213  ReadBoolFromEnvVar("TF_SYNC_ON_FINISH", true, &sync_on_finish_);
214  if (!status.ok()) {
215  LOG(ERROR) << status.error_message();
216  }
217  // NOTE(mrry): We do not need to use a unique string for the session
218  // handle, because TBBSession owns its devices. This may change
219  // in future versions.
220  session_handle_ = "tbb";
221  int devices_added = 0;
222  if (options.config.log_device_placement()) {
223  const string mapping_str = device_mgr_->DeviceMappingString();
224  if (mapping_str.empty()) {
225  printf("Device mapping: no known devices.\n");
226  } else {
227  printf("Device mapping:\n%s", mapping_str.c_str());
228  }
229  LOG(INFO) << "Device mapping:\n" << mapping_str;
230  }
231  for (auto d : device_mgr_->ListDevices()) {
232  devices_.push_back(d);
233  device_set_.AddDevice(d);
234  d->op_segment()->AddHold(session_handle_);
235 
236  // The first device added is special: it is the 'client device' (a
237  // CPU device) from which we feed and fetch Tensors.
238  if (devices_added == 0) {
239  device_set_.set_client_device(d);
240  }
241  ++devices_added;
242  }
243 }
244 
245 TBBSession::~TBBSession() {
246  if (!closed_) Close().IgnoreError();
247  for (auto& it : partial_runs_) {
248  it.second.reset(nullptr);
249  }
250  for (auto& it : executors_) {
251  it.second.reset();
252  }
253  for (auto d : device_mgr_->ListDevices()) {
254  d->op_segment()->RemoveHold(session_handle_);
255  }
256  delete cancellation_manager_;
257 
258  execution_state_.reset(nullptr);
259  flib_def_.reset(nullptr);
260 }
261 
262 Status TBBSession::MaybeInitializeExecutionState(
263  const GraphDef& graph, bool* out_already_initialized) {
264  // If already initialized, do nothing.
265  if (flib_def_ && execution_state_) {
266  *out_already_initialized = true;
267  return Status::OK();
268  }
269  // Set up the per-session execution state.
270  // NOTE(mrry): The function library created here will be used for
271  // all subsequent extensions of the graph.
272  flib_def_.reset(
273  new FunctionLibraryDefinition(OpRegistry::Global(), graph.library()));
274  SimpleGraphExecutionStateOptions options;
275  options.device_set = &device_set_;
276  options.session_options = &options_;
277  // TODO(mrry,suharshs): We explicitly copy `graph` so that
278  // `MakeForBaseGraph()` can take ownership of its
279  // contents. Previously this happened implicitly in calls to the
280  // `SimpleGraphExecutionState`. Other sessions call
281  // `MakeForBaseGraph` in such a way that we can destructively read
282  // the passed-in `GraphDef`. In principle we could do the same here,
283  // with a wider refactoring; we might revise the direct session so
284  // that it copies the graph fewer times.
285  GraphDef temp(graph);
286  TF_RETURN_IF_ERROR(SimpleGraphExecutionState::MakeForBaseGraph(
287  &temp, options, &execution_state_));
288  graph_created_ = true;
289  *out_already_initialized = false;
290  return Status::OK();
291 }
292 
293 Status TBBSession::Create(const GraphDef& graph) {
294  TF_RETURN_IF_ERROR(init_error_);
295  if (graph.node_size() > 0) {
296  mutex_lock l(graph_def_lock_);
297  if (graph_created_) {
298  return errors::AlreadyExists(
299  "A Graph has already been created for this session.");
300  }
301  return ExtendLocked(graph);
302  }
303  return Status::OK();
304 }
305 
306 Status TBBSession::Extend(const GraphDef& graph) {
307  TF_RETURN_IF_ERROR(CheckNotClosed());
308  mutex_lock l(graph_def_lock_);
309  return ExtendLocked(graph);
310 }
311 
312 Status TBBSession::ExtendLocked(const GraphDef& graph) {
313  bool already_initialized;
314  // If this is the first call, we can initialize the execution state
315  // with `graph` and do not need to call `Extend()`.
316  TF_RETURN_IF_ERROR(
317  MaybeInitializeExecutionState(graph, &already_initialized));
318  if (already_initialized) {
319  TF_RETURN_IF_ERROR(flib_def_->AddLibrary(graph.library()));
320  std::unique_ptr<SimpleGraphExecutionState> state;
321  TF_RETURN_IF_ERROR(execution_state_->Extend(graph, &state));
322  execution_state_.swap(state);
323  }
324  return Status::OK();
325 }
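// Illustrative call sequence (not part of the original file): Create() supplies
// the initial GraphDef and initializes the execution state; later Extend()
// calls merge additional nodes into the same session, e.g.
//
//   tensorflow::Status s = session->Create(graph_def);
//   if (s.ok()) s = session->Extend(extra_nodes_def);  // extra_nodes_def is hypothetical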
326 
327 Status TBBSession::Run(const NamedTensorList& inputs,
328  const std::vector<string>& output_names,
329  const std::vector<string>& target_nodes,
330  std::vector<Tensor>* outputs) {
331  RunMetadata run_metadata;
332  return Run(RunOptions(), inputs, output_names, target_nodes, outputs,
333  &run_metadata);
334 }
335 
336 Status TBBSession::CreateDebuggerState(
337  const DebugOptions& debug_options, int64 session_run_index,
338  int64 executor_step_index, const std::vector<string>& input_names,
339  const std::vector<string>& output_names,
340  const std::vector<string>& target_names,
341  std::unique_ptr<DebuggerStateInterface>* debugger_state) {
342  TF_RETURN_IF_ERROR(
343  DebuggerStateRegistry::CreateState(debug_options, debugger_state));
344  TF_RETURN_IF_ERROR(debugger_state->get()->PublishDebugMetadata(
345  debug_options.global_step(), session_run_index, executor_step_index,
346  input_names, output_names, target_names));
347  return Status::OK();
348 }
349 
350 Status TBBSession::DecorateAndPublishGraphForDebug(
351  const DebugOptions& debug_options, Graph* graph, Device* device) {
352  std::unique_ptr<DebugGraphDecoratorInterface> decorator;
353  TF_RETURN_IF_ERROR(
354  DebugGraphDecoratorRegistry::CreateDecorator(debug_options, &decorator));
355 
356  TF_RETURN_IF_ERROR(decorator->DecorateGraph(graph, device));
357  TF_RETURN_IF_ERROR(decorator->PublishGraph(*graph, device->name()));
358  return Status::OK();
359 }
360 
361 Status TBBSession::Run(const RunOptions& run_options,
362  const NamedTensorList& inputs,
363  const std::vector<string>& output_names,
364  const std::vector<string>& target_nodes,
365  std::vector<Tensor>* outputs,
366  RunMetadata* run_metadata) {
367  TF_RETURN_IF_ERROR(CheckNotClosed());
368  tbb_session_runs->GetCell()->IncrementBy(1);
369  {
370  mutex_lock l(graph_def_lock_);
371  if (!graph_created_) {
372  return errors::InvalidArgument(
373  "Session was not created with a graph before Run()!");
374  }
375  }
376 
377  // Extract the input names for this run of the session.
378  std::vector<string> input_tensor_names;
379  input_tensor_names.reserve(inputs.size());
380  for (const auto& it : inputs) {
381  input_tensor_names.push_back(it.first);
382  }
383 
384 
385  // Check if we already have an executor for these arguments.
386  ExecutorsAndKeys* executors_and_keys;
387  RunStateArgs run_state_args(run_options.debug_options());
388 
389  Executor::Args args;
390  args.step_id = step_id_counter_.fetch_add(1);
391 
392  TF_RETURN_IF_ERROR(
393  GetOrCreateExecutors(input_tensor_names, output_names, target_nodes,
394  &executors_and_keys, &run_state_args));
395  const int64 executor_step_count = executors_and_keys->step_count.fetch_add(1);
396 
397  std::unique_ptr<DebuggerStateInterface> debugger_state;
398  if (!run_options.debug_options().debug_tensor_watch_opts().empty()) {
399  TF_RETURN_IF_ERROR(CreateDebuggerState(
400  run_options.debug_options(), args.step_id, executor_step_count,
401  input_tensor_names, output_names, target_nodes, &debugger_state));
402  }
403 
404  // Configure a call frame for the step, which we use to feed and
405  // fetch values to and from the executors.
406  FunctionCallFrame call_frame(executors_and_keys->input_types,
407  executors_and_keys->output_types);
408  gtl::InlinedVector<Tensor, 4> feed_args(inputs.size());
409  for (const auto& it : inputs) {
410  if (it.second.dtype() == DT_RESOURCE) {
411  Tensor tensor_from_handle;
412  TF_RETURN_IF_ERROR(
413  ResourceHandleToInputTensor(it.second, &tensor_from_handle));
414  feed_args[executors_and_keys->input_name_to_index[it.first]] =
415  tensor_from_handle;
416  } else {
417  feed_args[executors_and_keys->input_name_to_index[it.first]] = it.second;
418  }
419  }
420  Status s = call_frame.SetArgs(feed_args);
421  if (errors::IsInternal(s)) {
422  return errors::InvalidArgument(s.error_message());
423  } else if (!s.ok()) {
424  return s;
425  }
426 
427  // Create a run state and start execution.
428  RunState run_state(args.step_id, &devices_);
429  run_state.rendez = new IntraProcessRendezvous(device_mgr_.get());
430  CancellationManager step_cancellation_manager;
431  args.call_frame = &call_frame;
432 
433  // Use a task_arena to avoid having unrelated tasks start
434  // running on this thread (which could lead to deadlocks)
435  tbb::task_arena taskArena;
436  tbb::task_group taskGroup;
437  // we are required to always call wait() on the task_group before it is destroyed
438  auto doneWithTaskGroup = [&taskArena, &taskGroup](void *) { taskArena.execute([&taskGroup]() { taskGroup.wait();}); };
439  std::unique_ptr<tbb::task_group, decltype(doneWithTaskGroup) > guard(&taskGroup, doneWithTaskGroup);
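// The unique_ptr above is used purely as a scope guard: if any of the early
// returns below fire, its custom deleter runs taskGroup.wait() inside the
// arena, satisfying TBB's requirement that a task_group be waited on before
// it is destroyed. On the normal path the guard is released and
// WaitForNotification() performs the wait instead.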
440 
441  // Start parallel Executors.
442  const size_t num_executors = executors_and_keys->items.size();
443  ExecutorBarrier* barrier = new ExecutorBarrier(
444  num_executors, run_state.rendez, [&run_state](const Status& ret) {
445  {
446  mutex_lock l(run_state.mu_);
447  run_state.status.Update(ret);
448  }
449  run_state.executors_done.Notify();
450  });
451 
452  args.rendezvous = run_state.rendez;
453  args.cancellation_manager = &step_cancellation_manager;
454  args.runner = [this, &taskArena, &taskGroup](Executor::Args::Closure c) {
455  SchedClosure(taskArena, taskGroup, std::move(c));
456  };
457  args.session_state = &session_state_;
458  args.tensor_store = &run_state.tensor_store;
459  args.step_container = &run_state.step_container;
460  if (LogMemory::IsEnabled()) {
461  LogMemory::RecordStep(args.step_id, run_state_args.handle);
462  }
463  args.sync_on_finish = sync_on_finish_;
464 
465  const bool do_trace = (run_options.trace_level() > RunOptions::NO_TRACE);
466 
467  bool update_cost_model = false;
468  if (options_.config.graph_options().build_cost_model() > 0) {
469  const int64 build_cost_model_every =
470  options_.config.graph_options().build_cost_model();
471  const int64 build_cost_model_after =
472  options_.config.graph_options().build_cost_model_after();
473  int64 measure_step_count = executor_step_count - build_cost_model_after;
474  if (measure_step_count >= 0) {
475  update_cost_model =
476  ((measure_step_count + 1) % build_cost_model_every == 0);
477  }
478  }
479  if (do_trace || update_cost_model) {
480  run_state.collector.reset(
481  new StepStatsCollector(run_metadata->mutable_step_stats()));
482  args.stats_collector = run_state.collector.get();
483  }
484 
485 #if GOOGLE_CUDA
486  std::unique_ptr<GPUTracer> tracer;
487  if (run_options.trace_level() >= RunOptions::HARDWARE_TRACE) {
488  tracer.reset(CreateGPUTracer());
489  // tracer will be NULL on non-GPU platforms.
490  // TODO(b/32704451): Don't just ignore the ::tensorflow::Status object!
491  if (tracer) tracer->Start().IgnoreError();
492  }
493 #endif // GOOGLE_CUDA
494 
495  // Register this step with session's cancellation manager, so that
496  // `Session::Close()` will cancel the step.
497  CancellationToken cancellation_token =
498  cancellation_manager_->get_cancellation_token();
499  bool already_cancelled = !cancellation_manager_->RegisterCallback(
500  cancellation_token, [&step_cancellation_manager]() {
501  step_cancellation_manager.StartCancel();
502  });
503  if (already_cancelled) {
504  // NOTE(mrry): If we don't explicitly notify
505  // `run_state.executors_done`, the RunState destructor would
506  // block on this notification.
507  run_state.executors_done.Notify();
508  delete barrier;
509  return errors::Cancelled("Run call was cancelled");
510  }
511 
512  for (const auto& item : executors_and_keys->items) {
513  item.executor->RunAsync(args, barrier->Get());
514  }
515 
516  //WaitForNotification will handle calling wait on taskGroup
517  guard.release();
518  WaitForNotification(taskArena, taskGroup, &run_state, &step_cancellation_manager,
519  run_options.timeout_in_ms() > 0
520  ? run_options.timeout_in_ms()
521  : operation_timeout_in_ms_);
522 
523  if (!cancellation_manager_->DeregisterCallback(cancellation_token)) {
524  // The step has been cancelled: make sure we don't attempt to receive the
525  // outputs as this would make it block forever.
526  mutex_lock l(run_state.mu_);
527  run_state.status.Update(errors::Cancelled("Run call was cancelled"));
528  }
529 
530 #if GOOGLE_CUDA
531  if (tracer) {
532  // TODO(b/32704451): Don't just ignore the ::tensorflow::Status object!
533  tracer->Stop().IgnoreError();
534  tracer->Collect(args.stats_collector).IgnoreError();
535  }
536 #endif // GOOGLE_CUDA
537 
538  {
539  mutex_lock l(run_state.mu_);
540  TF_RETURN_IF_ERROR(run_state.status);
541  }
542 
543  // Receive outputs.
544  if (outputs) {
545  std::vector<Tensor> sorted_outputs;
546  Status s = call_frame.ConsumeRetvals(&sorted_outputs);
547  if (errors::IsInternal(s)) {
548  return errors::InvalidArgument(s.error_message());
549  } else if (!s.ok()) {
550  return s;
551  }
552  const bool unique_outputs =
553  output_names.size() == executors_and_keys->output_name_to_index.size();
554  // first_indices[i] = j implies that j is the smallest value for which
555  // output_names[i] == output_names[j].
556  std::vector<int> first_indices;
557  if (!unique_outputs) {
558  first_indices.resize(output_names.size());
559  for (int i = 0; i < static_cast<int>(output_names.size()); ++i) {
560  for (int j = 0; j <= i; ++j) {
561  if (output_names[i] == output_names[j]) {
562  first_indices[i] = j;
563  break;
564  }
565  }
566  }
567  }
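// Example (illustrative): output_names = {"a:0", "b:0", "a:0"} yields
// first_indices = {0, 1, 0}, so the duplicate third output is later copied
// from outputs[0] instead of consuming sorted_outputs twice.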
568  outputs->clear();
569  outputs->reserve(sorted_outputs.size());
570  for (int i = 0; i < static_cast<int>(output_names.size()); ++i) {
571  const string& output_name = output_names[i];
572  if (first_indices.empty() || first_indices[i] == i) {
573  outputs->emplace_back(
574  std::move(sorted_outputs[executors_and_keys
575  ->output_name_to_index[output_name]]));
576  } else {
577  outputs->push_back((*outputs)[first_indices[i]]);
578  }
579  }
580  }
581 
582  // Save the output tensors of this run we choose to keep.
583  TF_RETURN_IF_ERROR(
584  run_state.tensor_store.SaveTensors(output_names, &session_state_));
585 
586  // Build and return the cost model as instructed.
587  mutex_lock l(executor_lock_);
588  if (update_cost_model) {
589  // Build the cost model
590  std::unordered_map<string, const Graph*> device_to_graph;
591  for (const PerPartitionExecutorsAndLib& partition :
592  executors_and_keys->items) {
593  const Graph* graph = partition.graph;
594  const string device = partition.flib->device()->name();
595  device_to_graph[device] = graph;
596  }
597  args.stats_collector->BuildCostModel(&cost_model_manager_, device_to_graph);
598 
599  // annotate stats onto cost graph.
600  CostGraphDef* cost_graph = run_metadata->mutable_cost_graph();
601  for (const auto& item : executors_and_keys->items) {
602  TF_RETURN_IF_ERROR(
603  cost_model_manager_.AddToCostGraphDef(item.graph, cost_graph));
604  }
605  }
606 
607  // If requested via RunOptions, output the partition graphs.
608  if (run_options.output_partition_graphs()) {
609  protobuf::RepeatedPtrField<GraphDef>* partition_graph_defs =
610  run_metadata->mutable_partition_graphs();
611  for (const PerPartitionExecutorsAndLib& exec_and_lib :
612  executors_and_keys->items) {
613  GraphDef* partition_graph_def = partition_graph_defs->Add();
614  exec_and_lib.graph->ToGraphDef(partition_graph_def);
615  }
616  }
617 
618  return Status::OK();
619 }
620 
621 
622 Status TBBSession::ResourceHandleToInputTensor(const Tensor& resource_tensor,
623  Tensor* retrieved_tensor) {
624  if (resource_tensor.dtype() != DT_RESOURCE) {
625  return errors::InvalidArgument(strings::StrCat(
626  "ResourceHandleToInputTensor() received non-DT_RESOURCE Tensor: ",
627  resource_tensor.dtype()));
628  }
629 
630  ResourceHandle resource_handle = resource_tensor.scalar<ResourceHandle>()();
631 
632  if (resource_handle.container() ==
633  SessionState::kTensorHandleResourceTypeName) {
634  return session_state_.GetTensor(resource_handle.name(), retrieved_tensor);
635  } else {
636  return errors::InvalidArgument(strings::StrCat(
637  "Invalid resource type hash code: ", resource_handle.hash_code(),
638  "(name: ", resource_handle.name(),
639  " type: ", resource_handle.maybe_type_name(), ")"));
640  }
641 }
642 
643 Status TBBSession::GetOrCreateExecutors(
644  gtl::ArraySlice<string> inputs,
645  gtl::ArraySlice<string> outputs, gtl::ArraySlice<string> target_nodes,
646  ExecutorsAndKeys** executors_and_keys, RunStateArgs* run_state_args) {
647  int64 handle_name_counter_value = -1;
648  if (LogMemory::IsEnabled() || run_state_args->is_partial_run) {
649  handle_name_counter_value = handle_name_counter_.fetch_add(1);
650  }
651 
652  string debug_tensor_watches_summary;
653  if (!run_state_args->debug_options.debug_tensor_watch_opts().empty()) {
654  debug_tensor_watches_summary = SummarizeDebugTensorWatches(
655  run_state_args->debug_options.debug_tensor_watch_opts());
656  }
657 
658  // Fast lookup path, no sorting.
659  const string key = strings::StrCat(
660  str_util::Join(inputs, ","), "->", str_util::Join(outputs, ","), "/",
661  str_util::Join(target_nodes, ","), "/", run_state_args->is_partial_run,
662  "/", debug_tensor_watches_summary);
663  // Set the handle, if it's needed to log memory or for partial run.
664  if (handle_name_counter_value >= 0) {
665  run_state_args->handle =
666  strings::StrCat(key, ";", handle_name_counter_value);
667  }
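// Example of the fast-path key built above (names are hypothetical):
// inputs {"a:0","b:0"}, outputs {"out:0"}, targets {"init"}, no partial run
// and no debug watches give
//   "a:0,b:0->out:0/init/0/"
// The sorted key computed below has the same layout with each list sorted.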
668 
669  // See if we already have the executors for this run.
670  {
671  mutex_lock l(executor_lock_); // could use reader lock
672  auto it = executors_.find(key);
673  if (it != executors_.end()) {
674  *executors_and_keys = it->second.get();
675  return Status::OK();
676  }
677  }
678 
679  // Slow lookup path, the unsorted key missed the cache.
680  // Sort the inputs and outputs, and look up with the sorted key in case an
681  // earlier call used a different order of inputs and outputs.
682  //
683  // We could consider some other signature instead of sorting that
684  // preserves the same property to avoid the sort in the future.
685  std::vector<string> inputs_sorted(inputs.begin(), inputs.end());
686  std::sort(inputs_sorted.begin(), inputs_sorted.end());
687  std::vector<string> outputs_sorted(outputs.begin(), outputs.end());
688  std::sort(outputs_sorted.begin(), outputs_sorted.end());
689  std::vector<string> tn_sorted(target_nodes.begin(), target_nodes.end());
690  std::sort(tn_sorted.begin(), tn_sorted.end());
691 
692  const string sorted_key = strings::StrCat(
693  str_util::Join(inputs_sorted, ","), "->",
694  str_util::Join(outputs_sorted, ","), "/", str_util::Join(tn_sorted, ","),
695  "/", run_state_args->is_partial_run, "/", debug_tensor_watches_summary);
696  // Set the handle, if it's needed to log memory or for partial run.
697  if (handle_name_counter_value >= 0) {
698  run_state_args->handle =
699  strings::StrCat(sorted_key, ";", handle_name_counter_value);
700  }
701 
702  // See if we already have the executors for this run.
703  {
704  mutex_lock l(executor_lock_);
705  auto it = executors_.find(sorted_key);
706  if (it != executors_.end()) {
707  *executors_and_keys = it->second.get();
708  // Insert this under the original key.
709  executors_.emplace(key, it->second);
710  return Status::OK();
711  }
712  }
713 
714  // Nothing found, so create the executors and store in the cache.
715  BuildGraphOptions options;
716  options.feed_endpoints = inputs_sorted;
717  options.fetch_endpoints = outputs_sorted;
718  options.target_nodes = tn_sorted;
719  options.use_function_convention = !run_state_args->is_partial_run;
720  if (!run_state_args->debug_options.debug_tensor_watch_opts().empty()) {
721  options.debug_options = run_state_args->debug_options;
722  }
723 
724  std::shared_ptr<ExecutorsAndKeys> ek(new ExecutorsAndKeys);
725 
726  // The executor_lock_ is intentionally released while executor is
727  // being created.
728  std::unordered_map<string, std::unique_ptr<Graph>> graphs;
729  TF_RETURN_IF_ERROR(CreateGraphs(options, &graphs, &ek->flib_def,
730  run_state_args, &ek->input_types,
731  &ek->output_types));
732 
733  if (run_state_args->is_partial_run) {
734  ek->graph = std::move(run_state_args->graph);
735  std::unordered_set<StringPiece, StringPiece::Hasher> names;
736  for (const string& input : inputs) {
737  TensorId id(ParseTensorName(input));
738  names.emplace(id.first);
739  }
740  for (const string& output : outputs) {
741  TensorId id(ParseTensorName(output));
742  names.emplace(id.first);
743  }
744  for (Node* n : ek->graph->nodes()) {
745  if (names.count(n->name()) > 0) {
746  ek->name_to_node.insert({n->name(), n});
747  }
748  }
749  }
750  ek->items.reserve(graphs.size());
751  const auto& optimizer_opts =
752  options_.config.graph_options().optimizer_options();
753  GraphOptimizer optimizer(optimizer_opts);
754  for (auto iter = graphs.begin(); iter != graphs.end(); ++iter) {
755  const string& partition_name = iter->first;
756  std::unique_ptr<Graph>& partition_graph = iter->second;
757  const int graph_def_version = partition_graph->versions().producer();
758 
759  Device* device;
760  TF_RETURN_IF_ERROR(device_mgr_->LookupDevice(partition_name, &device));
761 
762  ek->items.resize(ek->items.size() + 1);
763  auto* item = &(ek->items.back());
764  item->flib.reset(NewFunctionLibraryRuntime(
765  device_mgr_.get(), options_.env, device, graph_def_version,
766  ek->flib_def.get(), optimizer_opts));
767 
768  LocalExecutorParams params;
769  params.device = device;
770  params.function_library = item->flib.get();
771  auto lib = item->flib.get();
772  auto opseg = device->op_segment();
773  params.create_kernel = [this, lib, opseg](const NodeDef& ndef,
774  OpKernel** kernel) {
775  // Caches the kernel only if the node is stateful.
776  if (!lib->IsStateful(ndef.op())) {
777  return lib->CreateKernel(ndef, kernel);
778  }
779  auto create_fn = [lib, &ndef](OpKernel** kernel) {
780  return lib->CreateKernel(ndef, kernel);
781  };
782  // Kernels created for subgraph nodes need to be cached. On
783  // cache miss, create_fn() is invoked to create a kernel based
784  // on the function library here + global op registry.
785  return opseg->FindOrCreate(session_handle_, ndef.name(), kernel,
786  create_fn);
787  };
788  params.delete_kernel = [lib](OpKernel* kernel) {
789  // If the node is stateful, opseg owns it. Otherwise, delete it.
790  if (kernel && !lib->IsStateful(kernel->type_string())) {
791  delete kernel;
792  }
793  };
794  params.node_outputs_cb = node_outputs_callback_;
795 
796  optimizer.Optimize(lib, options_.env, device, &iter->second);
797 
798  // EXPERIMENTAL: tfdbg inserts debug nodes in the graph.
799  if (!options.debug_options.debug_tensor_watch_opts().empty()) {
800  TF_RETURN_IF_ERROR(DecorateAndPublishGraphForDebug(
801  options.debug_options, partition_graph.get(), params.device));
802  }
803 
804  TF_RETURN_IF_ERROR(EnsureMemoryTypes(DeviceType(device->device_type()),
805  device->name(),
806  partition_graph.get()));
807  // NewLocalExecutor takes ownership of partition_graph.
808  item->graph = partition_graph.get();
809  item->executor = nullptr;
810  Executor* executor;
811  TF_RETURN_IF_ERROR(
812  NewLocalExecutor(params, partition_graph.release(), &executor));
813  item->executor.reset(executor);
814  }
815 
816  // Cache the mapping from input/output names to graph elements to
817  // avoid recomputing it every time.
818  if (!run_state_args->is_partial_run) {
819  // For regular `Run()`, we use the function calling convention, and so
820  // maintain a mapping from input/output names to
821  // argument/return-value ordinal index.
822  for (size_t i = 0; i < inputs_sorted.size(); ++i) {
823  const string& input = inputs_sorted[i];
824  ek->input_name_to_index[input] = i;
825  }
826  for (size_t i = 0; i < outputs_sorted.size(); ++i) {
827  const string& output = outputs_sorted[i];
828  ek->output_name_to_index[output] = i;
829  }
830  } else {
831  // For `PRun()`, we use the rendezvous calling convention, and so
832  // maintain a mapping from input/output names to rendezvous keys.
833  //
834  // We always use the first device as the device name portion of the
835  // key, even if we're feeding another graph.
836  for (size_t i = 0; i < inputs_sorted.size(); ++i) {
837  const string& input = inputs_sorted[i];
838  ek->input_name_to_rendezvous_key[input] = GetRendezvousKey(
839  input, device_set_.client_device()->attributes(), FrameAndIter(0, 0));
840  }
841  for (size_t i = 0; i < outputs_sorted.size(); ++i) {
842  const string& output = outputs_sorted[i];
843  ek->output_name_to_rendezvous_key[output] =
844  GetRendezvousKey(output, device_set_.client_device()->attributes(),
845  FrameAndIter(0, 0));
846  }
847  }
848 
849  // Reacquire the lock, try to insert into the map.
850  mutex_lock l(executor_lock_);
851 
852  // Another thread may have created the entry before us, in which case we will
853  // reuse the already created one.
854  auto insert_result = executors_.emplace(sorted_key, ek);
855  // Insert the value under the original key, so the fast path lookup will work
856  // if the user uses the same order of inputs, outputs, and targets again.
857  executors_.emplace(key, insert_result.first->second);
858  *executors_and_keys = insert_result.first->second.get();
859 
860  return Status::OK();
861 }
862 
863 Status TBBSession::CreateGraphs(
864  const BuildGraphOptions& subgraph_options,
865  std::unordered_map<string, std::unique_ptr<Graph>>* outputs,
866  std::unique_ptr<FunctionLibraryDefinition>* flib_def,
867  RunStateArgs* run_state_args, DataTypeVector* input_types,
868  DataTypeVector* output_types) {
869  mutex_lock l(graph_def_lock_);
870  std::unique_ptr<SimpleClientGraph> client_graph;
871 
872  std::unique_ptr<SimpleGraphExecutionState> temp_exec_state_holder;
873  SimpleGraphExecutionState* execution_state = nullptr;
874  if (options_.config.graph_options().place_pruned_graph()) {
875  // Because we are placing pruned graphs, we need to create a
876  // new SimpleGraphExecutionState for every new unseen graph,
877  // and then place it.
878  SimpleGraphExecutionStateOptions prune_options;
879  prune_options.device_set = &device_set_;
880  prune_options.session_options = &options_;
881  prune_options.stateful_placements = stateful_placements_;
882  TF_RETURN_IF_ERROR(SimpleGraphExecutionState::MakeForPrunedGraph(
883  execution_state_->original_graph_def().library(), prune_options,
884  execution_state_->original_graph_def(), subgraph_options,
885  &temp_exec_state_holder, &client_graph));
886  execution_state = temp_exec_state_holder.get();
887  } else {
888  execution_state = execution_state_.get();
889  TF_RETURN_IF_ERROR(
890  execution_state->BuildGraph(subgraph_options, &client_graph));
891  }
892 
893  if (subgraph_options.feed_endpoints.size() !=
894  client_graph->feed_types.size()) {
895  return errors::Internal(
896  "Graph pruning failed: requested number of feed endpoints = ",
897  subgraph_options.feed_endpoints.size(),
898  " versus number of pruned feed endpoints = ",
899  client_graph->feed_types.size());
900  }
901  if (subgraph_options.fetch_endpoints.size() !=
902  client_graph->fetch_types.size()) {
903  return errors::Internal(
904  "Graph pruning failed: requested number of fetch endpoints = ",
905  subgraph_options.fetch_endpoints.size(),
906  " versus number of pruned fetch endpoints = ",
907  client_graph->fetch_types.size());
908  }
909 
910  auto current_stateful_placements = execution_state->GetStatefulPlacements();
911  // Update our current state based on the execution_state's
912  // placements. If there are any mismatches for a node,
913  // we should fail, as this should never happen.
914  for (auto placement_pair : current_stateful_placements) {
915  const string& node_name = placement_pair.first;
916  const string& placement = placement_pair.second;
917  auto iter = stateful_placements_.find(node_name);
918  if (iter == stateful_placements_.end()) {
919  stateful_placements_.insert(std::make_pair(node_name, placement));
920  } else if (iter->second != placement) {
921  return errors::Internal(
922  "Stateful placement mismatch. "
923  "Current assignment of ",
924  node_name, " to ", iter->second, " does not match ", placement);
925  }
926  }
927 
928  stateful_placements_ = execution_state->GetStatefulPlacements();
929 
930  // Remember the graph in run state if this is a partial run.
931  if (run_state_args->is_partial_run) {
932  run_state_args->graph.reset(new Graph(flib_def_.get()));
933  CopyGraph(*execution_state->full_graph(), run_state_args->graph.get());
934  }
935 
936  // Partition the graph across devices.
937  PartitionOptions popts;
938  popts.node_to_loc = [](const Node* node) {
939  assert(node != nullptr);
940  return node->assigned_device_name();
941  };
942  popts.new_name = [this](const string& prefix) {
943  return strings::StrCat(prefix, "/_", edge_name_counter_.fetch_add(1));
944  };
945  popts.get_incarnation = [](const string& name) {
946  // The direct session does not have changing incarnation numbers.
947  // Just return '1'.
948  return 1;
949  };
950  popts.control_flow_added = false;
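// For illustration: node_to_loc() groups nodes by their assigned device, so
// Partition() below emits one GraphDef per device, and new_name("foo") would
// return something like "foo/_7", using the monotonically increasing
// edge_name_counter_.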
951 
952  std::unordered_map<string, GraphDef> partitions;
953  TF_RETURN_IF_ERROR(Partition(popts, &client_graph->graph, &partitions));
954 
955  std::vector<string> device_names;
956  for (auto device : devices_) {
957  // Extract the LocalName from the device.
958  device_names.push_back(DeviceNameUtils::LocalName(device->name()));
959  }
960 
961  // Check for valid partitions.
962  for (const auto& partition : partitions) {
963  const string local_partition_name =
964  DeviceNameUtils::LocalName(partition.first);
965  if (std::count(device_names.begin(), device_names.end(),
966  local_partition_name) == 0) {
967  return errors::InvalidArgument(
968  "Creating a partition for ", local_partition_name,
969  " which doesn't exist in the list of available devices. Available "
970  "devices: ",
971  str_util::Join(device_names, ","));
972  }
973  }
974 
975  for (const auto& partition : partitions) {
976  std::unique_ptr<Graph> device_graph(
977  new Graph(client_graph->flib_def.get()));
978  GraphConstructorOptions device_opts;
979  // There are internal operations (e.g., send/recv) that we now allow.
980  device_opts.allow_internal_ops = true;
981  device_opts.expect_device_spec = true;
982  TF_RETURN_IF_ERROR(ConvertGraphDefToGraph(device_opts, partition.second,
983  device_graph.get()));
984  outputs->emplace(partition.first, std::move(device_graph));
985  }
986 
987  GraphOptimizationPassOptions optimization_options;
988  optimization_options.session_options = &options_;
989  optimization_options.flib_def = client_graph->flib_def.get();
990  optimization_options.partition_graphs = outputs;
991  TF_RETURN_IF_ERROR(OptimizationPassRegistry::Global()->RunGrouping(
992  OptimizationPassRegistry::POST_PARTITIONING, optimization_options));
993 
994  Status s;
995  for (auto& partition : *outputs) {
996  const string& partition_name = partition.first;
997  std::unique_ptr<Graph>* graph = &partition.second;
998 
999  VLOG(2) << "Created " << DebugString(graph->get()) << " for "
1000  << partition_name;
1001 
1002  // Give the device an opportunity to rewrite its subgraph.
1003  Device* d;
1004  s = device_mgr_->LookupDevice(partition_name, &d);
1005  if (!s.ok()) break;
1006  // TODO(pbar) The library is currently shared and immutable. There
1007  // may be possible use cases where a device may want to modify
1008  // function definitions - in which case the library would need to be
1009  // replicated per device.
1010  s = d->MaybeRewriteGraph(client_graph->flib_def->ToProto(), graph);
1011  if (!s.ok()) {
1012  break;
1013  }
1014  }
1015  *flib_def = std::move(client_graph->flib_def);
1016  std::swap(*input_types, client_graph->feed_types);
1017  std::swap(*output_types, client_graph->fetch_types);
1018  return s;
1019 }
1020 
1021 ::tensorflow::Status TBBSession::ListDevices(
1022  std::vector<DeviceAttributes>* response) {
1023  response->clear();
1024  response->reserve(devices_.size());
1025  for (Device* d : devices_) {
1026  const DeviceAttributes& attrs = d->attributes();
1027  response->emplace_back(attrs);
1028  }
1029  return ::tensorflow::Status::OK();
1030 }
1031 
1032 ::tensorflow::Status TBBSession::Reset(
1033  const std::vector<string>& containers) {
1034  device_mgr_->ClearContainers(containers);
1035  return ::tensorflow::Status::OK();
1036 }
1037 
1038 ::tensorflow::Status TBBSession::Close() {
1039  cancellation_manager_->StartCancel();
1040  {
1041  mutex_lock l(closed_lock_);
1042  if (closed_) return ::tensorflow::Status::OK();
1043  closed_ = true;
1044  }
1045  if (factory_ != nullptr) factory_->Deregister(this);
1046  return ::tensorflow::Status::OK();
1047 }
1048 
1049 TBBSession::RunState::RunState(
1050  const std::vector<string>& pending_input_names,
1051  const std::vector<string>& pending_output_names, int64 step_id,
1052  const std::vector<Device*>* devices)
1053  : step_container(step_id, [devices](const string& name) {
1054  for (auto d : *devices) {
1055  if (!d->resource_manager()->Cleanup(name).ok()) {
1056  // Do nothing...
1057  }
1058  }
1059  }) {
1060  // Initially all the feeds and fetches are pending.
1061  for (auto& name : pending_input_names) {
1062  pending_inputs[name] = false;
1063  }
1064  for (auto& name : pending_output_names) {
1065  pending_outputs[name] = false;
1066  }
1067 }
1068 
1069 TBBSession::RunState::RunState(int64 step_id,
1070  const std::vector<Device*>* devices)
1071  : RunState({}, {}, step_id, devices) {}
1072 
1073 TBBSession::RunState::~RunState() {
1074  if (rendez != nullptr) {
1075  if (!executors_done.HasBeenNotified()) {
1076  rendez->StartAbort(errors::Cancelled("PRun cancellation"));
1077  executors_done.WaitForNotification();
1078  }
1079  rendez->Unref();
1080  }
1081 }
1082 
1083 bool TBBSession::RunState::PendingDone() const {
1084  for (const auto& it : pending_inputs) {
1085  if (!it.second) return false;
1086  }
1087  for (const auto& it : pending_outputs) {
1088  if (!it.second) return false;
1089  }
1090  return true;
1091 }
1092 
1093 void TBBSession::WaitForNotification(tbb::task_arena& arena,
1094  tbb::task_group& taskGroup,
1095  RunState* run_state,
1096  CancellationManager* cm,
1097  int64 timeout_in_ms) {
1098  // Doing the wait in the arena adds this thread to the arena
1099  // and therefore tasks associated to the group can run on this thread
1100  arena.execute([&taskGroup]() { taskGroup.wait();} );
1101 
1102  Status status =
1103  WaitForNotification(&run_state->executors_done, timeout_in_ms);
1104  if (!status.ok()) {
1105  {
1106  mutex_lock l(run_state->mu_);
1107  run_state->status.Update(status);
1108  }
1109  cm->StartCancel();
1110  // We must wait for the executors to complete, because they have borrowed
1111  // references to `cm` and other per-step state. After this notification, it
1112  // is safe to clean up the step.
1113  run_state->executors_done.WaitForNotification();
1114  }
1115 }
1116 
1117 ::tensorflow::Status TBBSession::WaitForNotification(
1118  Notification* notification, int64 timeout_in_ms) {
1119  if (timeout_in_ms > 0) {
1120  int64 timeout_in_us = timeout_in_ms * 1000;
1121  bool notified = WaitForNotificationWithTimeout(notification, timeout_in_us);
1122  if (!notified) {
1123  return Status(error::DEADLINE_EXCEEDED,
1124  "Timed out waiting for notification");
1125  }
1126  } else {
1127  notification->WaitForNotification();
1128  }
1129  return Status::OK();
1130 }
1131 
1132 } // namespace tensorflow