dd/d39/hlo__ordering_8h_source.html

 /* Copyright 2016 The TensorFlow Authors. All Rights Reserved.

 Licensed under the Apache License, Version 2.0 (the "License");
 you may not use this file except in compliance with the License.
 You may obtain a copy of the License at

     http://www.apache.org/licenses/LICENSE-2.0

 Unless required by applicable law or agreed to in writing, software
 distributed under the License is distributed on an "AS IS" BASIS,
 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 See the License for the specific language governing permissions and
 limitations under the License.
 ==============================================================================*/

 #ifndef TENSORFLOW_COMPILER_XLA_SERVICE_HLO_ORDERING_H_
 #define TENSORFLOW_COMPILER_XLA_SERVICE_HLO_ORDERING_H_

 #include <memory>
 #include <string>
 #include <utility>

 #include "tensorflow/compiler/xla/service/call_graph.h"
 #include "tensorflow/compiler/xla/service/hlo.pb.h"
 #include "tensorflow/compiler/xla/service/hlo_dataflow_analysis.h"
 #include "tensorflow/compiler/xla/service/hlo_instruction.h"
 #include "tensorflow/compiler/xla/service/hlo_module.h"
 #include "tensorflow/compiler/xla/service/hlo_value.h"
 #include "tensorflow/compiler/xla/types.h"
 #include "tensorflow/core/lib/gtl/flatmap.h"

 namespace xla {

 class HloOrdering {
  public:
   HloOrdering(const HloModule* module)
       : module_(module), call_graph_(CallGraph::Build(module)) {}
   virtual ~HloOrdering() = default;

   // Returns true if instruction 'a' executes before instruction 'b'. This is
   // not reflexive, that is, an instruction does not execute before itself.
   bool ExecutesBefore(const HloInstruction* a, const HloInstruction* b) const;

   // Returns whether the value 'a' is defined before the value 'b' under the
   // given ordering.
   bool IsDefinedBefore(const HloValue& a, const HloValue& b) const;

   // Returns whether the given use is before the given value definition under
   // the given ordering.
   bool UseIsBeforeValueDefinition(const HloUse& use, const HloValue& value,
                                   const HloDataflowAnalysis& dataflow) const;
   // Returns whether the given values interfere. Two values interfere if they
   // may both be simultaneously live.
   bool MayInterfere(const HloValue& a, const HloValue& b,
                     const HloDataflowAnalysis& dataflow) const;

   // Returns true if the live range of the given value 'a' is strictly before
   // the live range of value 'b' using the given HLO ordering.
   bool LiveRangeStrictlyBefore(const HloValue& a, const HloValue& b,
                                const HloDataflowAnalysis& dataflow) const;

   // Returns the sequential instruction order for the given computation, or
   // nullptr if the computation does not have a sequential ordering.
   virtual const std::vector<const HloInstruction*>* SequentialOrder(
       const HloComputation& computation) const = 0;

   // Return the call graph of the module used to compute ordering.
   const CallGraph& call_graph() const { return *call_graph_; }

   virtual string ToString() const = 0;

   // Returns the serialized representation of this ordering.
   // Only sequential computation orders are represented.
   HloOrderingProto ToProto() const;

  protected:
   // Returns true if instruction 'a' executes before instruction 'b'.
   // Precondition: 'a' and 'b' are in the same computation.
   //
   // Derived classes should implement this method for determining order of
   // instructions in the same computation. ExecutesBefore() analyzes the
   // callgraph and uses this method to determine ordering of instructions in
   // different computations.
   virtual bool ExecutesBeforeInSameComputation(
       const HloInstruction* a, const HloInstruction* b) const = 0;

   const HloModule* module_;

   std::unique_ptr<CallGraph> call_graph_;
 };

 /*
  * Google Docs:
  * > Base class for partial orderings implemented by a map of predecessors for
  * > each instruction. Subclasses should fill in predecessors_.
  */
 class PredecessorHloOrdering : public HloOrdering {
  public:
   ~PredecessorHloOrdering() override = default;

   // Returns nullptr indicating the computation does not have a sequential
   // ordering.
   const std::vector<const HloInstruction*>* SequentialOrder(
       const HloComputation& computation) const override {
     return nullptr;
   }

   HloReachabilityMap& reachability_map(const HloComputation* computation) {
     return *predecessors_.at(computation);
   }
   const HloReachabilityMap& reachability_map(
       const HloComputation* computation) const {
     return *predecessors_.at(computation);
   }

  protected:
   explicit PredecessorHloOrdering(const HloModule* module);
   string ToStringHelper(const string& name) const;

   bool ExecutesBeforeInSameComputation(const HloInstruction* a,
                                        const HloInstruction* b) const override;

   // For each computation in the module, this is the set of the instruction's
   // predecessors. An instruction is an element of its own predecessor set.
   //
   // Subclasses should fill this in to define the desired ordering.
   tensorflow::gtl::FlatMap<const HloComputation*,
                            std::unique_ptr<HloReachabilityMap>>
       predecessors_;
 };

 /*
  * The following are all from Google Docs
  * An HLO ordering based on data dependencies in the HLO graph. In this partial
  * order, instruction A executes before instruction B only if there is a path
  * from A to B in the HLO graph. For example, given the following graph:
  * ```
  *        param
  *       /     \
  *    negate   exp
  *        \    /
  *         add
  * ```
  *
  *  DependencyHloOrdering gives the following executes-before relations:
  *    param executes before negate, exp, and add
  *    negate executes before add
  *    exp executes before add
  *    add executes before nothing
  *  negate and exp are not ordered because the dependencies allow either to
  *  execute before the other (or in parallel). DependencyHloOrdering ordering
  *  allows maximum parallelism and enables any execution order which satisfies
  *  data dependencies. This requires pessimistic assumptions about buffer live
  *  ranges and can result in more memory used than more constrained orderings.
  */
 class DependencyHloOrdering : public PredecessorHloOrdering {
  public:
   explicit DependencyHloOrdering(const HloModule* module);
   ~DependencyHloOrdering() override = default;

   string ToString() const override;
 };

 class SequentialHloOrdering : public HloOrdering {
  public:
   using HloModuleSequence =
       tensorflow::gtl::FlatMap<const HloComputation*,
                                std::vector<const HloInstruction*>>;

   SequentialHloOrdering(const HloModule* module,
                         const HloModuleSequence& module_sequence);
   ~SequentialHloOrdering() override = default;

   // Returns the sequential instruction order for the given computation.
   const std::vector<const HloInstruction*>* SequentialOrder(
       const HloComputation& computation) const override;

   string ToString() const override;

  protected:
   bool ExecutesBeforeInSameComputation(const HloInstruction* a,
                                        const HloInstruction* b) const override;

   const HloModuleSequence module_sequence_;

   // The position of every instruction in the HLO module in its respective
   // computation sequence (a value of zero indicates the instruction is first in
   // the sequence, etc). Instructions from all computations are contained in
   // this map so more than one instruction may have the same position
   // value. This is not a problem because ExecutesBefore also verifies
   // instructions are in the same computation.
   tensorflow::gtl::FlatMap<const HloInstruction*, int> order_position_;
 };

 std::ostream& operator<<(
     std::ostream& out,
     const SequentialHloOrdering::HloModuleSequence& module_sequence);

 }  // namespace xla

 #endif  // TENSORFLOW_COMPILER_XLA_SERVICE_HLO_ORDERING_H_
xla::SequentialHloOrdering
Definition: hlo_ordering.h:203

xla::HloComputation
Definition: hlo_computation.h:60

xla::HloInstruction
Definition: hlo_instruction.h:165

xla
namespace for xla
Definition: client_library.cc:26

hlo_instruction.h

hlo_module.h

xla::SequentialHloOrdering::HloModuleSequence
tensorflow::gtl::FlatMap< const HloComputation *, std::vector< const HloInstruction * > > HloModuleSequence
Definition: hlo_ordering.h:208

xla::HloModule
Definition: hlo_module.h:52

xla::HloOrdering
Definition: hlo_ordering.h:41