87 lines
2.9 KiB
C++
87 lines
2.9 KiB
C++
/* Copyright 2020 The OpenXLA Authors.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
==============================================================================*/
|
|
|
|
#ifndef XLA_SERVICE_TOPK_REWRITER_H_
|
|
#define XLA_SERVICE_TOPK_REWRITER_H_
|
|
|
|
#include <functional>
|
|
#include <memory>
|
|
#include <optional>
|
|
#include <utility>
|
|
|
|
#include "xla/hlo/ir/dfs_hlo_visitor_with_default.h"
|
|
#include "xla/hlo/ir/hlo_instruction.h"
|
|
#include "xla/hlo/ir/hlo_instructions.h"
|
|
#include "xla/hlo/ir/hlo_module.h"
|
|
#include "xla/service/hlo_pass_interface.h"
|
|
|
|
namespace xla {
|
|
|
|
// This pass pattern-matches soups of HLOs executing a TopK operation and
|
|
// replaces them with a TopK CustomCall when the given values are supported by
|
|
// the CustomCall and it is more efficient to use that implementation.
|
|
class TopkRewriter : public HloModulePass {
|
|
public:
|
|
explicit TopkRewriter(std::function<bool(const HloSortInstruction*, int64_t)>
|
|
is_profitable_to_convert)
|
|
: is_profitable_to_convert_(std::move(is_profitable_to_convert)) {}
|
|
|
|
absl::string_view name() const override { return "topk-rewriter"; }
|
|
|
|
using HloPassInterface::Run;
|
|
StatusOr<bool> Run(
|
|
HloModule* module,
|
|
const absl::flat_hash_set<absl::string_view>& execution_threads) override;
|
|
|
|
protected:
|
|
// Check if the sort instruction is in TopK.
|
|
std::optional<int64_t> SortIsInTopK(HloInstruction* inst);
|
|
|
|
// Transform to CustomCall.
|
|
StatusOr<bool> TransformToCustomCall(
|
|
HloModule* module,
|
|
const absl::flat_hash_set<absl::string_view>& execution_threads);
|
|
|
|
private:
|
|
// Predicate that returns true if a sort instruction is profitable to be
|
|
// converted into a custom call.
|
|
std::function<bool(const HloSortInstruction*, int64_t)>
|
|
is_profitable_to_convert_;
|
|
|
|
// Matches the input to the sort+iota+slice pattern and converts to custom
|
|
// call if profitable. Returns the custom call if one was created.
|
|
StatusOr<HloInstruction*> TransformPatternToCustomCall(HloInstruction* inst);
|
|
};
|
|
|
|
class TopkDecomposer : public HloModulePass {
|
|
public:
|
|
absl::string_view name() const override { return "topk-decomposer"; }
|
|
|
|
explicit TopkDecomposer(HloPredicate should_decompose = {})
|
|
: should_decompose_(should_decompose) {}
|
|
|
|
using HloPassInterface::Run;
|
|
StatusOr<bool> Run(
|
|
HloModule* module,
|
|
const absl::flat_hash_set<absl::string_view>& execution_threads) override;
|
|
|
|
private:
|
|
HloPredicate should_decompose_;
|
|
};
|
|
|
|
} // namespace xla
|
|
|
|
#endif // XLA_SERVICE_TOPK_REWRITER_H_
|