• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /* Copyright 2018 The TensorFlow Authors. All Rights Reserved.
2 
3 Licensed under the Apache License, Version 2.0 (the "License");
4 you may not use this file except in compliance with the License.
5 You may obtain a copy of the License at
6 
7     http://www.apache.org/licenses/LICENSE-2.0
8 
9 Unless required by applicable law or agreed to in writing, software
10 distributed under the License is distributed on an "AS IS" BASIS,
11 WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 See the License for the specific language governing permissions and
13 limitations under the License.
14 ==============================================================================*/
15 
16 #ifndef TENSORFLOW_COMPILER_XLA_SERVICE_GPU_TESTS_GPU_CODEGEN_TEST_H_
17 #define TENSORFLOW_COMPILER_XLA_SERVICE_GPU_TESTS_GPU_CODEGEN_TEST_H_
18 
19 #include <memory>
20 #include <string>
21 
22 #include "tensorflow/compiler/xla/tests/llvm_irgen_test_base.h"
23 #include "tensorflow/compiler/xla/tests/verified_hlo_module.h"
24 
25 namespace xla {
26 namespace gpu {
27 
28 // Tests that verify IR or PTX emitted by the GPU backend is as expected.
29 class GpuCodegenTest : public LlvmIrGenTestBase {
30  public:
GpuCodegenTest()31   GpuCodegenTest()
32       : is_built_with_rocm_(
33             se::MultiPlatformManager::PlatformWithName("ROCM").ok()) {}
34 
35  protected:
36   // Like HloTestBase::CreateNewVerifiedModule(), with a flag for configuring
37   // the ftz option.
38   std::unique_ptr<VerifiedHloModule> CreateNewVerifiedModuleWithFTZ(bool ftz);
39 
40   // Compiles the given HLO module to PTX and verifies the PTX matches the given
41   // FileCheck pattern.  (See http://llvm.org/docs/CommandGuide/FileCheck.html).
42   // The "VerifyPtx" part only happens on the CUDA platform,
43   // and hence the "Optionally" in function name.
44   // For ROCm platform this routine will only do the "Compile" part.
45   void CompileAndOptionallyVerifyPtx(
46       std::unique_ptr<VerifiedHloModule> hlo_module, absl::string_view pattern);
47 
48   bool is_built_with_rocm_;
49 };
50 
51 }  // namespace gpu
52 }  // namespace xla
53 
54 #endif  // TENSORFLOW_COMPILER_XLA_SERVICE_GPU_TESTS_GPU_CODEGEN_TEST_H_
55