Skip to content

Commit 95194df

Browse files
committed
fix
1 parent f4cee19 commit 95194df

File tree

3 files changed

+33
-28
lines changed

3 files changed

+33
-28
lines changed

deps/ReactantExtra/.bazelrc

Lines changed: 22 additions & 22 deletions
Original file line numberDiff line numberDiff line change
@@ -29,32 +29,32 @@ build --repo_env=RULES_PYTHON_ENABLE_PYSTAR=0
2929

3030
build -c opt
3131

32-
build:cuda --repo_env TF_NEED_CUDA=1
33-
build:cuda --repo_env TF_NVCC_CLANG=1
34-
build:cuda --repo_env TF_NCCL_USE_STUB=1
35-
build:cuda --repo_env=HERMETIC_CUDA_VERSION="12.8.1"
36-
build:cuda --repo_env=HERMETIC_CUDNN_VERSION="9.8.0"
37-
build:cuda --repo_env=HERMETIC_NVSHMEM_VERSION="3.2.5"
32+
common:cuda --repo_env TF_NEED_CUDA=1
33+
common:cuda --repo_env TF_NVCC_CLANG=1
34+
common:cuda --repo_env TF_NCCL_USE_STUB=1
35+
common:cuda --repo_env=HERMETIC_CUDA_VERSION="12.8.1"
36+
common:cuda --repo_env=HERMETIC_CUDNN_VERSION="9.8.0"
37+
common:cuda --repo_env=HERMETIC_NVSHMEM_VERSION="3.2.5"
3838
# "sm" means we emit only cubin, which is forward compatible within a GPU generation.
3939
# "compute" means we emit both cubin and PTX, which is larger but also forward compatible to future GPU generations.
40-
build:cuda --repo_env HERMETIC_CUDA_COMPUTE_CAPABILITIES="sm_60,sm_70,sm_80,compute_90"
41-
build:cuda --crosstool_top="@local_config_cuda//crosstool:toolchain"
42-
build:cuda --@local_config_cuda//:enable_cuda
40+
common:cuda --repo_env HERMETIC_CUDA_COMPUTE_CAPABILITIES="sm_60,sm_70,sm_80,compute_90"
41+
common:cuda --crosstool_top="@local_config_cuda//crosstool:toolchain"
42+
common:cuda --@local_config_cuda//:enable_cuda
4343
# Default hermetic CUDA and CUDNN versions.
44-
build:cuda --@local_config_cuda//cuda:include_cuda_libs=true
45-
build:cuda --@local_config_cuda//:cuda_compiler=nvcc
46-
# build:cuda --@local_config_nvshmem//:override_include_nvshmem_libs=true
47-
# build:cuda --@local_config_nvshmem//cuda:include_nvshmem_libs=true
44+
common:cuda --@local_config_cuda//cuda:include_cuda_libs=true
45+
common:cuda --@local_config_cuda//:cuda_compiler=nvcc
46+
# common:cuda --@local_config_nvshmem//:override_include_nvshmem_libs=true
47+
# common:cuda --@local_config_nvshmem//cuda:include_nvshmem_libs=true
4848

4949

50-
build:rocm --crosstool_top=@local_config_rocm//crosstool:toolchain
51-
build:rocm --define=using_rocm=true --define=using_rocm_hipcc=true
52-
build:rocm --repo_env TF_NEED_ROCM=1
53-
build:rocm --action_env TF_ROCM_AMDGPU_TARGETS="gfx900,gfx906,gfx908,gfx90a,gfx940,gfx941,gfx942,gfx1030,gfx1100,gfx1200,gfx1201"
50+
common:rocm --crosstool_top=@local_config_rocm//crosstool:toolchain
51+
common:rocm --define=using_rocm=true --define=using_rocm_hipcc=true
52+
common:rocm --repo_env TF_NEED_ROCM=1
53+
common:rocm --action_env TF_ROCM_AMDGPU_TARGETS="gfx900,gfx906,gfx908,gfx90a,gfx940,gfx941,gfx942,gfx1030,gfx1100,gfx1200,gfx1201"
5454

5555
# Build with hipcc for ROCm and clang for the host.
56-
build:rocm --action_env=TF_ROCM_CLANG="1"
57-
build:rocm --action_env=CLANG_COMPILER_PATH="/usr/lib/llvm-18/bin/clang"
58-
build:rocm --copt=-Wno-gnu-offsetof-extensions
59-
build:rocm --copt=-Qunused-arguments
60-
build:rocm --action_env=TF_HIPCC_CLANG="1"
56+
common:rocm --action_env=TF_ROCM_CLANG="1"
57+
common:rocm --action_env=CLANG_COMPILER_PATH="/usr/lib/llvm-18/bin/clang"
58+
common:rocm --copt=-Wno-gnu-offsetof-extensions
59+
common:rocm --copt=-Qunused-arguments
60+
common:rocm --action_env=TF_HIPCC_CLANG="1"

deps/ReactantExtra/API.cpp

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -1626,8 +1626,9 @@ REACTANT_ABI HeldIfrtArray *ifrt_client_assemble_array_from_single_shards(
16261626
REACTANT_ABI HeldIfrtArray *
16271627
ifrt_pjrt_array_create(ifrt::PjRtClient *client,
16281628
HeldValue<std::shared_ptr<xla::PjRtBuffer>> *buffer) {
1629-
return reactant::capture(tsl::RCReference<ifrt::Array>(
1630-
MyValueOrThrow(xla::ifrt::PjRtArray::Create(client, buffer->obj()))));
1629+
return reactant::capture(
1630+
tsl::RCReference<ifrt::Array>(MyValueOrThrow(xla::ifrt::PjRtArray::Create(
1631+
client, buffer->obj(), /*has_custom_layout*/ false))));
16311632
}
16321633

16331634
// we might be interested in the `Compiler::Compile` method variant that accepts
@@ -2373,7 +2374,7 @@ REACTANT_ABI bool hlo_sharding_check_eq(xla::HloSharding *hloSharding,
23732374

23742375
#pragma endregion
23752376

2376-
typedef ifrt::Future<> IfRtFutureType;
2377+
typedef tsl::Future<> IfRtFutureType;
23772378

23782379
REACTANT_ABI void ifrt_free_future(IfRtFutureType *Future) { delete Future; }
23792380

@@ -2600,7 +2601,7 @@ REACTANT_ABI void ifrt_loaded_executable_execute(
26002601
// there is only 1 status and is valid because we set `options.fill_status =
26012602
// true`
26022603
*futures = true;
2603-
*status = new FutureType(result.status);
2604+
*status = new IfRtFutureType(result.status);
26042605

26052606
for (int i = 0; i < num_results; i++) {
26062607
op_results[i] = reactant::capture(result.outputs[i]);

deps/ReactantExtra/WORKSPACE

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@ load("@bazel_tools//tools/build_defs/repo:http.bzl", "http_archive")
33
NSYNC_COMMIT = "82b118aa7ace3132e517e2c467f8732978cf4023"
44
NSYNC_SHA256 = ""
55

6-
ENZYMEXLA_COMMIT = "96bcf384c5dce3341b347554c32bd02b2defc0eb"
6+
ENZYMEXLA_COMMIT = "f46d7016fbc50dc87125bbdfddf71ea6782073fd"
77
ENZYMEXLA_SHA256 = ""
88

99
http_archive(
@@ -34,7 +34,11 @@ LLVM_TARGETS = [
3434
"AArch64",
3535
"X86",
3636
"ARM",
37-
]
37+
]
38+
#+ [
39+
# "PowerPC",
40+
# "SystemZ"
41+
#]
3842

3943
# Uncomment these lines to use a custom LLVM commit
4044
# LLVM_COMMIT = "b39c5cb6977f35ad727d86b2dd6232099734ffd3"

0 commit comments

Comments
 (0)