Skip to content

Commit

Permalink
Change CI agent
Browse files Browse the repository at this point in the history
  • Loading branch information
hiento09 committed Aug 4, 2024
1 parent b70f95d commit b643423
Show file tree
Hide file tree
Showing 3 changed files with 15 additions and 11 deletions.
8 changes: 4 additions & 4 deletions .github/workflows/build.yml
Original file line number Diff line number Diff line change
Expand Up @@ -40,15 +40,15 @@ jobs:
include:
- os: "windows"
name: "cuda-12-4"
- runs-on: "windows-tensorrt-llm-0-10-0-cuda-12-4"
+ runs-on: "windows-tensorrt-llm-0-11-0-cuda-12-4"
run-e2e: false
- s3-key-prefix: "windows-tensorrt-llm-tensorrt-llm-0-10-0-ccache"
+ s3-key-prefix: "windows-tensorrt-llm-tensorrt-llm-0-11-0-ccache"
ccache-dir: 'C:\Users\ContainerAdministrator\AppData\Local\ccache'
- os: "linux"
name: "cuda-12-4"
- runs-on: "linux-tensorrt-llm-0-10-0-cuda-12-4"
+ runs-on: "linux-tensorrt-llm-0-11-0-cuda-12-4"
run-e2e: false
- s3-key-prefix: "linux-tensorrt-llm-tensorrt-llm-0-10-0-sccache"
+ s3-key-prefix: "linux-tensorrt-llm-tensorrt-llm-0-11-0-ccache"
ccache-dir: '/home/runner/.cache/ccache'
permissions:
contents: write
Expand Down
8 changes: 4 additions & 4 deletions .github/workflows/quality-gate.yml
Original file line number Diff line number Diff line change
Expand Up @@ -15,15 +15,15 @@ jobs:
include:
- os: "windows"
name: "cuda-12-4"
- runs-on: "windows-tensorrt-llm-0-10-0-cuda-12-4"
+ runs-on: "windows-tensorrt-llm-0-11-0-cuda-12-4"
run-e2e: false
- s3-key-prefix: "windows-tensorrt-llm-tensorrt-llm-0-10-0-ccache"
+ s3-key-prefix: "windows-tensorrt-llm-tensorrt-llm-0-11-0-ccache"
ccache-dir: 'C:\Users\ContainerAdministrator\AppData\Local\ccache'
- os: "linux"
name: "cuda-12-4"
- runs-on: "linux-tensorrt-llm-0-10-0-cuda-12-4"
+ runs-on: "linux-tensorrt-llm-0-11-0-cuda-12-4"
run-e2e: false
- s3-key-prefix: "linux-tensorrt-llm-tensorrt-llm-0-10-0-sccache"
+ s3-key-prefix: "linux-tensorrt-llm-tensorrt-llm-0-11-0-ccache"
ccache-dir: '/home/runner/.cache/ccache'
permissions:
contents: write
Expand Down
10 changes: 7 additions & 3 deletions scripts/build_wheel.py
Original file line number Diff line number Diff line change
Expand Up @@ -84,7 +84,7 @@ def main(*,
build_run('git submodule update --init --recursive')
on_windows = platform.system() == "Windows"
requirements_filename = "requirements-dev-windows.txt" if on_windows else "requirements-dev.txt"
- build_run(f"\"{sys.executable}\" -m pip install -r {requirements_filename}")
+ # build_run(f"\"{sys.executable}\" -m pip install -r {requirements_filename}")
# Ensure TRT is installed on windows to prevent surprises.
reqs = check_output([sys.executable, "-m", "pip", "freeze"])
installed_packages = [r.decode().split("==")[0] for r in reqs.split()]
Expand All @@ -105,7 +105,7 @@ def main(*,
if cuda_architectures is not None else "")

cmake_def_args = []
- cmake_generator = ""
+ cmake_generator = "-GNinja"

hardware_arch = platform.machine()

Expand Down Expand Up @@ -223,6 +223,10 @@ def main(*,
build_dir /
"tensorrt_llm/kernels/decoderMaskedMultiheadAttention/decoderXQAImplJIT/nvrtcWrapper/libtensorrt_llm_nvrtc_wrapper.so",
lib_dir / "libtensorrt_llm_nvrtc_wrapper.so")
+ copy(
+ build_dir /
+ "tensorrt_llm/kernels/decoderMaskedMultiheadAttention/libdecoder_attention.so",
+ lib_dir / "libdecoder_attention.so")

bin_dir = pkg_dir / "bin"
if bin_dir.exists():
Expand Down Expand Up @@ -384,4 +388,4 @@ def add_arguments(parser: ArgumentParser):
parser = ArgumentParser()
add_arguments(parser)
args = parser.parse_args()
- main(**vars(args))
+ main(**vars(args))

0 comments on commit b643423

Please sign in to comment.