From 00458b90bef441c375ba44bf6e18a7f656160e68 Mon Sep 17 00:00:00 2001 From: Siddharth Venkatesan Date: Wed, 13 Nov 2024 11:34:38 -0800 Subject: [PATCH] [djl][trtllm] adding lmi-trt inference images for patch/release (#4419) --- release_images_inference.yml | 40 +++++++++++++++++++++++++++++------- 1 file changed, 33 insertions(+), 7 deletions(-) diff --git a/release_images_inference.yml b/release_images_inference.yml index 6b9bcaf688b5..ccc6ad547c03 100644 --- a/release_images_inference.yml +++ b/release_images_inference.yml @@ -58,14 +58,14 @@ release_images: force_release: False 5: framework: "djl" - version: "0.28.0" + version: "0.26.0" arch_type: "x86" inference: device_types: [ "gpu" ] python_versions: [ "py310" ] os_version: "ubuntu22.04" - lmi_version: "10.0.0" - cuda_version: "cu124" + tensorrtllm_version: "0.7.1" + cuda_version: "cu122" example: False disable_sm_tag: True force_release: False @@ -146,6 +146,32 @@ release_images: disable_sm_tag: False force_release: False 12: + framework: "djl" + version: "0.27.0" + arch_type: "x86" + inference: + device_types: [ "gpu" ] + python_versions: [ "py310" ] + os_version: "ubuntu22.04" + tensorrtllm_version: "0.8.0" + cuda_version: "cu122" + example: False + disable_sm_tag: True + force_release: False + 13: + framework: "djl" + version: "0.28.0" + arch_type: "x86" + inference: + device_types: [ "gpu" ] + python_versions: [ "py310" ] + os_version: "ubuntu22.04" + tensorrtllm_version: "0.9.0" + cuda_version: "cu122" + example: False + disable_sm_tag: True + force_release: False + 14: framework: "djl" version: "0.29.0" arch_type: "x86" @@ -153,12 +179,12 @@ release_images: device_types: [ "gpu" ] python_versions: [ "py310" ] os_version: "ubuntu22.04" - lmi_version: "11.0.0" + tensorrtllm_version: "0.11.0" cuda_version: "cu124" example: False disable_sm_tag: True force_release: False - 13: + 15: framework: "djl" version: "0.30.0" arch_type: "x86" @@ -166,8 +192,8 @@ release_images: device_types: [ "gpu" ] python_versions: [ "py310" ] os_version: "ubuntu22.04" - lmi_version: "12.0.0" - cuda_version: "cu124" + tensorrtllm_version: "0.12.0" + cuda_version: "cu125" example: False disable_sm_tag: True force_release: False