# inferless.yaml
# NOTE(review): presumably the version of this config format rather than of the model — confirm.
version: 1.0.0
# Model name; it matches the repository name in `model_url`.
name: idefics-9b-instruct-8bit
# The model is imported from a Git repository (see `model_url` and `provider`).
import_source: GIT
# Framework of the model source. Supported values: ONNX, TENSORFLOW, PYTORCH.
source_framework_type: PYTORCH
# Deployment settings. Every key in this section must be indented under
# `configuration`; at column 0 the mapping itself would be null and the
# settings would become unrelated top-level keys.
configuration:
  # To use a custom runtime, set its id and URL below. Find the id by running
  # `inferless runtime list`, or create one with `inferless runtime upload`.
  # NOTE: this is not yet supported for Serverless.
  custom_runtime_id: ''
  custom_runtime_url: ''

  # To use a custom volume, set its id and name below. Find them by running
  # `inferless volume list`, or create one with
  # `inferless volume create -n {VOLUME_NAME}`.
  # NOTE: this is not yet supported for Serverless.
  custom_volume_id: ''
  custom_volume_name: ''

  gpu_type: T4
  # Numeric settings are deliberately kept as quoted strings, exactly as they
  # were written originally; do not unquote them without checking the consumer.
  inference_time: '180'  # presumably seconds — TODO confirm
  is_dedicated: true
  is_serverless: false
  max_replica: '1'
  min_replica: '0'
  scale_down_delay: '600'  # presumably seconds — TODO confirm
  region: region-1
  vcpu: '3'
  ram: '20'  # presumably GB — TODO confirm
# No environment variables are set; the key is intentionally left empty.
env:
  # Add your environment variables here as indented `NAME: 'value'` pairs, e.g.
  # ENV: 'PROD'
# No secrets are attached; the key is intentionally left empty.
secrets:
  # Add your secret ids here as indented list items; you can find them by
  # running `inferless secrets list`, e.g.
  # - 65723205-ce21-4392-a10b-3tf00c58988c
# File-name overrides. These keys must be indented under `optional`; at
# column 0 `optional` itself would be null and the names would become
# unrelated top-level keys.
optional:
  # You can update the file names here.
  input_file_name: input.json
  output_file_name: output.json
  # NOTE(review): assumed to belong under `optional` together with the other
  # `*_file_name` keys — confirm against the Inferless CLI.
  runtime_file_name: inferless-runtime-config.yaml
# Git repository the model is imported from (pairs with `import_source: GIT`).
model_url: https://github.com/inferless/idefics-9b-instruct-8bit.git
# Hosting provider of the repository in `model_url`.
provider: GITHUB
# NOTE(review): presumably tells Inferless to use an input/output schema for the model — confirm.
io_schema: true