update
This commit is contained in:
parent
9ba4f36a76
commit
4eda5900c3
@ -13,17 +13,14 @@ resource_packages:
|
|||||||
memory: 20Gi
|
memory: 20Gi
|
||||||
description: 适用于非常驻服务7b/14b-int4推理
|
description: 适用于非常驻服务7b/14b-int4推理
|
||||||
- name: contest_on_demand_a100_x2
|
- name: contest_on_demand_a100_x2
|
||||||
deploy_engines:
|
|
||||||
- ascend_infer
|
|
||||||
- vllm
|
|
||||||
default_deploy_engine: vllm
|
default_deploy_engine: vllm
|
||||||
resources:
|
resources:
|
||||||
gpu:
|
gpu:
|
||||||
type: gpu
|
type: gpu
|
||||||
device_label: NVIDIA GeForce RTX 3090
|
device_label: A10080G
|
||||||
gpu_key: nvidia.com/gpu
|
gpu_key: nvidia.com/gpu
|
||||||
gpu_value: 2
|
gpu_value: 2
|
||||||
cpu: 10
|
cpu: 4
|
||||||
memory: 20Gi
|
memory: 20Gi
|
||||||
description: 适用于非常驻服务7b/14b-int4推理
|
description: 适用于非常驻服务7b/14b-int4推理
|
||||||
|
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user