update
This commit is contained in:
parent
b7828ae733
commit
a5d3888fca
294
resource.yaml
294
resource.yaml
@ -1,297 +1,13 @@
|
||||
|
||||
|
||||
resource_packages:
|
||||
- name: contest_on_demand_a100_x1
|
||||
default_deploy_engine: vllm
|
||||
description: 适用于非常驻服务7b/14b-int4推理
|
||||
resources:
|
||||
memory: 20Gi
|
||||
cpu: 4
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: A10080G
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 1
|
||||
cpu: 4
|
||||
memory: 20Gi
|
||||
description: 适用于非常驻服务7b/14b-int4推理
|
||||
- name: contest_on_demand_a100_x4
|
||||
default_deploy_engine: vllm
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: A10080G
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 4
|
||||
cpu: 5
|
||||
memory: 100Gi
|
||||
description: 适用于非常驻服务7b/14b-int4推理
|
||||
- name: contest_on_demand_a100_x2
|
||||
default_deploy_engine: vllm
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: A10080G
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 2
|
||||
cpu: 4
|
||||
memory: 20Gi
|
||||
description: 适用于非常驻服务7b/14b-int4推理
|
||||
|
||||
- name: Ephemeral-RTX3090*1
|
||||
default_deploy_engine: vllm
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 1
|
||||
cpu: 4
|
||||
memory: 20Gi
|
||||
description: 适用于非常驻服务7b/14b-int4推理
|
||||
- name: Ephemeral-RTX3090*2
|
||||
default_deploy_engine: vllm
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 2
|
||||
cpu: 4
|
||||
memory: 20Gi
|
||||
description: 适用于非常驻服务7b/14b-int4推理
|
||||
- name: R200-8F*1
|
||||
deploy_engines:
|
||||
- slx-infer-kunlunxin
|
||||
default_deploy_engine: slx-infer-kunlunxin
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: R200-8F
|
||||
gpu_key: baidu.com/xpu
|
||||
gpu_value: 1
|
||||
cpu: 20
|
||||
memory: 100Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: R200-8F*2
|
||||
deploy_engines:
|
||||
- slx-infer-kunlunxin
|
||||
default_deploy_engine: slx-infer-kunlunxin
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: R200-8F
|
||||
gpu_key: baidu.com/xpu
|
||||
gpu_value: 2
|
||||
cpu: 20
|
||||
memory: 100Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: R200-8F*4
|
||||
deploy_engines:
|
||||
- slx-infer-kunlunxin
|
||||
default_deploy_engine: slx-infer-kunlunxin
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: R200-8F
|
||||
gpu_key: baidu.com/xpu
|
||||
gpu_value: 4
|
||||
cpu: 20
|
||||
memory: 100Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: MLU370-X4*1
|
||||
deploy_engines:
|
||||
- slx-infer-cambricon
|
||||
default_deploy_engine: slx-infer-cambricon
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: MLU370-X4
|
||||
gpu_key: cambricon.com/mlu
|
||||
gpu_value: 1
|
||||
cpu: 10
|
||||
memory: 20Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
|
||||
- name: MLU370-X4*2
|
||||
deploy_engines:
|
||||
- slx-infer-cambricon
|
||||
default_deploy_engine: slx-infer-cambricon
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: MLU370-X4
|
||||
gpu_key: cambricon.com/mlu
|
||||
gpu_value: 2
|
||||
cpu: 10
|
||||
memory: 20Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: Iluvatar MR-V100*1
|
||||
deploy_engines:
|
||||
- slx-infer-iluvatar
|
||||
default_deploy_engine: slx-infer-iluvatar
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: Iluvatar MR-V100
|
||||
gpu_key: iluvatar.ai/gpu
|
||||
gpu_value: 1
|
||||
cpu: 10
|
||||
memory: 20Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: Iluvatar MR-V100*2
|
||||
deploy_engines:
|
||||
- slx-infer-iluvatar
|
||||
default_deploy_engine: slx-infer-iluvatar
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: Iluvatar MR-V100
|
||||
gpu_key: iluvatar.ai/gpu
|
||||
gpu_value: 2
|
||||
cpu: 10
|
||||
memory: 20Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: Iluvatar MR-V100*4
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: Iluvatar MR-V100
|
||||
gpu_key: iluvatar.ai/gpu
|
||||
gpu_value: 4
|
||||
cpu: 10
|
||||
memory: 20Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: RTX3090*1
|
||||
deploy_engines:
|
||||
- ascend_infer
|
||||
- vllm
|
||||
default_deploy_engine: vllm
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: NVIDIA GeForce RTX 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 1
|
||||
cpu: 10
|
||||
memory: 20Gi
|
||||
description: 适用于7b/14b-int4推理
|
||||
- name: RTX3090*2
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: NVIDIA GeForce RTX 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 2
|
||||
cpu: 10
|
||||
memory: 80Gi
|
||||
description: 适用于 sagegpt / 34b-int4
|
||||
- name: RTX3090*4
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: NVIDIA GeForce RTX 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 4
|
||||
cpu: 10
|
||||
memory: 40Gi
|
||||
description: 适用于 72b-int4
|
||||
- name: vmemory-24Gi
|
||||
resources:
|
||||
gpu:
|
||||
type: vgpu
|
||||
device_label: NVIDIA GeForce RTX 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 1
|
||||
memory_key: nvidia.com/gpumem
|
||||
memory_value: 24576
|
||||
cpu: 10
|
||||
memory: 20Gi
|
||||
description: 适用于14b-int4/7b模型上线推理
|
||||
|
||||
- name: vmemory-2-48Gi
|
||||
resources:
|
||||
gpu:
|
||||
type: vgpu
|
||||
device_label: NVIDIA GeForce RTX 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 2
|
||||
memory_key: nvidia.com/gpumem
|
||||
memory_value: 24576
|
||||
cpu: 10
|
||||
memory: 100Gi
|
||||
description: 适用于式说大模型
|
||||
|
||||
- name: vmemory-10Gi
|
||||
resources:
|
||||
gpu:
|
||||
type: vgpu
|
||||
device_label: NVIDIA GeForce RTX 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 1
|
||||
memory_key: nvidia.com/gpumem
|
||||
memory_value: 10000
|
||||
cpu: 1
|
||||
memory: 10Gi
|
||||
description: 适用于7b-int4/embedding模型上线推理
|
||||
- name: A100-14b模型推理套餐
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: Nvidia A100(80G)
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 1
|
||||
cpu: 4
|
||||
memory: 20Gi
|
||||
description: 适用于14b模型上线推理
|
||||
- name: A100-14b模型推理套餐1
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: Nvidia A100(80G)
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 1
|
||||
cpu: 4
|
||||
memory: 20Gi
|
||||
description: 适用于14b模型上线推理
|
||||
- name: A100-7b模型训练套餐(此种情况为非vgpu)
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: Nvidia A100(80G)
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 2
|
||||
cpu: 40
|
||||
memory: 128Gi
|
||||
description: 适用于7b模型finetune
|
||||
|
||||
- name: 演示空间入门套餐
|
||||
resources:
|
||||
cpu: 1
|
||||
memory: 2Gi
|
||||
description: 适用于7b模型int4推理
|
||||
- name: 演示空间初级套餐
|
||||
resources:
|
||||
gpu: {}
|
||||
cpu: 2
|
||||
memory: 4Gi
|
||||
description: 适用于演示空间
|
||||
- name: 演示空间中级套餐
|
||||
resources:
|
||||
gpu: {}
|
||||
cpu: 4
|
||||
memory: 16Gi
|
||||
description: 适用于演示空间
|
||||
- name: 演示空间高级套餐
|
||||
resources:
|
||||
gpu: {}
|
||||
cpu: 8
|
||||
memory: 32Gi
|
||||
description: 适用于演示空间
|
||||
- name: RTX3090*8
|
||||
resources:
|
||||
gpu:
|
||||
type: gpu
|
||||
device_label: NVIDIA GeForce RTX 3090
|
||||
gpu_key: nvidia.com/gpu
|
||||
gpu_value: 8
|
||||
cpu: 10
|
||||
memory: 200Gi
|
||||
description: 适用于finetune
|
||||
memory_key: null
|
||||
memory_value: null
|
||||
|
||||
Loading…
Reference in New Issue
Block a user