diff --git a/resource.yaml b/resource.yaml index 396c0df..8e227af 100644 --- a/resource.yaml +++ b/resource.yaml @@ -1,297 +1,13 @@ - - resource_packages: - name: contest_on_demand_a100_x1 - default_deploy_engine: vllm + description: 适用于非常驻服务7b/14b-int4推理 resources: + memory: 20Gi + cpu: 4 gpu: type: gpu device_label: A10080G gpu_key: nvidia.com/gpu gpu_value: 1 - cpu: 4 - memory: 20Gi - description: 适用于非常驻服务7b/14b-int4推理 -- name: contest_on_demand_a100_x4 - default_deploy_engine: vllm - resources: - gpu: - type: gpu - device_label: A10080G - gpu_key: nvidia.com/gpu - gpu_value: 4 - cpu: 5 - memory: 100Gi - description: 适用于非常驻服务7b/14b-int4推理 -- name: contest_on_demand_a100_x2 - default_deploy_engine: vllm - resources: - gpu: - type: gpu - device_label: A10080G - gpu_key: nvidia.com/gpu - gpu_value: 2 - cpu: 4 - memory: 20Gi - description: 适用于非常驻服务7b/14b-int4推理 - -- name: Ephemeral-RTX3090*1 - default_deploy_engine: vllm - resources: - gpu: - type: gpu - device_label: 3090 - gpu_key: nvidia.com/gpu - gpu_value: 1 - cpu: 4 - memory: 20Gi - description: 适用于非常驻服务7b/14b-int4推理 -- name: Ephemeral-RTX3090*2 - default_deploy_engine: vllm - resources: - gpu: - type: gpu - device_label: 3090 - gpu_key: nvidia.com/gpu - gpu_value: 2 - cpu: 4 - memory: 20Gi - description: 适用于非常驻服务7b/14b-int4推理 -- name: R200-8F*1 - deploy_engines: - - slx-infer-kunlunxin - default_deploy_engine: slx-infer-kunlunxin - resources: - gpu: - type: gpu - device_label: R200-8F - gpu_key: baidu.com/xpu - gpu_value: 1 - cpu: 20 - memory: 100Gi - description: 适用于7b/14b-int4推理 -- name: R200-8F*2 - deploy_engines: - - slx-infer-kunlunxin - default_deploy_engine: slx-infer-kunlunxin - resources: - gpu: - type: gpu - device_label: R200-8F - gpu_key: baidu.com/xpu - gpu_value: 2 - cpu: 20 - memory: 100Gi - description: 适用于7b/14b-int4推理 -- name: R200-8F*4 - deploy_engines: - - slx-infer-kunlunxin - default_deploy_engine: slx-infer-kunlunxin - resources: - gpu: - type: gpu - device_label: R200-8F - gpu_key: baidu.com/xpu - gpu_value: 4 - cpu: 20 - memory: 100Gi - description: 适用于7b/14b-int4推理 -- name: MLU370-X4*1 - deploy_engines: - - slx-infer-cambricon - default_deploy_engine: slx-infer-cambricon - resources: - gpu: - type: gpu - device_label: MLU370-X4 - gpu_key: cambricon.com/mlu - gpu_value: 1 - cpu: 10 - memory: 20Gi - description: 适用于7b/14b-int4推理 - -- name: MLU370-X4*2 - deploy_engines: - - slx-infer-cambricon - default_deploy_engine: slx-infer-cambricon - resources: - gpu: - type: gpu - device_label: MLU370-X4 - gpu_key: cambricon.com/mlu - gpu_value: 2 - cpu: 10 - memory: 20Gi - description: 适用于7b/14b-int4推理 -- name: Iluvatar MR-V100*1 - deploy_engines: - - slx-infer-iluvatar - default_deploy_engine: slx-infer-iluvatar - resources: - gpu: - type: gpu - device_label: Iluvatar MR-V100 - gpu_key: iluvatar.ai/gpu - gpu_value: 1 - cpu: 10 - memory: 20Gi - description: 适用于7b/14b-int4推理 -- name: Iluvatar MR-V100*2 - deploy_engines: - - slx-infer-iluvatar - default_deploy_engine: slx-infer-iluvatar - resources: - gpu: - type: gpu - device_label: Iluvatar MR-V100 - gpu_key: iluvatar.ai/gpu - gpu_value: 2 - cpu: 10 - memory: 20Gi - description: 适用于7b/14b-int4推理 -- name: Iluvatar MR-V100*4 - resources: - gpu: - type: gpu - device_label: Iluvatar MR-V100 - gpu_key: iluvatar.ai/gpu - gpu_value: 4 - cpu: 10 - memory: 20Gi - description: 适用于7b/14b-int4推理 -- name: RTX3090*1 - deploy_engines: - - ascend_infer - - vllm - default_deploy_engine: vllm - resources: - gpu: - type: gpu - device_label: NVIDIA GeForce RTX 3090 - gpu_key: nvidia.com/gpu - gpu_value: 1 - cpu: 10 - memory: 20Gi - description: 适用于7b/14b-int4推理 -- name: RTX3090*2 - resources: - gpu: - type: gpu - device_label: NVIDIA GeForce RTX 3090 - gpu_key: nvidia.com/gpu - gpu_value: 2 - cpu: 10 - memory: 80Gi - description: 适用于 sagegpt / 34b-int4 -- name: RTX3090*4 - resources: - gpu: - type: gpu - device_label: NVIDIA GeForce RTX 3090 - gpu_key: nvidia.com/gpu - gpu_value: 4 - cpu: 10 - memory: 40Gi - description: 适用于 72b-int4 -- name: vmemory-24Gi - resources: - gpu: - type: vgpu - device_label: NVIDIA GeForce RTX 3090 - gpu_key: nvidia.com/gpu - gpu_value: 1 - memory_key: nvidia.com/gpumem - memory_value: 24576 - cpu: 10 - memory: 20Gi - description: 适用于14b-int4/7b模型上线推理 - -- name: vmemory-2-48Gi - resources: - gpu: - type: vgpu - device_label: NVIDIA GeForce RTX 3090 - gpu_key: nvidia.com/gpu - gpu_value: 2 - memory_key: nvidia.com/gpumem - memory_value: 24576 - cpu: 10 - memory: 100Gi - description: 适用于式说大模型 - -- name: vmemory-10Gi - resources: - gpu: - type: vgpu - device_label: NVIDIA GeForce RTX 3090 - gpu_key: nvidia.com/gpu - gpu_value: 1 - memory_key: nvidia.com/gpumem - memory_value: 10000 - cpu: 1 - memory: 10Gi - description: 适用于7b-int4/embedding模型上线推理 -- name: A100-14b模型推理套餐 - resources: - gpu: - type: gpu - device_label: Nvidia A100(80G) - gpu_key: nvidia.com/gpu - gpu_value: 1 - cpu: 4 - memory: 20Gi - description: 适用于14b模型上线推理 -- name: A100-14b模型推理套餐1 - resources: - gpu: - type: gpu - device_label: Nvidia A100(80G) - gpu_key: nvidia.com/gpu - gpu_value: 1 - cpu: 4 - memory: 20Gi - description: 适用于14b模型上线推理 -- name: A100-7b模型训练套餐(此种情况为非vgpu) - resources: - gpu: - type: gpu - device_label: Nvidia A100(80G) - gpu_key: nvidia.com/gpu - gpu_value: 2 - cpu: 40 - memory: 128Gi - description: 适用于7b模型finetune - -- name: 演示空间入门套餐 - resources: - cpu: 1 - memory: 2Gi - description: 适用于7b模型int4推理 -- name: 演示空间初级套餐 - resources: - gpu: {} - cpu: 2 - memory: 4Gi - description: 适用于演示空间 -- name: 演示空间中级套餐 - resources: - gpu: {} - cpu: 4 - memory: 16Gi - description: 适用于演示空间 -- name: 演示空间高级套餐 - resources: - gpu: {} - cpu: 8 - memory: 32Gi - description: 适用于演示空间 -- name: RTX3090*8 - resources: - gpu: - type: gpu - device_label: NVIDIA GeForce RTX 3090 - gpu_key: nvidia.com/gpu - gpu_value: 8 - cpu: 10 - memory: 200Gi - description: 适用于finetune \ No newline at end of file + memory_key: null + memory_value: null