---
# Catalogue of selectable compute resource packages.
#
# Every entry under `resource_packages` has the same shape:
#   name         - identifier of the package (kept byte-for-byte; may be
#                  referenced by other systems)
#   description  - free-text description, or null when none is given
#   resources:
#     memory     - memory quantity string (e.g. 20Gi)
#     cpu        - CPU count (integer)
#     gpu:
#       type          - `gpu` or `vgpu`
#       device_label  - accelerator model label
#       gpu_key       - accelerator resource key (e.g. nvidia.com/gpu);
#                       presumably a Kubernetes extended-resource name,
#                       confirm with the consumer
#       gpu_value     - number of accelerators requested under gpu_key
#       memory_key    - null in every entry of this file
#       memory_value  - quoted number or null; presumably per-device memory
#                       in GiB (TODO confirm with the consumer)
resource_packages:
- name: contest_on_demand_a100_x1
  description: 适用于非常驻服务7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: A10080G
      gpu_key: nvidia.com/gpu
      gpu_value: 1
      memory_key: null
      memory_value: '80'
- name: contest_on_demand_a100_x4
  # NOTE(review): description is identical to the x1 package above; confirm
  # it is intended for the 4-GPU package as well.
  description: 适用于非常驻服务7b/14b-int4推理
  resources:
    memory: 100Gi
    cpu: 5
    gpu:
      type: gpu
      device_label: A10080G
      gpu_key: nvidia.com/gpu
      gpu_value: 4
      memory_key: null
      memory_value: '80'
- name: Ephemeral-RTX3090*1
  description: 适用于非常驻服务7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: '3090'
      gpu_key: nvidia.com/gpu
      gpu_value: 1
      memory_key: null
      memory_value: null
- name: Ephemeral-RTX3090*2
  description: 适用于非常驻服务7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: '3090'
      gpu_key: nvidia.com/gpu
      gpu_value: 2
      memory_key: null
      memory_value: null
- name: R200-8F*1
  description: 适用于7b/14b-int4推理
  resources:
    memory: 100Gi
    cpu: 20
    gpu:
      type: gpu
      device_label: R200-8F
      gpu_key: baidu.com/xpu
      gpu_value: 1
      memory_key: null
      memory_value: null
- name: R200-8F*2
  description: 适用于7b/14b-int4推理
  resources:
    memory: 100Gi
    cpu: 20
    gpu:
      type: gpu
      device_label: R200-8F
      gpu_key: baidu.com/xpu
      gpu_value: 2
      memory_key: null
      memory_value: null
- name: R200-8F*4
  description: 适用于7b/14b-int4推理
  resources:
    memory: 100Gi
    cpu: 20
    gpu:
      type: gpu
      device_label: R200-8F
      gpu_key: baidu.com/xpu
      gpu_value: 4
      memory_key: null
      memory_value: null
- name: MLU370-X4*1
  description: 适用于7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: MLU370-X4
      gpu_key: cambricon.com/mlu
      gpu_value: 1
      memory_key: null
      memory_value: null
- name: MLU370-X4*2
  description: 适用于7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: MLU370-X4
      gpu_key: cambricon.com/mlu
      gpu_value: 2
      memory_key: null
      memory_value: null
- name: MR-V100*1
  description: 适用于7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: Iluvatar MR-V100
      gpu_key: iluvatar.ai/gpu
      gpu_value: 1
      memory_key: null
      memory_value: null
- name: MR-V100*2
  description: 适用于7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: Iluvatar MR-V100
      gpu_key: iluvatar.ai/gpu
      gpu_value: 2
      memory_key: null
      memory_value: null
- name: MR-V100*4
  description: 适用于7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: Iluvatar MR-V100
      gpu_key: iluvatar.ai/gpu
      gpu_value: 4
      memory_key: null
      memory_value: null
# NOTE(review): this name starts with a space, unlike RTX3090*2/*4/*8 below.
# Looks like a typo, but it is kept as-is because the name may be referenced
# elsewhere - confirm before normalising.
- name: ' RTX3090*1'
  description: 适用于7b/14b-int4推理
  resources:
    memory: 20Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: NVIDIA GeForce RTX 3090
      gpu_key: nvidia.com/gpu
      gpu_value: 1
      memory_key: null
      memory_value: null
- name: RTX3090*2
  description: 适用于 sagegpt / 34b-int4
  resources:
    memory: 80Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: NVIDIA GeForce RTX 3090
      gpu_key: nvidia.com/gpu
      gpu_value: 2
      memory_key: null
      memory_value: null
- name: RTX3090*4
  # NOTE(review): the description carries a trailing space inside the quotes.
  description: '适用于 72b-int4 '
  resources:
    memory: 40Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: NVIDIA GeForce RTX 3090
      gpu_key: nvidia.com/gpu
      gpu_value: 4
      memory_key: null
      memory_value: null
- name: vmemory-24Gi
  description: 适用于14b-int4/7b模型上线推理
  resources:
    memory: 20Gi
    cpu: 10
    gpu:
      type: vgpu
      device_label: NVIDIA GeForce RTX 3090
      gpu_key: nvidia.com/gpu
      gpu_value: 1
      memory_key: null
      memory_value: '24'
- name: vmemory-2-48Gi
  # NOTE(review): the description carries a trailing space inside the quotes.
  description: '适用于式说大模型 '
  resources:
    memory: 100Gi
    cpu: 10
    gpu:
      type: vgpu
      device_label: NVIDIA GeForce RTX 3090
      gpu_key: nvidia.com/gpu
      gpu_value: 2
      memory_key: null
      memory_value: '24'
- name: vmemory-10Gi
  description: 适用于7b-int4/embedding模型上线推理
  resources:
    memory: 10Gi
    cpu: 1
    gpu:
      type: vgpu
      device_label: NVIDIA GeForce RTX 3090
      gpu_key: nvidia.com/gpu
      gpu_value: 1
      memory_key: null
      # NOTE(review): the package name says 10Gi but memory_value is '24',
      # the same as vmemory-24Gi - confirm whether '10' was intended.
      memory_value: '24'
- name: A100-14b模型推理套餐
  description: 适用于14b模型上线推理
  resources:
    memory: 20Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: Nvidia A100(80G)
      gpu_key: nvidia.com/gpu
      gpu_value: 1
      memory_key: null
      memory_value: '80'
- name: A100-14b模型推理套餐1
  description: 适用于14b模型上线推理
  resources:
    memory: 20Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: Nvidia A100(80G)
      gpu_key: nvidia.com/gpu
      gpu_value: 1
      memory_key: null
      memory_value: '80'
- name: A100-7b模型训练套餐(此种情况为非vgpu)
  description: 适用于7b模型finetune
  resources:
    memory: 128Gi
    cpu: 40
    gpu:
      type: gpu
      device_label: Nvidia A100(80G)
      gpu_key: nvidia.com/gpu
      gpu_value: 2
      memory_key: null
      memory_value: '80'
- name: RTX3090*8
  description: 适用于finetune
  resources:
    memory: 200Gi
    cpu: 10
    gpu:
      type: gpu
      device_label: NVIDIA GeForce RTX 3090
      gpu_key: nvidia.com/gpu
      gpu_value: 8
      memory_key: null
      memory_value: null
- name: 沐曦C500资源套餐
  description: null
  resources:
    memory: 20Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: MXC500
      gpu_key: metax-tech.com/gpu
      gpu_value: 2
      memory_key: null
      memory_value: '64'
- name: 天数BIV100资源套餐
  description: null
  resources:
    memory: 50Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: IluvatarBIV100
      gpu_key: iluvatar.ai/gpu
      gpu_value: 2
      memory_key: null
      memory_value: '32'
- name: 华为910B*4 资源套餐
  description: null
  resources:
    memory: 50Gi
    cpu: 8
    gpu:
      type: gpu
      device_label: 910b
      gpu_key: huawei.com/Ascend910B
      gpu_value: 4
      memory_key: null
      memory_value: null
- name: 华为910B*1 资源套餐
  description: null
  resources:
    memory: 50Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: 910b
      gpu_key: huawei.com/Ascend910B
      gpu_value: 1
      memory_key: null
      memory_value: null
- name: 华为910B*2 资源套餐
  description: null
  resources:
    memory: 50Gi
    cpu: 4
    gpu:
      type: gpu
      device_label: 910b
      gpu_key: huawei.com/Ascend910B
      gpu_value: 2
      memory_key: null
      memory_value: null