# Catalogue of resource packages. Each entry has a `name`, a `description`
# string, and a `resources` mapping holding memory, cpu and accelerator
# settings. All names and description strings are kept verbatim.
#
# NOTE(review): the nesting below (gpu under resources; memory_key and
# memory_value under gpu) was reconstructed from key order - confirm against
# the consumer's schema.
# NOTE(review): gpu_key values look like Kubernetes extended-resource names,
# and memory_value on the vgpu entries looks like a per-device memory amount;
# neither is established by this file - confirm with the consumer.
resource_packages:

  # ---- device_label A10080G (nvidia.com/gpu) ----
  - name: contest_on_demand_a100_x1
    description: 适用于非常驻服务7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 4
      gpu:
        type: gpu
        device_label: A10080G
        gpu_key: nvidia.com/gpu
        gpu_value: 1
        memory_key: null
        memory_value: null

  - name: contest_on_demand_a100_x4
    description: 适用于非常驻服务7b/14b-int4推理
    resources:
      memory: 100Gi
      cpu: 5
      gpu:
        type: gpu
        device_label: A10080G
        gpu_key: nvidia.com/gpu
        gpu_value: 4
        memory_key: null
        memory_value: null

  # ---- device_label '3090' (nvidia.com/gpu), "Ephemeral" packages ----
  # The label is quoted so that it stays a string rather than an integer.
  - name: Ephemeral-RTX3090*1
    description: 适用于非常驻服务7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 4
      gpu:
        type: gpu
        device_label: '3090'
        gpu_key: nvidia.com/gpu
        gpu_value: 1
        memory_key: null
        memory_value: null

  - name: Ephemeral-RTX3090*2
    description: 适用于非常驻服务7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 4
      gpu:
        type: gpu
        device_label: '3090'
        gpu_key: nvidia.com/gpu
        gpu_value: 2
        memory_key: null
        memory_value: null

  # ---- device_label R200-8F (baidu.com/xpu) ----
  - name: R200-8F*1
    description: 适用于7b/14b-int4推理
    resources:
      memory: 100Gi
      cpu: 20
      gpu:
        type: gpu
        device_label: R200-8F
        gpu_key: baidu.com/xpu
        gpu_value: 1
        memory_key: null
        memory_value: null

  - name: R200-8F*2
    description: 适用于7b/14b-int4推理
    resources:
      memory: 100Gi
      cpu: 20
      gpu:
        type: gpu
        device_label: R200-8F
        gpu_key: baidu.com/xpu
        gpu_value: 2
        memory_key: null
        memory_value: null

  - name: R200-8F*4
    description: 适用于7b/14b-int4推理
    resources:
      memory: 100Gi
      cpu: 20
      gpu:
        type: gpu
        device_label: R200-8F
        gpu_key: baidu.com/xpu
        gpu_value: 4
        memory_key: null
        memory_value: null

  # ---- device_label MLU370-X4 (cambricon.com/mlu) ----
  - name: MLU370-X4*1
    description: 适用于7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: MLU370-X4
        gpu_key: cambricon.com/mlu
        gpu_value: 1
        memory_key: null
        memory_value: null

  - name: MLU370-X4*2
    description: 适用于7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: MLU370-X4
        gpu_key: cambricon.com/mlu
        gpu_value: 2
        memory_key: null
        memory_value: null

  # ---- device_label Iluvatar MR-V100 (iluvatar.ai/gpu) ----
  - name: MR-V100*1
    description: 适用于7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: Iluvatar MR-V100
        gpu_key: iluvatar.ai/gpu
        gpu_value: 1
        memory_key: null
        memory_value: null

  - name: MR-V100*2
    description: 适用于7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: Iluvatar MR-V100
        gpu_key: iluvatar.ai/gpu
        gpu_value: 2
        memory_key: null
        memory_value: null

  - name: MR-V100*4
    description: 适用于7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: Iluvatar MR-V100
        gpu_key: iluvatar.ai/gpu
        gpu_value: 4
        memory_key: null
        memory_value: null

  # ---- device_label NVIDIA GeForce RTX 3090 (nvidia.com/gpu), type gpu ----
  # NOTE(review): this name starts with a space, unlike RTX3090*2 and
  # RTX3090*4 below. Kept verbatim because consumers may match on the exact
  # string - confirm whether the leading space is intentional.
  - name: ' RTX3090*1'
    description: 适用于7b/14b-int4推理
    resources:
      memory: 20Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: NVIDIA GeForce RTX 3090
        gpu_key: nvidia.com/gpu
        gpu_value: 1
        memory_key: null
        memory_value: null

  - name: RTX3090*2
    description: 适用于 sagegpt / 34b-int4
    resources:
      memory: 80Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: NVIDIA GeForce RTX 3090
        gpu_key: nvidia.com/gpu
        gpu_value: 2
        memory_key: null
        memory_value: null

  # NOTE(review): the description ends with a trailing space (hence the
  # quotes), and memory is 40Gi although the two-device package above has
  # 80Gi - confirm both are intended.
  - name: RTX3090*4
    description: '适用于 72b-int4 '
    resources:
      memory: 40Gi
      cpu: 10
      gpu:
        type: gpu
        device_label: NVIDIA GeForce RTX 3090
        gpu_key: nvidia.com/gpu
        gpu_value: 4
        memory_key: null
        memory_value: null

  # ---- device_label NVIDIA GeForce RTX 3090 (nvidia.com/gpu), type vgpu ----
  # These are the only entries with a non-null memory_value; it is a quoted
  # string, not a number. memory_key is null on all of them.
  - name: vmemory-24Gi
    description: 适用于14b-int4/7b模型上线推理
    resources:
      memory: 20Gi
      cpu: 10
      gpu:
        type: vgpu
        device_label: NVIDIA GeForce RTX 3090
        gpu_key: nvidia.com/gpu
        gpu_value: 1
        memory_key: null
        memory_value: '24'

  # NOTE(review): the description ends with a trailing space (hence the
  # quotes) - confirm it is intended.
  - name: vmemory-2-48Gi
    description: '适用于式说大模型 '
    resources:
      memory: 100Gi
      cpu: 10
      gpu:
        type: vgpu
        device_label: NVIDIA GeForce RTX 3090
        gpu_key: nvidia.com/gpu
        gpu_value: 2
        memory_key: null
        memory_value: '24'

  # NOTE(review): memory_value is '24', the same as vmemory-24Gi, although
  # the package name says 10Gi - confirm whether '10' was meant.
  - name: vmemory-10Gi
    description: 适用于7b-int4/embedding模型上线推理
    resources:
      memory: 10Gi
      cpu: 1
      gpu:
        type: vgpu
        device_label: NVIDIA GeForce RTX 3090
        gpu_key: nvidia.com/gpu
        gpu_value: 1
        memory_key: null
        memory_value: '24'