master

分支 (13)

标签 (22)

管理

管理

master

branch_v7.1.RC1

branch_v7.0.0-RC1

branch_v6.0.0

branch_v6.0.0-RC3

branch_v6.0.0-RC2

branch_v6.0.0-RC1

branch_V5.0.RC2

20211230-v2.0.4

2022930-V3.0.RC3

2022330-V3.0.RC1

2022630-V3.0.RC2

20210330-V2.0.1-bugfix

20250117-V6.0.0

20240720-V6.0.RC2

20240520-V6.0.RC1

20240105-V5.0.0

20231110-V5.0.RC3.2

20231025-V5.0.RC3.1

2023930-V5.0.RC3

2023915-V5.0.RC2.2

2023815-V5.0.RC2.1

2023630-V5.0.RC2

2023330-V5.0.RC1

20221230-V3.0.0

2022930-V3.0.RC3

2022630-V3.0.RC2

2022330-V3.0.RC1

20211230-V2.0.4

20210930-V2.0.3

20210715-V2.0.2

20210330-V2.0.1-bugfix

20210330-V2.0.1

mindxdl-deploy/samples/inference/volcano/infer-vcjob-910.yaml

---
# Volcano Job (vcjob) that runs a single inference pod requesting one
# huawei.com/Ascend910 device.
apiVersion: batch.volcano.sh/v1alpha1
kind: Job
metadata:
  name: mindx-infer-test
  # Select a proper namespace based on the site requirements.
  namespace: vcjob
  labels:
    ring-controller.atlas: ascend-910b
    fault-scheduling: "force"
spec:
  # Keep minAvailable at 1 for an inference task (single-node scenario).
  minAvailable: 1
  # Use the Volcano scheduler to schedule jobs.
  schedulerName: volcano
  # Restart the whole job when one of its pods is evicted.
  policies:
    - event: PodEvicted
      action: RestartJob
  maxRetry: 3
  queue: default
  tasks:
    - name: "default-test"
      # Keep replicas at 1 for an inference task (single-node scenario).
      replicas: 1
      template:
        metadata:
          labels:
            app: infer
            ring-controller.atlas: ascend-910b
        spec:
          automountServiceAccountToken: false
          containers:
            # Inference image, which can be modified.
            - image: infer_image:latest
              imagePullPolicy: IfNotPresent
              name: infer
              command: ["/bin/bash", "-c", "./infer.sh"]
              env:
                # ASCEND_VISIBLE_DEVICES is used by ascend-docker-runtime in
                # the whole-card scheduling scenario with the Volcano
                # scheduler. Delete it in the static or dynamic vNPU
                # scheduling scenarios, or when Volcano is not used.
                - name: ASCEND_VISIBLE_DEVICES
                  valueFrom:
                    fieldRef:
                      # The annotation key must match the resource name used
                      # under resources.requests.
                      fieldPath: metadata.annotations['huawei.com/Ascend910']
              resources:
                requests:
                  # Number of required NPUs. The maximum value is 2.
                  # NOTE(review): the nodeSelector targets module-910b-8 -
                  # confirm this maximum still applies to that server type.
                  # Add lines below to configure resources such as memory
                  # and CPU.
                  huawei.com/Ascend910: 1
                limits:
                  # Must be consistent with the value in requests.
                  huawei.com/Ascend910: 1
              volumeMounts:
                # The container time must be the same as the host time.
                - name: localtime
                  mountPath: /etc/localtime
          nodeSelector:
            # Configure the label based on the actual job.
            host-arch: huawei-arm
            # Servers with Atlas 800I A2 cards.
            accelerator-type: module-910b-8
          volumes:
            - name: localtime
              hostPath:
                path: /etc/localtime
          restartPolicy: OnFailure