Skip to content

Latest commit

 

History

History
155 lines (152 loc) · 4.33 KB

README.md

File metadata and controls

155 lines (152 loc) · 4.33 KB

model-server

apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  name: vllm-mistral-7b
  namespace: openshift-gitops
  annotations:
    argocd.argoproj.io/compare-options: IgnoreExtraneous
    argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
spec:
  project: default
  destination:
    server: 'https://kubernetes.default.svc'
    namespace: vllm-mistral-7b
  source:
    path: .
    repoURL: https://github.com/alpha-hack-program/model-server.git
    targetRevision: main
    helm:
      parameters:
        - name: instanceName
          value: "vllm-mistral-7b"
        - name: dataScienceProjectNamespace
          value: "vllm-mistral-7b"
        - name: dataScienceProjectDisplayName
          value: "vllm-mistral-7b"
        - name: model.root
          value: mistralai
        - name: model.id
          value: Mistral-7B-Instruct-v0.2
        - name: model.name
          value: mistral-7b
        - name: model.displayName
          value: "Mistral 7b"
        - name: model.maxModelLen
          value: '6144'
        - name: model.runtime.displayName
          value: "vLLM Mistral 7B"
        - name: model.runtime.templateName
          value: "vllm-mistral-7b-serving-template"
        - name: model.accelerator.productName
          value: "NVIDIA-A10G"
        - name: model.accelerator.min
          value: '1'
        - name: model.accelerator.max
          value: '1'
  syncPolicy:
    automated:
      # prune: true
      selfHeal: true
apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  name: vllm-llama-3-8b
  namespace: openshift-gitops
  annotations:
    argocd.argoproj.io/compare-options: IgnoreExtraneous
    argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
spec:
  project: default
  destination:
    server: 'https://kubernetes.default.svc'
    namespace: vllm-llama-3-8b
  source:
    path: .
    repoURL: https://github.com/alpha-hack-program/model-server.git
    targetRevision: main
    helm:
      parameters:
        - name: instanceName
          value: "vllm-llama-3-8b"
        - name: dataScienceProjectNamespace
          value: "vllm-llama-3-8b"
        - name: dataScienceProjectDisplayName
          value: "vllm-llama-3-8b"
        - name: model.root
          value: meta-llama
        - name: model.id
          value: Meta-Llama-3-8B-Instruct
        - name: model.name
          value: llama-3-8b
        - name: model.displayName
          value: "Llama 3 8B"
        - name: model.runtime.displayName
          value: "vLLM Llama 3 8B"
        - name: model.runtime.templateName
          value: "vllm-llama-3-8b-serving-template"
        - name: model.accelerator.productName
          value: "NVIDIA-A10G"
        - name: model.accelerator.min
          value: '1'
        - name: model.accelerator.max
          value: '1'
  syncPolicy:
    automated:
      # prune: true
      selfHeal: true
apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  name: vllm-granite-8b
  namespace: openshift-gitops
  annotations:
    argocd.argoproj.io/compare-options: IgnoreExtraneous
    argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
spec:
  project: default
  destination:
    server: 'https://kubernetes.default.svc'
    namespace: vllm-granite-8b
  source:
    path: .
    repoURL: https://github.com/alpha-hack-program/model-server.git
    targetRevision: main
    helm:
      parameters:
        - name: instanceName
          value: "vllm-granite-8b"
        - name: dataScienceProjectNamespace
          value: "vllm-granite-8b"
        - name: dataScienceProjectDisplayName
          value: "vllm-granite-8b"
        - name: model.root
          value: ibm-granite
        - name: model.id
          value: granite-8b-code-instruct
        - name: model.name
          value: granite-8b
        - name: model.displayName
          value: "Granite 8B Code Instruct"
        - name: model.maxModelLen
          value: '4096'
        - name: model.runtime.displayName
          value: "vLLM Granite 3 8B"
        - name: model.runtime.templateName
          value: "vllm-granite-8b-serving-template"
        - name: model.accelerator.productName
          value: "NVIDIA-A10G"
        - name: model.accelerator.min
          value: '1'
        - name: model.accelerator.max
          value: '1'
  syncPolicy:
    automated:
      # prune: true
      selfHeal: true