Skip to content

alpha-hack-program/model-server

Folders and files

NameName
Last commit message
Last commit date

Latest commit

 

History

14 Commits
 
 
 
 
 
 
 
 
 
 

Repository files navigation

model-server

apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  name: vllm-mistral-7b
  namespace: openshift-gitops
  annotations:
    argocd.argoproj.io/compare-options: IgnoreExtraneous
    argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
spec:
  project: default
  destination:
    server: 'https://kubernetes.default.svc'
    namespace: vllm-mistral-7b
  source:
    path: .
    repoURL: https://github.com/alpha-hack-program/model-server.git
    targetRevision: main
    helm:
      parameters:
        - name: instanceName
          value: "vllm-mistral-7b"
        - name: dataScienceProjectNamespace
          value: "vllm-mistral-7b"
        - name: dataScienceProjectDisplayName
          value: "vllm-mistral-7b"
        - name: model.root
          value: mistralai
        - name: model.id
          value: Mistral-7B-Instruct-v0.2
        - name: model.name
          value: mistral-7b
        - name: model.displayName
          value: "Mistral 7b"
        - name: model.maxModelLen
          value: '6144'
        - name: model.runtime.displayName
          value: "vLLM Mistral 7B"
        - name: model.runtime.templateName
          value: "vllm-mistral-7b-serving-template"
        - name: model.accelerator.productName
          value: "NVIDIA-A10G"
        - name: model.accelerator.min
          value: '1'
        - name: model.accelerator.max
          value: '1'
  syncPolicy:
    automated:
      # prune: true
      selfHeal: true
apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  name: vllm-llama-3-8b
  namespace: openshift-gitops
  annotations:
    argocd.argoproj.io/compare-options: IgnoreExtraneous
    argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
spec:
  project: default
  destination:
    server: 'https://kubernetes.default.svc'
    namespace: vllm-llama-3-8b
  source:
    path: .
    repoURL: https://github.com/alpha-hack-program/model-server.git
    targetRevision: main
    helm:
      parameters:
        - name: instanceName
          value: "vllm-llama-3-8b"
        - name: dataScienceProjectNamespace
          value: "vllm-llama-3-8b"
        - name: dataScienceProjectDisplayName
          value: "vllm-llama-3-8b"
        - name: model.root
          value: meta-llama
        - name: model.id
          value: Meta-Llama-3-8B-Instruct
        - name: model.name
          value: llama-3-8b
        - name: model.displayName
          value: "Llama 3 8B"
        - name: model.runtime.displayName
          value: "vLLM Llama 3 8B"
        - name: model.runtime.templateName
          value: "vllm-llama-3-8b-serving-template"
        - name: model.accelerator.productName
          value: "NVIDIA-A10G"
        - name: model.accelerator.min
          value: '1'
        - name: model.accelerator.max
          value: '1'
  syncPolicy:
    automated:
      # prune: true
      selfHeal: true
apiVersion: argoproj.io/v1alpha1
kind: Application
metadata:
  name: vllm-granite-8b
  namespace: openshift-gitops
  annotations:
    argocd.argoproj.io/compare-options: IgnoreExtraneous
    argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
spec:
  project: default
  destination:
    server: 'https://kubernetes.default.svc'
    namespace: vllm-granite-8b
  source:
    path: .
    repoURL: https://github.com/alpha-hack-program/model-server.git
    targetRevision: main
    helm:
      parameters:
        - name: instanceName
          value: "vllm-granite-8b"
        - name: dataScienceProjectNamespace
          value: "vllm-granite-8b"
        - name: dataScienceProjectDisplayName
          value: "vllm-granite-8b"
        - name: model.root
          value: ibm-granite
        - name: model.id
          value: granite-8b-code-instruct
        - name: model.name
          value: granite-8b
        - name: model.displayName
          value: "Granite 8B Code Instruct"
        - name: model.maxModelLen
          value: '4096'
        - name: model.runtime.displayName
          value: "vLLM Granite 3 8B"
        - name: model.runtime.templateName
          value: "vllm-granite-8b-serving-template"
        - name: model.accelerator.productName
          value: "NVIDIA-A10G"
        - name: model.accelerator.min
          value: '1'
        - name: model.accelerator.max
          value: '1'
  syncPolicy:
    automated:
      # prune: true
      selfHeal: true

About

No description, website, or topics provided.

Resources

Stars

Watchers

Forks

Releases

No releases published

Packages

No packages published

Languages