Skip to content

Commit

Permalink
remove deprecated owner field in models chart (#336)
Browse files Browse the repository at this point in the history
  • Loading branch information
samos123 authored Dec 4, 2024
1 parent bcda5c2 commit 5c73336
Show file tree
Hide file tree
Showing 24 changed files with 3 additions and 37 deletions.
4 changes: 3 additions & 1 deletion charts/models/templates/models.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -7,7 +7,9 @@ metadata:
name: {{ $name }}
spec:
features: {{ $model.features }}
owner: {{ $model.owner }}
{{- with $model.owner }}
owner: {{ . }}
{{- end }}
url: {{ $model.url }}
{{- with $model.adapters }}
adapters:
Expand Down
14 changes: 0 additions & 14 deletions charts/models/values.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -27,7 +27,6 @@ catalog:
e5-mistral-7b-instruct-cpu:
enabled: false
features: ["TextEmbedding"]
owner: intfloat
url: "hf://intfloat/e5-mistral-7b-instruct"
engine: VLLM
# TODO: Adjust - the memory associated with this request is too low.
Expand All @@ -38,14 +37,12 @@ catalog:
gemma2-2b-cpu:
enabled: false
features: ["TextGeneration"]
owner: google
url: "ollama://gemma2:2b"
engine: OLlama
resourceProfile: cpu:2
gemma-2b-it-tpu:
enabled: false
features: ["TextGeneration"]
owner: google
url: "hf://google/gemma-2b-it"
engine: VLLM
resourceProfile: google-tpu-v5e-1x1:1
Expand All @@ -54,7 +51,6 @@ catalog:
# gemma2-9b-it-fp8-tpu:
# enabled: false
# features: ["TextGeneration"]
# owner: neuralmagic
# # vLLM logs: "ValueError: fp8 quantization is currently not supported in TPU Backend."
# #url: "hf://neuralmagic/gemma-2-9b-it-FP8"
# engine: VLLM
Expand All @@ -64,7 +60,6 @@ catalog:
# gemma2-9b-it-int8-tpu:
# enabled: false
# features: ["TextGeneration"]
# owner: neuralmagic
# # vLLM logs: "ValueError: compressed-tensors quantization is currently not supported in TPU Backend."
# #url: "hf://neuralmagic/gemma-2-9b-it-quantized.w8a8"
# #url: "hf://neuralmagic/gemma-2-9b-it-quantized.w8a16"
Expand All @@ -76,7 +71,6 @@ catalog:
llama-3.1-8b-instruct-cpu:
enabled: false
features: ["TextGeneration"]
owner: "meta-llama"
url: "hf://meta-llama/Meta-Llama-3.1-8B-Instruct"
engine: VLLM
resourceProfile: cpu:6
Expand All @@ -88,7 +82,6 @@ catalog:
llama-3.1-8b-instruct-tpu:
enabled: false
features: ["TextGeneration"]
owner: meta-llama
url: "hf://meta-llama/Meta-Llama-3.1-8B-Instruct"
engine: VLLM
resourceProfile: google-tpu-v5e-2x2:4
Expand Down Expand Up @@ -120,7 +113,6 @@ catalog:
llama-3.1-8b-instruct-fp8-l4:
enabled: false
features: ["TextGeneration"]
owner: "neuralmagic"
url: "hf://neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8"
engine: VLLM
resourceProfile: nvidia-gpu-l4:1
Expand Down Expand Up @@ -242,30 +234,26 @@ catalog:
nomic-embed-text-cpu:
enabled: false
features: ["TextEmbedding"]
owner: nomic
url: "ollama://nomic-embed-text"
engine: OLlama
resourceProfile: cpu:1
bge-embed-text-cpu:
enabled: false
features: ["TextEmbedding"]
owner: baai
url: "hf://BAAI/bge-small-en-v1.5"
engine: Infinity
resourceProfile: cpu:1
# Opt #
opt-125m-cpu:
enabled: false
features: ["TextGeneration"]
owner: facebook
url: "hf://facebook/opt-125m"
engine: VLLM
# TODO: Adjust - the memory associated with this request is too low.
resourceProfile: cpu:1
opt-125m-l4:
enabled: false
features: ["TextGeneration"]
owner: facebook
url: "hf://facebook/opt-125m"
engine: VLLM
resourceProfile: nvidia-gpu-l4:1
Expand Down Expand Up @@ -299,14 +287,12 @@ catalog:
qwen2-500m-cpu:
enabled: false
features: ["TextGeneration"]
owner: alibaba
url: "ollama://qwen2:0.5b"
engine: OLlama
resourceProfile: cpu:1
faster-whisper-medium-en-cpu:
enabled: false
features: ["SpeechToText"]
owner: Systran
url: "hf://Systran/faster-whisper-medium.en"
engine: FasterWhisper
resourceProfile: cpu:1
1 change: 0 additions & 1 deletion manifests/models/bge-embed-text-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: bge-embed-text-cpu
spec:
features: [TextEmbedding]
owner: baai
url: hf://BAAI/bge-small-en-v1.5
engine: Infinity
resourceProfile: cpu:1
1 change: 0 additions & 1 deletion manifests/models/e5-mistral-7b-instruct-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: e5-mistral-7b-instruct-cpu
spec:
features: [TextEmbedding]
owner: intfloat
url: hf://intfloat/e5-mistral-7b-instruct
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/faster-whisper-medium-en-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: faster-whisper-medium-en-cpu
spec:
features: [SpeechToText]
owner: Systran
url: hf://Systran/faster-whisper-medium.en
engine: FasterWhisper
resourceProfile: cpu:1
1 change: 0 additions & 1 deletion manifests/models/gemma-2b-it-tpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: gemma-2b-it-tpu
spec:
features: [TextGeneration]
owner: google
url: hf://google/gemma-2b-it
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/gemma2-2b-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: gemma2-2b-cpu
spec:
features: [TextGeneration]
owner: google
url: ollama://gemma2:2b
engine: OLlama
resourceProfile: cpu:2
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-405b-instruct-fp8-a100-80b.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-405b-instruct-fp8-a100-80b
spec:
features: [TextGeneration]
owner:
url: hf://neuralmagic/Meta-Llama-3.1-405B-Instruct-FP8
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-405b-instruct-fp8-h100.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-405b-instruct-fp8-h100
spec:
features: [TextGeneration]
owner:
url: hf://neuralmagic/Meta-Llama-3.1-405B-Instruct-FP8
engine: VLLM
args:
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-70b-instruct-awq-int4-gh200
spec:
features: [TextGeneration]
owner:
url: hf://hugging-quants/Meta-Llama-3.1-70B-Instruct-AWQ-INT4
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-70b-instruct-fp8-gh200.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-70b-instruct-fp8-gh200
spec:
features: [TextGeneration]
owner:
url: hf://neuralmagic/Meta-Llama-3.1-70B-Instruct-FP8
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-70b-instruct-fp8-h100.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-70b-instruct-fp8-h100
spec:
features: [TextGeneration]
owner:
url: hf://neuralmagic/Meta-Llama-3.1-70B-Instruct-FP8
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-70b-instruct-fp8-l4.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-70b-instruct-fp8-l4
spec:
features: [TextGeneration]
owner:
url: hf://neuralmagic/Meta-Llama-3.1-70B-Instruct-FP8
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-8b-instruct-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-8b-instruct-cpu
spec:
features: [TextGeneration]
owner: meta-llama
url: hf://meta-llama/Meta-Llama-3.1-8B-Instruct
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-8b-instruct-fp8-l4.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-8b-instruct-fp8-l4
spec:
features: [TextGeneration]
owner: neuralmagic
url: hf://neuralmagic/Meta-Llama-3.1-8B-Instruct-FP8
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.1-8b-instruct-tpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.1-8b-instruct-tpu
spec:
features: [TextGeneration]
owner: meta-llama
url: hf://meta-llama/Meta-Llama-3.1-8B-Instruct
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/llama-3.2-11b-vision-instruct-l4.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: llama-3.2-11b-vision-instruct-l4
spec:
features: [TextGeneration]
owner:
url: hf://neuralmagic/Llama-3.2-11B-Vision-Instruct-FP8-dynamic
engine: VLLM
args:
Expand Down
1 change: 0 additions & 1 deletion manifests/models/nomic-embed-text-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: nomic-embed-text-cpu
spec:
features: [TextEmbedding]
owner: nomic
url: ollama://nomic-embed-text
engine: OLlama
resourceProfile: cpu:1
1 change: 0 additions & 1 deletion manifests/models/opt-125m-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: opt-125m-cpu
spec:
features: [TextGeneration]
owner: facebook
url: hf://facebook/opt-125m
engine: VLLM
resourceProfile: cpu:1
1 change: 0 additions & 1 deletion manifests/models/opt-125m-l4.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: opt-125m-l4
spec:
features: [TextGeneration]
owner: facebook
url: hf://facebook/opt-125m
engine: VLLM
resourceProfile: nvidia-gpu-l4:1
1 change: 0 additions & 1 deletion manifests/models/qwen2-500m-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: qwen2-500m-cpu
spec:
features: [TextGeneration]
owner: alibaba
url: ollama://qwen2:0.5b
engine: OLlama
resourceProfile: cpu:1
1 change: 0 additions & 1 deletion manifests/models/qwen2.5-7b-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: qwen2.5-7b-cpu
spec:
features: [TextGeneration]
owner:
url: ollama://qwen2.5:7b
engine: OLlama
resourceProfile: cpu:2
1 change: 0 additions & 1 deletion manifests/models/qwen2.5-coder-1.5b-cpu.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: qwen2.5-coder-1.5b-cpu
spec:
features: [TextGeneration]
owner:
url: ollama://qwen2.5-coder:1.5b
engine: OLlama
resourceProfile: cpu:1
1 change: 0 additions & 1 deletion manifests/models/qwen2.5-coder-1.5b-rtx4070-8gb.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -5,7 +5,6 @@ metadata:
name: qwen2.5-coder-1.5b-rtx4070-8gb
spec:
features: [TextGeneration]
owner:
url: hf://Qwen/Qwen2.5-Coder-1.5B-Instruct
engine: VLLM
args:
Expand Down

0 comments on commit 5c73336

Please sign in to comment.