Skip to content

Commit 37883f7

Browse files
committed
Some nemotron replacements
1 parent 9d2091f commit 37883f7

10 files changed

+8
-8
lines changed

helm/README.md

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -298,7 +298,7 @@ You can also use NV-Ingest's Python client API to interact with the service runn
298298
| envVars.AUDIO_GRPC_ENDPOINT | string | `"audio:50051"` | |
299299
| envVars.AUDIO_INFER_PROTOCOL | string | `"grpc"` | |
300300
| envVars.COMPONENTS_TO_READY_CHECK | string | `"ALL"` | |
301-
| envVars.EMBEDDING_NIM_ENDPOINT | string | `"http://llama-32-nv-embedqa-1b-v2:8000/v1"` | |
301+
| envVars.EMBEDDING_NIM_ENDPOINT | string | `"http://llama-nemotron-embed-1b-v2:8000/v1"` | |
302302
| envVars.EMBEDDING_NIM_MODEL_NAME | string | `"nvidia/llama-nemotron-embed-1b-v2"` | |
303303
| envVars.IMAGE_STORAGE_PUBLIC_BASE_URL | string | `""` | |
304304
| envVars.IMAGE_STORAGE_URI | string | `"s3://nv-ingest/artifacts/store/images"` | |

helm/mig/nv-ingest-mig-values-25x.yaml

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -38,7 +38,7 @@ nemotron-table-structure-v1:
3838
nvidia.com/gpu: 0
3939
nvidia.com/mig-1g.10gb: 1
4040

41-
nvidia-nim-llama-32-nv-embedqa-1b-v2:
41+
nvidia-nim-llama-nemotron-embed-1b-v2:
4242
resources:
4343
limits:
4444
nvidia.com/gpu: 0
@@ -75,8 +75,8 @@ text-embedding-nim:
7575
nvidia.com/gpu: 0
7676
nvidia.com/mig-1g.10gb: 1
7777

78-
# If you want to deploy llama-32-nv-rerankqa-1b-v2
79-
llama-32-nv-rerankqa-1b-v2:
78+
# If you want to deploy llama-nemotron-rerank-1b-v2
79+
llama-nemotron-rerank-1b-v2:
8080
resources:
8181
limits:
8282
nvidia.com/gpu: 0

helm/mig/nv-ingest-mig-values.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -48,7 +48,7 @@ nimOperator:
4848
nvidia.com/gpu: "0"
4949
nvidia.com/mig-1g.20gb: 1
5050

51-
# If you want to deploy llama-32-nv-rerankqa-1b-v2
51+
# If you want to deploy llama-nemotron-rerank-1b-v2
5252
llama_3_2_nv_rerankqa_1b_v2:
5353
enabled: true
5454
resources:

helm/templates/llama-3.2-nv-embedqa-1b-v2.yaml renamed to helm/templates/llama-nemotron-embed-1b-v2.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@ spec:
2121
apiVersion: apps.nvidia.com/v1alpha1
2222
kind: NIMService
2323
metadata:
24-
name: llama-32-nv-embedqa-1b-v2
24+
name: llama-nemotron-embed-1b-v2
2525
spec:
2626
image:
2727
repository: {{ .Values.nimOperator.embedqa.image.repository }}

helm/templates/llama-3.2-nv-rerankqa-1b-v2.yaml renamed to helm/templates/llama-nemotron-rerank-1b-v2.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -21,7 +21,7 @@ spec:
2121
apiVersion: apps.nvidia.com/v1alpha1
2222
kind: NIMService
2323
metadata:
24-
name: llama-32-nv-rerankqa-1b-v2
24+
name: llama-nemotron-rerank-1b-v2
2525
spec:
2626
image:
2727
repository: {{ .Values.nimOperator.llama_3_2_nv_rerankqa_1b_v2.image.repository }}
File renamed without changes.
File renamed without changes.
File renamed without changes.

helm/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -170,7 +170,7 @@ envVars:
170170
AUDIO_GRPC_ENDPOINT: "audio:50051"
171171
AUDIO_INFER_PROTOCOL: "grpc"
172172

173-
EMBEDDING_NIM_ENDPOINT: "http://llama-32-nv-embedqa-1b-v2:8000/v1"
173+
EMBEDDING_NIM_ENDPOINT: "http://llama-nemotron-embed-1b-v2:8000/v1"
174174
EMBEDDING_NIM_MODEL_NAME: "nvidia/llama-nemotron-embed-1b-v2"
175175

176176
NEMOTRON_PARSE_HTTP_ENDPOINT: http://nemotron-parse:8000/v1/chat/completions

0 commit comments

Comments
 (0)