diff --git a/docs/docs/extraction/quickstart-library-mode.md b/docs/docs/extraction/quickstart-library-mode.md index e27b7e413..9122c4e79 100644 --- a/docs/docs/extraction/quickstart-library-mode.md +++ b/docs/docs/extraction/quickstart-library-mode.md @@ -5,4 +5,3 @@ NVIDIA Ingest (nv-ingest) has been renamed to the NeMo Retriever Library. Use the [Quick Start for NeMo Retriever Library](https://github.com/NVIDIA/NeMo-Retriever/blob/26.03/nemo_retriever/README.md) to set up and run the NeMo Retriever Library locally, so you can build a GPU‑accelerated, multimodal RAG ingestion pipeline that parses PDFs, HTML, text, audio, and video into LanceDB vector embeddings, integrates with Nemotron RAG models (locally or via NIM endpoints), which includes Ray‑based scaling plus built‑in recall evaluation. - diff --git a/helm/templates/llama-nemotron-embed-1b-v2.yaml b/helm/templates/llama-nemotron-embed-1b-v2.yaml index 199bcdc9c..de0b429b7 100644 --- a/helm/templates/llama-nemotron-embed-1b-v2.yaml +++ b/helm/templates/llama-nemotron-embed-1b-v2.yaml @@ -17,6 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.embedqa.storage.pvc.storageClass }} size: {{ .Values.nimOperator.embedqa.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.embedqa.storage.pvc.volumeAccessMode }} + nodeSelector: +{{ toYaml .Values.nimOperator.embedqa.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.embedqa.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService diff --git a/helm/templates/llama-nemotron-rerank-1b-v2.yaml b/helm/templates/llama-nemotron-rerank-1b-v2.yaml index 6cfc2fcfc..e85490a30 100644 --- a/helm/templates/llama-nemotron-rerank-1b-v2.yaml +++ b/helm/templates/llama-nemotron-rerank-1b-v2.yaml @@ -17,6 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.rerankqa.storage.pvc.storageClass }} size: {{ .Values.nimOperator.rerankqa.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.rerankqa.storage.pvc.volumeAccessMode }} + nodeSelector: +{{ toYaml .Values.nimOperator.rerankqa.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.rerankqa.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService diff --git a/helm/templates/nemotron-graphic-elements-v1.yaml b/helm/templates/nemotron-graphic-elements-v1.yaml index 1fbdcbaf7..1549991e5 100644 --- a/helm/templates/nemotron-graphic-elements-v1.yaml +++ b/helm/templates/nemotron-graphic-elements-v1.yaml @@ -17,6 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.graphic_elements.storage.pvc.storageClass }} size: {{ .Values.nimOperator.graphic_elements.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.graphic_elements.storage.pvc.volumeAccessMode }} + nodeSelector: +{{ toYaml .Values.nimOperator.graphic_elements.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.graphic_elements.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService diff --git a/helm/templates/nemotron-nano-12b-v2-vl.yaml b/helm/templates/nemotron-nano-12b-v2-vl.yaml index 1b5c1ca9d..a8ffaf8e3 100644 --- a/helm/templates/nemotron-nano-12b-v2-vl.yaml +++ b/helm/templates/nemotron-nano-12b-v2-vl.yaml @@ -17,6 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.nemotron_nano_12b_v2_vl.storage.pvc.storageClass }} size: {{ .Values.nimOperator.nemotron_nano_12b_v2_vl.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.nemotron_nano_12b_v2_vl.storage.pvc.volumeAccessMode }} + nodeSelector: +{{ toYaml .Values.nimOperator.nemotron_nano_12b_v2_vl.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.nemotron_nano_12b_v2_vl.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService @@ -34,6 +38,8 @@ spec: nimCache: name: nemotron-nano-12b-v2-vl replicas: {{ .Values.nimOperator.nemotron_nano_12b_v2_vl.replicas }} + nodeSelector: +{{ toYaml .Values.nimOperator.nemotron_nano_12b_v2_vl.nodeSelector | nindent 4 }} resources: {{ toYaml .Values.nimOperator.nemotron_nano_12b_v2_vl.resources | nindent 4 }} tolerations: diff --git a/helm/templates/nemotron-ocr-v1.yaml b/helm/templates/nemotron-ocr-v1.yaml index 7ae0f2dea..60ab1a0ce 100644 --- a/helm/templates/nemotron-ocr-v1.yaml +++ b/helm/templates/nemotron-ocr-v1.yaml @@ -17,6 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.ocr.storage.pvc.storageClass }} size: {{ .Values.nimOperator.ocr.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.ocr.storage.pvc.volumeAccessMode }} + nodeSelector: +{{ toYaml .Values.nimOperator.ocr.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.ocr.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService diff --git a/helm/templates/nemotron-page-elements-v3.yaml b/helm/templates/nemotron-page-elements-v3.yaml index 223c7db24..2f8aa3ee4 100644 --- a/helm/templates/nemotron-page-elements-v3.yaml +++ b/helm/templates/nemotron-page-elements-v3.yaml @@ -17,7 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.page_elements.storage.pvc.storageClass }} size: {{ .Values.nimOperator.page_elements.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.page_elements.storage.pvc.volumeAccessMode }} - resources: {} + nodeSelector: +{{ toYaml .Values.nimOperator.page_elements.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.page_elements.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService diff --git a/helm/templates/nemotron-parse.yaml b/helm/templates/nemotron-parse.yaml index 25f3e07ac..114aa1c39 100644 --- a/helm/templates/nemotron-parse.yaml +++ b/helm/templates/nemotron-parse.yaml @@ -17,6 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.nemotron_parse.storage.pvc.storageClass }} size: {{ .Values.nimOperator.nemotron_parse.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.nemotron_parse.storage.pvc.volumeAccessMode }} + nodeSelector: +{{ toYaml .Values.nimOperator.nemotron_parse.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.nemotron_parse.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService @@ -34,6 +38,8 @@ spec: nimCache: name: nemotron-parse replicas: {{ .Values.nimOperator.nemotron_parse.replicas }} + nodeSelector: +{{ toYaml .Values.nimOperator.nemotron_parse.nodeSelector | nindent 4 }} resources: {{ toYaml .Values.nimOperator.nemotron_parse.resources | nindent 4 }} tolerations: diff --git a/helm/templates/nemotron-table-structure-v1.yaml b/helm/templates/nemotron-table-structure-v1.yaml index b305a1e09..0320e9246 100644 --- a/helm/templates/nemotron-table-structure-v1.yaml +++ b/helm/templates/nemotron-table-structure-v1.yaml @@ -17,6 +17,10 @@ spec: storageClass: {{ .Values.nimOperator.table_structure.storage.pvc.storageClass }} size: {{ .Values.nimOperator.table_structure.storage.pvc.size }} volumeAccessMode: {{ .Values.nimOperator.table_structure.storage.pvc.volumeAccessMode }} + nodeSelector: +{{ toYaml .Values.nimOperator.table_structure.nodeSelector | nindent 4 }} + tolerations: +{{ toYaml .Values.nimOperator.table_structure.tolerations | nindent 4 }} --- apiVersion: apps.nvidia.com/v1alpha1 kind: NIMService