forked from NVIDIA/nv-ingest
-
Notifications
You must be signed in to change notification settings - Fork 0
/
values.yaml
534 lines (474 loc) · 19.8 KB
/
values.yaml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
## @section Deployment parameters
## ref: https://kubernetes.io/docs/concepts/scheduling-eviction/assign-pod-node/#affinity-and-anti-affinity
## @param affinity [object] [default: {}] Affinity settings for deployment.
affinity: {}
## @param nodeSelector [object] Sets node selectors for the NIM -- for example `nvidia.com/gpu.present: "true"`
nodeSelector: {}
## @param logLevel Log level of NVIngest service. Possible values of the variable are TRACE, DEBUG, INFO, WARNING, ERROR, CRITICAL.
logLevel: DEBUG
## @param extraEnvVarsCM [string] [default: ""] A Config map holding Enviroment variables to include in the NVIngest containerextraEnvVarsCM: ""
extraEnvVarsCM: ""
## @param extraEnvVarsSecret [string] [default: ""] A K8S Secret to map to Enviroment variables to include in the NVIngest container
extraEnvVarsSecret: ""
## @param fullnameOverride [string] [default: ""] A name to force the fullname of the NVIngest container to have, defaults to the Helm Release Name
fullnameOverride: ""
## @param nameOverride [string] [default: ""] A name to base the objects created by this helm chart
nameOverride: ""
## @param image.repository [string] NIM Image Repository
## @param image.tag [string] Image tag or version
## @param image.pullPolicy [string] Image pull policy
image:
pullPolicy: IfNotPresent
repository: "nvcr.io/ohlfw0olaadg/ea-participants/nv-ingest"
tag: "24.08"
## @param podAnnotations [object] Sets additional annotations on the main deployment pods
podAnnotations:
traffic.sidecar.istio.io/excludeOutboundPorts: '8007'
## @param podLabels [object] Specify extra labels to be add to on deployed pods.
podLabels: {}
## @extra podSecurityContext Specify privilege and access control settings for pod
## @param podSecurityContext.fsGroup Specify file system owner group id.
podSecurityContext:
fsGroup: 1000
## @param extraVolumes [object] Adds arbitrary additional volumes to the deployment set definition
extraVolumes: {}
## @param extraVolumeMounts [object] Specify volume mounts to the main container from `extraVolumes`
extraVolumeMounts: {}
## @extra imagePullSecrets Specify list of secret names that are needed for the main container and any init containers.
## @skip imagePullSecrets[0].name
imagePullSecrets:
- name: nvcrimagepullsecret
## @param containerSecurityContext [object] Sets privilege and access control settings for container (Only affects the main container, not pod-level)
containerSecurityContext: {}
## @skip tolerations
## @extra tolerations [ default: Empty Array ] Specify tolerations for pod assignment. Allows the scheduler to schedule pods with matching taints.
## @skip tolerations[0].key
## @skip tolerations[0].operator
## @skip tolerations[0].effect
tolerations: []
# TODO: jdyer - uncomment this when microservice is added, currently no /health endpoint exists to check ...
## @param replicaCount [default: 1] The number of replicas for NVIngest when autoscaling is disabled
replicaCount: 1
## @skip resources Specify resources limits and requests for the running service.
## @extra resources.limits."nvidia.com/gpu" Specify number of GPUs to present to the running service.
## @param resources.limits.memory [default: 32Gi] Specify limit for memory
## @param resources.requests.memory [default: 16Gi] Specify request for memory
resources:
limits:
memory: 32Gi
nvidia.com/gpu: 1
requests:
memory: 16Gi
## @param tmpDirSize [default: 8Gi] Specify the amount of space to reserve for temporary storage
tmpDirSize: 8Gi
## @section NIM Configuration
## @descriptionStart
## Define additional values to the dependent NIM helm charts by updating the "yolox-nim", "cached-nim", "deplot-nim", and "paddleocr-nim"
## values. A sane set of configurations are already included in this value file and only the "image.repository" and "image.tag" fields are
## explicitly called out here.
## @descriptionEnd
## @skip yoloxDeployed
## @skip yolox-nim
## @extra yolox-nim.image.repository The repository to override the location of the YOLOX
## @extra yolox-nim.image.tag The tag override for YOLOX
yoloxDeployed: true
yolox-nim:
fullnameOverride: nv-ingest-yolox
image:
repository: nvcr.io/ohlfw0olaadg/ea-participants/nv-yolox-structured-images-v1
tag: "0.1.0"
service:
name: nv-ingest-yolox
grpcPort: 8001
nim:
grpcPort: 8001
env:
- name: NIM_HTTP_API_PORT
value: "8000"
## @skip cachedDeployed
## @skip cached-nim
## @extra cached-nim.image.repository The repository to override the location of the Cached Model NIM
## @extra cached-nim.image.tag The tag override for Cached Model NIM
cachedDeployed: true
cached-nim:
fullnameOverride: nv-ingest-cached
image:
repository: nvcr.io/ohlfw0olaadg/ea-participants/cached
tag: "0.1.0"
service:
name: nv-ingest-cached
grpcPort: 8001
nim:
grpcPort: 8001
env:
- name: NIM_HTTP_API_PORT
value: "8000"
## @skip paddleocrDeployed
## @skip paddleocr-nim
## @extra paddleocr-nim.image.repository The repository to override the location of the Paddle OCR NIM
## @extra paddleocr-nim.image.tag The tag override for Paddle OCR NIM
paddleocrDeployed: true
paddleocr-nim:
fullnameOverride: nv-ingest-paddle
image:
repository: nvcr.io/ohlfw0olaadg/ea-participants/paddleocr
tag: "0.1.0"
service:
name: nv-ingest-paddle
grpcPort: 8001
nim:
grpcPort: 8001
env:
- name: NIM_HTTP_API_PORT
value: "8000"
## @skip deplotDeployed
## @skip deplot-nim
## @extra deplot-nim.image.repository The repository to override the location of the Deplot NIM
## @extra deplot-nim.image.tag The tag override for Deplot NIM
deplotDeployed: true
deplot-nim:
fullnameOverride: nv-ingest-deplot
image:
repository: nvcr.io/ohlfw0olaadg/ea-participants/deplot
tag: "1.0.0"
service:
name: nv-ingest-deplot
grpcPort: 8001
nim:
grpcPort: 8001
env:
- name: NIM_HTTP_API_PORT
value: "8000"
# Use this to load an image Pre NIM Factory via triton
## @skip triton
triton:
enabled: false
## @section Milvus Deployment parameters
## @descriptionStart
## NVIngest uses Milvus and Minio to store extracted images from a document
## This chart by default sets up a Milvus standalone instance in the namespace using the
## Helm chart at found https://artifacthub.io/packages/helm/milvus-helm/milvus
## @descriptionEnd
## @param milvusDeployed [default: true] Whether to deploy Milvus and Minio from this helm chart
milvusDeployed: true
## @param milvus [default: sane {}] Find values at https://artifacthub.io/packages/helm/milvus-helm/milvus
milvus:
cluster:
enabled: false
etcd:
replicaCount: 1
persistence:
storageClass: null
minio:
mode: standalone
persistence:
size: 10Gi
storageClass: null
pulsar:
enabled: false
standalone:
persistence:
persistentVolumeClaim:
size: 10Gi
storageClass: null
extraEnv:
- name: LOG_LEVEL
value: error
## @section Autoscaling parameters
## @descriptionStart
## Values used for creating a `Horizontal Pod Autoscaler`. If autoscaling is not enabled, the rest are ignored.
## NVIDIA recommends usage of the custom metrics API, commonly implemented with the prometheus-adapter.
## Standard metrics of CPU and memory are of limited use in scaling NIM.
## @descriptionEnd
## @param autoscaling.enabled Enables horizontal pod autoscaler.
## @param autoscaling.minReplicas Specify minimum replicas for autoscaling.
## @param autoscaling.maxReplicas Specify maximum replicas for autoscaling.
## @param autoscaling.metrics Array of metrics for autoscaling.
autoscaling:
enabled: false
maxReplicas: 100
minReplicas: 1
metrics: []
## @section Redis configurations
## @descriptionStart
## Include any redis configuration that you'd like with the deployed Redis
## Find values at https://github.com/bitnami/charts/tree/main/bitnami/redis
## @descriptionEnd
## @param redisDeployed [default: true] Whether to deploy Redis from this helm chart
redisDeployed: true
## @param redis [default: sane {}] Find values at https://github.com/bitnami/charts/tree/main/bitnami/redis
redis:
auth:
enabled: false
replica:
replicaCount: 1
master:
resourcesPreset: xlarge
## @section Environment Variables
## @descriptionStart
## Define environment variables as key/value dictionary pairs
## @descriptionEnd
## @param envVars [default: sane {}] Adds arbitrary environment variables to the main container using key-value pairs, for example NAME: value
## @param envVars.MESSAGE_CLIENT_HOST [default: "nv-ingest-ms-runtime"] Override this value to specify a differeing REST endpoint host.
## @param envVars.MESSAGE_CLIENT_PORT [default: "7670"] Override this value to specify a differing REST endpoint port.
## @param envVars.NV_INGEST_DEFAULT_TIMEOUT_MS [default: "1234"] Override the Timeout of the NVIngest requests.
## @param envVars.MINIO_INTERNAL_ADDRESS [default: "nv-ingest-minio:9000"] Override this to the cluster local DNS name of minio
## @param envVars.MINIO_PUBLIC_ADDRESS [default: "http://localhost:9000"] Override this to publicly routable minio address, default assumes port-forwarding
## @param envVars.MINIO_BUCKET [default: "nv-ingest"] Override this for specific minio bucket to upload extracted images to
## @skip envVars.REDIS_MORPHEUS_TASK_QUEUE
## @skip envVars.TABLE_DETECTION_GRPC_TRITON
## @skip envVars.TABLE_DETECTION_HTTP_TRITON
## @skip envVars.CACHED_GRPC_ENDPOINT
## @skip envVars.CACHED_HTTP_ENDPOINT
## @skip envVars.PADDLE_GRPC_ENDPOINT
## @skip envVars.PADDLE_HTTP_ENDPOINT
## @skip envVars.YOLOX_GRPC_ENDPOINT
## @skip envVars.YOLOX_HTTP_ENDPOINT
## @skip envVars.DEPLOT_GRPC_ENDPOINT
## @skip envVars.DEPLOT_HTTP_ENDPOINT
envVars:
MESSAGE_CLIENT_HOST: "nv-ingest-ms-runtime"
MESSAGE_CLIENT_PORT: "7670"
REDIS_MORPHEUS_TASK_QUEUE: "morpheus_task_queue"
NV_INGEST_DEFAULT_TIMEOUT_MS: "1234"
MINIO_INTERNAL_ADDRESS: nv-ingest-minio:9000
MINIO_PUBLIC_ADDRESS: http://localhost:9000
MINIO_BUCKET: nv-ingest
TABLE_DETECTION_GRPC_TRITON: nv-ingest-yolox:8001
TABLE_DETECTION_HTTP_TRITON: ""
CACHED_GRPC_ENDPOINT: nv-ingest-cached:8001
CACHED_HTTP_ENDPOINT: ""
PADDLE_GRPC_ENDPOINT: nv-ingest-paddle:8001
PADDLE_HTTP_ENDPOINT: ""
YOLOX_GRPC_ENDPOINT: nv-ingest-yolox:8001
YOLOX_HTTP_ENDPOINT: ""
DEPLOT_GRPC_ENDPOINT: ""
DEPLOT_HTTP_ENDPOINT: http://nv-ingest-deplot:8000/v1/chat/completions
EMBEDDING_NIM_ENDPOINT: "http://nv-ingest-embedding:8000/v1"
MILVUS_ENDPOINT: "http://nv-ingest-milvus:19530"
## @section Open Telemetry
## @descriptionStart
## Define environment variables as key/value dictionary pairs for configuring OTEL Deployments
## A sane set of parameters is set for the deployed version of OpenTelemetry with this Helm Chart.
## Override any values to the Open Telemetry helm chart by overriding the `open-telemetry` value.
## @descriptionEnd
## @param otelEnabled [default: true] Whether to enable OTEL collection
otelEnabled: true
## @param otelDeployed [default: true] Whether to deploy OTEL from this helm chart
otelDeployed: true
## @skip opentelemetry-collector
## @extra opentelemetry-collector [default: sane {}] Configures the opentelemetry helm chart - see https://github.com/open-telemetry/opentelemetry-helm-charts/blob/main/charts/opentelemetry-collector/values.yaml
opentelemetry-collector:
mode: deployment
config:
receivers:
otlp:
protocols:
grpc:
endpoint: '${env:MY_POD_IP}:4317'
http:
cors:
allowed_origins:
- "*"
exporters:
# NOTE: Prior to v0.86.0 use `logging` instead of `debug`.
zipkin:
endpoint: "http://nv-ingest-zipkin:9411/api/v2/spans"
debug:
verbosity: detailed
extensions:
health_check: {}
zpages:
endpoint: 0.0.0.0:55679
processors:
batch: {}
tail_sampling:
# filter out health checks
# https://github.com/open-telemetry/opentelemetry-collector/issues/2310#issuecomment-1268157484
policies:
- name: drop_noisy_traces_url
type: string_attribute
string_attribute:
key: http.target
values:
- \/health
enabled_regex_matching: true
invert_match: true
transform:
trace_statements:
- context: span
statements:
- set(status.code, 1) where attributes["http.path"] == "/health"
# after the http target has been anonymized, replace other aspects of the span
- replace_match(attributes["http.route"], "/v1", attributes["http.target"]) where attributes["http.target"] != nil
# replace the title of the span with the route to be more descriptive
- replace_pattern(name, "/v1", attributes["http.route"]) where attributes["http.route"] != nil
# set the route to equal the URL if it's nondescriptive (for the embedding case)
- set(name, Concat([name, attributes["http.url"]], " ")) where name == "POST"
service:
extensions: [zpages, health_check]
pipelines:
traces:
receivers: [otlp]
exporters: [debug, zipkin]
processors: [tail_sampling, transform]
metrics:
receivers: [otlp]
exporters: [debug]
processors: [batch]
logs:
receivers: [otlp]
exporters: [debug]
processors: [batch]
## @param otelEnvVars [default: sane {}] Adds arbitrary environment variables for configuring OTEL using key-value pairs, for example NAME: value
## @extra otelEnvVars.OTEL_EXPORTER_OTLP_ENDPOINT Default deployment target for GRPC otel - Default "http://{{ .Release.Name }}-opentelemetry-collector:4317"
## @param otelEnvVars.OTEL_SERVICE_NAME [default: "nemo-retrieval-service" ]
## @param otelEnvVars.OTEL_TRACES_EXPORTER [default: "otlp" ]
## @param otelEnvVars.OTEL_METRICS_EXPORTER [default: "otlp" ]
## @param otelEnvVars.OTEL_LOGS_EXPORTER [default: "none" ]
## @param otelEnvVars.OTEL_PROPAGATORS [default: "tracecontext baggage" ]
## @param otelEnvVars.OTEL_RESOURCE_ATTRIBUTES [default: "deployment.environment=$(NAMESPACE)" ]
## @param otelEnvVars.OTEL_PYTHON_EXCLUDED_URLS [default: "health" ]
otelEnvVars:
# OpenTelemetry
OTEL_SERVICE_NAME: "nemo-retrieval-service"
OTEL_TRACES_EXPORTER: otlp
OTEL_METRICS_EXPORTER: otlp
OTEL_LOGS_EXPORTER: none
OTEL_PROPAGATORS: "tracecontext,baggage"
OTEL_RESOURCE_ATTRIBUTES: "deployment.environment=$(NAMESPACE)"
OTEL_PYTHON_EXCLUDED_URLS: "health"
## @param zipkinDeployed [default: true] Whether to deploy Zipkin with OpenTelemetry from this helm chart
zipkinDeployed: true
## @section Ingress parameters
## @param ingress.enabled Enables ingress.
## @param ingress.className Specify class name for Ingress.
## @param ingress.annotations Specify additional annotations for ingress.
## @extra ingress.hosts Specify list of hosts each containing lists of paths.
## @param ingress.hosts[0].host Specify name of host.
## @param ingress.hosts[0].paths[0].path Specify ingress path.
## @param ingress.hosts[0].paths[0].pathType Specify path type.
## @param ingress.tls Specify list of pairs of TLS `secretName` and hosts.
ingress:
enabled: false
className: ""
annotations: {}
hosts:
- host: chart-example.local
paths:
- path: /
pathType: ImplementationSpecific
tls: []
## @section Probe parameters
## @param livenessProbe.enabled Enables `livenessProbe``
## @param livenessProbe.httpGet.path `LivenessProbe`` endpoint path
## @param livenessProbe.httpGet.port `LivenessProbe`` endpoint port
## @param livenessProbe.initialDelaySeconds Initial delay seconds for `livenessProbe`
## @param livenessProbe.timeoutSeconds Timeout seconds for `livenessProbe`
## @param livenessProbe.periodSeconds Period seconds for `livenessProbe`
## @param livenessProbe.successThreshold Success threshold for `livenessProbe`
## @param livenessProbe.failureThreshold Failure threshold for `livenessProbe`
livenessProbe:
enabled: false
httpGet:
path: /health
port: http
initialDelaySeconds: 120
periodSeconds: 10
timeoutSeconds: 20
failureThreshold: 20
successThreshold: 1
## @section Probe parameters
## @param startupProbe.enabled Enables `startupProbe``
## @param startupProbe.httpGet.path `StartupProbe`` endpoint path
## @param startupProbe.httpGet.port `StartupProbe`` endpoint port
## @param startupProbe.initialDelaySeconds Initial delay seconds for `startupProbe`
## @param startupProbe.timeoutSeconds Timeout seconds for `startupProbe`
## @param startupProbe.periodSeconds Period seconds for `startupProbe`
## @param startupProbe.successThreshold Success threshold for `startupProbe`
## @param startupProbe.failureThreshold Failure threshold for `startupProbe`
startupProbe:
enabled: false
httpGet:
path: /health
port: http
initialDelaySeconds: 120
periodSeconds: 30
timeoutSeconds: 10
failureThreshold: 220
successThreshold: 1
## @section Probe parameters
## @param readinessProbe.enabled Enables `readinessProbe``
## @param readinessProbe.httpGet.path `ReadinessProbe`` endpoint path
## @param readinessProbe.httpGet.port `ReadinessProbe`` endpoint port
## @param readinessProbe.initialDelaySeconds Initial delay seconds for `readinessProbe`
## @param readinessProbe.timeoutSeconds Timeout seconds for `readinessProbe`
## @param readinessProbe.periodSeconds Period seconds for `readinessProbe`
## @param readinessProbe.successThreshold Success threshold for `readinessProbe`
## @param readinessProbe.failureThreshold Failure threshold for `readinessProbe`
readinessProbe:
enabled: false
httpGet:
path: /health
port: http
initialDelaySeconds: 120
periodSeconds: 30
timeoutSeconds: 10
failureThreshold: 220
successThreshold: 1
## @section Service parameters
## @param service.type Specifies the service type for the deployment.
## @param service.name Overrides the default service name
## @param service.port Specifies the HTTP Port for the service.
## @param service.nodePort Specifies an optional HTTP Node Port for the service.
## @param service.annotations [object] Specify additional annotations to be added to service.
## @param service.labels [object] Specifies additional labels to be added to service.
service:
type: ClusterIP
port: 8000
annotations: {}
labels: {}
name: "" # override the default service name
nodePort: null
## @extra serviceAccount Options to specify service account for the deployment.
## @param serviceAccount.create Specifies whether a service account should be created.
## @param serviceAccount.annotations [object] Sets annotations to be added to the service account.
## @param serviceAccount.name Specifies the name of the service account to use. If it is not set and create is "true", a name is generated using a "fullname" template.
## @skip serviceAccount.automount
serviceAccount:
annotations: {}
automount: true
create: true
name: ""
## @section Secret Creation
## @descriptionStart
## Manage the creation of secrets used by the helm chart
## @descriptionEnd
## @param ngcSecret.create Specifies whether to create the ngc api secret
## @param ngcSecret.password The password to use for the NGC Secret
ngcSecret:
# If set to false, the chart expects a secret with name ngc-api to exist in the namespace
# credentials are needed.
create: false
password: ""
## @param imagePullSecret.create Specifies whether to create the NVCR Image Pull secret
## @param imagePullSecret.password The password to use for the NVCR Image Pull Secret
## @skip imagePullSecret.registry
## @skip imagePullSecret.name
## @skip imagePullSecret.username
imagePullSecret:
create: false
# Leave blank, if no imagePullSecret is needed.
registry: "nvcr.io"
name: "nvcrimagepullsecret"
# If set to false, the chart expects either a imagePullSecret
# with the name configured above to be present on the cluster or that no
# credentials are needed.
username: '$oauthtoken'
password: ""
## @skip nemo
nemo:
userID: "1000"
groupID: "1000"
## @skip containerArgs
containerArgs: []