Skip to content

Commit

Permalink
Updating server config keys
Browse files Browse the repository at this point in the history
  • Loading branch information
nv-braf committed Feb 20, 2024
1 parent 2607a5d commit c485490
Showing 1 changed file with 71 additions and 21 deletions.
92 changes: 71 additions & 21 deletions model_analyzer/triton/server/server_config.py
Original file line number Diff line number Diff line change
Expand Up @@ -24,55 +24,105 @@ class TritonServerConfig:
"""

# Names of the server arguments this config knows about, grouped by area.
#
# Every entry must be followed by a comma: adjacent string literals are
# implicitly concatenated by Python, so a missing comma silently fuses two
# keys into one bogus key (this previously happened after
# "grpc-restricted-protocol" and after "cache-directory").
# Each key is listed exactly once; keys marked deprecated live only in the
# DEPRECATED section at the end.
server_arg_keys = [
    # Server
    "id",
    "exit-timeout-secs",
    # Logging
    "log-verbose",
    "log-info",
    "log-warning",
    "log-error",
    "log-format",
    "log-file",
    # Model Repository
    "model-store",
    "model-repository",
    # Exit
    "exit-on-error",
    # Strictness
    "disable-auto-complete-config",
    "strict-readiness",
    # Model control
    "model-control-mode",
    "repository-poll-secs",
    "load-model",
    "model-load-thread-count",
    "model-load-retry-count",
    "model-namespacing",
    # HTTP
    "allow-http",
    "http-address",
    "http-port",
    "reuse-http-port",
    "http-header-forward-pattern",
    "http-thread-count",
    "http-restricted-api",
    # GRPC
    "allow-grpc",
    "grpc-address",
    "grpc-port",
    "reuse-grpc-port",
    "grpc-header-forward-pattern",
    "grpc-infer-allocation-pool-size",
    "grpc-use-ssl",
    "grpc-use-ssl-mutual",
    "grpc-server-cert",
    "grpc-server-key",
    "grpc-root-cert",
    "grpc-infer-response-compression-level",
    "grpc-keepalive-time",
    "grpc-keepalive-timeout",
    "grpc-keepalive-permit-without-calls",
    "grpc-http2-max-pings-without-data",
    "grpc-http2-min-recv-ping-interval-without-data",
    "grpc-http2-max-ping-strikes",
    "grpc-max-connection-age",
    "grpc-max-connection-age-grace",
    "grpc-restricted-protocol",
    # Sagemaker
    "allow-sagemaker",
    "sagemaker-port",
    "sagemaker-safe-port-range",
    "sagemaker-thread-count",
    # Vertex
    "allow-vertex-ai",
    "vertex-ai-port",
    "vertex-ai-thread-count",
    "vertex-ai-default-model",
    # Metrics
    "allow-metrics",
    "allow-gpu-metrics",
    "metrics-interval-ms",
    "allow-cpu-metrics",
    "metrics-address",
    "metrics-port",
    "metrics-config",
    # Tracing
    "trace-config",
    # Backend
    "backend-directory",
    "backend-config",
    "allow-soft-placement",
    "gpu-memory-fraction",
    "tensorflow-version",
    # Repository Agent
    "repoagent-directory",
    # Response Cache
    "cache-config",
    "cache-directory",
    # Rate Limiter
    "rate-limit",
    "rate-limit-resource",
    # Memory/Device Management
    "pinned-memory-pool-byte-size",
    "cuda-memory-pool-byte-size",
    "cuda-virtual-address-size",
    "min-supported-compute-capability",
    "buffer-management-thread-count",
    "host-policy",
    "model-load-gpu-limit",
    # DEPRECATED
    "strict-model-config",
    "response-cache-byte-size",
    "trace-file",
    "trace-level",
    "trace-rate",
    "trace-count",
    "trace-log-frequency",
]

def __init__(self):
Expand Down

0 comments on commit c485490

Please sign in to comment.