Skip to content

Commit d3720f6

Browse files
committed
Merge branch 'main' of https://github.com/ai-dynamo/dynamo into hzhou/metrics
2 parents 7ed7332 + 98a5fab commit d3720f6

File tree

45 files changed

+517
-366
lines changed

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

45 files changed

+517
-366
lines changed

components/metrics/README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -82,7 +82,7 @@ metrics --component VllmWorker --endpoint load_metrics
8282

8383
**NOTE**: `load_metrics` is currently a
8484
[hard-coded](https://github.com/ai-dynamo/dynamo/blob/d5220c7b1151372ba3d2a061c7d0a7ed72724789/lib/llm/src/kv_router/publisher.rs#L108)
85-
endpoint name used for python-based workers that register a `KvMetricsPublisher`.
85+
endpoint name used for python-based workers that register a `WorkerMetricsPublisher`.
8686

8787
## Visualization
8888

components/planner/README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -17,7 +17,7 @@ limitations under the License.
1717

1818
# Planner
1919

20-
The planner is a component that monitors the state of the system and makes adjustments to the number of workers to ensure that the system is running efficiently. It can dynamically scale prefill/decode workers up and down based on a variety of KV metrics. You can find documentation and benchmarking examples in the [planner docs](../../docs/planner.md).
20+
The planner is a component that monitors the state of the system and makes adjustments to the number of workers to ensure that the system is running efficiently. It can dynamically scale prefill/decode workers up and down based on a variety of KV metrics. You can find documentation and benchmarking examples in the [planner docs](../../docs/guides/planner.md).
2121

2222
## Usage
2323

container/Dockerfile.sglang

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -325,6 +325,9 @@ COPY --from=wheel_builder /opt/nvidia/nvda_nixl /opt/nvidia/nvda_nixl
325325
# Copy Cargo cache to avoid re-downloading dependencies
326326
COPY --from=wheel_builder $CARGO_HOME $CARGO_HOME
327327

328+
# Copy rest of the code
329+
COPY . /workspace
330+
328331
# Build C bindings, creates lib/bindings/c/include
329332
RUN cd /workspace/lib/bindings/c && cargo build --release --locked
330333

@@ -365,8 +368,6 @@ ARG GENAI_PERF_VERSION
365368
# Install genai-perf for benchmarking
366369
RUN uv pip install genai-perf==$GENAI_PERF_VERSION
367370

368-
COPY . /workspace
369-
370371
ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
371372

372373
CMD []

container/Dockerfile.tensorrt_llm

Lines changed: 3 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -300,6 +300,9 @@ COPY --from=wheel_builder /workspace /workspace
300300
# Copy Cargo cache to avoid re-downloading dependencies
301301
COPY --from=wheel_builder $CARGO_HOME $CARGO_HOME
302302

303+
# Copy rest of the code
304+
COPY . /workspace
305+
303306
# Build C bindings, creates lib/bindings/c/include
304307
RUN cd /workspace/lib/bindings/c && cargo build --release --locked
305308

container/Dockerfile.vllm

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -403,6 +403,9 @@ COPY --from=wheel_builder /opt/nvidia/nvda_nixl /opt/nvidia/nvda_nixl
403403
# Copy Cargo cache to avoid re-downloading dependencies
404404
COPY --from=wheel_builder $CARGO_HOME $CARGO_HOME
405405

406+
# Copy rest of the code
407+
COPY . /workspace
408+
406409
# Build C bindings, creates lib/bindings/c/include
407410
#
408411
# TODO: In theory the 'cargo build' in earlier stage covers this, we "just" need to copy the
@@ -447,8 +450,6 @@ ARG GENAI_PERF_VERSION
447450
# Install genai-perf for benchmarking
448451
RUN uv pip install genai-perf==$GENAI_PERF_VERSION
449452

450-
COPY . /workspace
451-
452453
ENTRYPOINT ["/opt/nvidia/nvidia_entrypoint.sh"]
453454

454455
CMD []
Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@
1414
# limitations under the License.
1515
apiVersion: v2
1616
name: dynamo-crds
17-
description: A Helm chart for CRDs of dynamo operator
17+
description: A Helm chart for dynamo CRDs
1818
type: application
1919
version: 0.1.6
2020
dependencies: []
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,8 @@ kind: CustomResourceDefinition
1919
metadata:
2020
annotations:
2121
controller-gen.kubebuilder.io/version: v0.16.4
22+
# never delete this resource with helm delete
23+
helm.sh/resource-policy: keep
2224
name: dynamocomponentdeployments.nvidia.com
2325
spec:
2426
group: nvidia.com
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,8 @@ kind: CustomResourceDefinition
1919
metadata:
2020
annotations:
2121
controller-gen.kubebuilder.io/version: v0.16.4
22+
# never delete this resource with helm delete
23+
helm.sh/resource-policy: keep
2224
name: dynamocomponents.nvidia.com
2325
spec:
2426
group: nvidia.com
Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,8 @@ kind: CustomResourceDefinition
1919
metadata:
2020
annotations:
2121
controller-gen.kubebuilder.io/version: v0.16.4
22+
# never delete this resource with helm delete
23+
helm.sh/resource-policy: keep
2224
name: dynamographdeployments.nvidia.com
2325
spec:
2426
group: nvidia.com

deploy/cloud/helm/deploy.sh

Lines changed: 13 additions & 10 deletions
Original file line numberDiff line numberDiff line change
@@ -41,7 +41,7 @@ export ENABLE_LWS="${ENABLE_LWS:=false}"
4141

4242
# Add command line options
4343
INTERACTIVE=false
44-
44+
INSTALL_CRDS=false
4545
# Parse command line arguments
4646
while [[ $# -gt 0 ]]; do
4747
key="$1"
@@ -50,11 +50,16 @@ while [[ $# -gt 0 ]]; do
5050
INTERACTIVE=true
5151
shift
5252
;;
53+
--crds)
54+
INSTALL_CRDS=true
55+
shift
56+
;;
5357
--help)
5458
echo "Usage: $0 [options]"
5559
echo "Options:"
5660
echo " --interactive Run in interactive mode"
5761
echo " --help Show this help message"
62+
echo " --crds Also install the CRDs"
5863
exit 0
5964
;;
6065
*)
@@ -115,15 +120,6 @@ retry_command "$HELM_CMD repo add bitnami https://charts.bitnami.com/bitnami" 5
115120
retry_command "$HELM_CMD repo add minio https://charts.min.io/" 5 5 && \
116121
retry_command "$HELM_CMD repo update" 5 5
117122

118-
cd platform
119-
cd components/operator
120-
retry_command "$HELM_CMD dependency update" 5 5
121-
cd ../..
122-
cd components/api-store
123-
retry_command "$HELM_CMD dependency update" 5 5
124-
cd ../..
125-
retry_command "$HELM_CMD dep update" 7 5
126-
cd ..
127123

128124
# Generate the values file
129125
echo "Generating values file with:"
@@ -143,6 +139,7 @@ echo "INGRESS_CLASS: $INGRESS_CLASS"
143139
echo "ISTIO_GATEWAY: $ISTIO_GATEWAY"
144140
echo "DYNAMO_INGRESS_SUFFIX: $DYNAMO_INGRESS_SUFFIX"
145141
echo "VIRTUAL_SERVICE_SUPPORTS_HTTPS: $VIRTUAL_SERVICE_SUPPORTS_HTTPS"
142+
echo "INSTALL_CRDS: $INSTALL_CRDS"
146143

147144
envsubst '${NAMESPACE} ${RELEASE_NAME} ${DOCKER_USERNAME} ${DOCKER_PASSWORD} ${DOCKER_SERVER} ${IMAGE_TAG} ${DYNAMO_INGRESS_SUFFIX} ${PIPELINES_DOCKER_SERVER} ${PIPELINES_DOCKER_USERNAME} ${PIPELINES_DOCKER_PASSWORD} ${DOCKER_SECRET_NAME} ${INGRESS_ENABLED} ${ISTIO_ENABLED} ${INGRESS_CLASS} ${ISTIO_GATEWAY} ${VIRTUAL_SERVICE_SUPPORTS_HTTPS} ${ENABLE_LWS}' < dynamo-platform-values.yaml > generated-values.yaml
148145
echo "generated file contents:"
@@ -157,6 +154,12 @@ cd platform
157154
retry_command "$HELM_CMD dep build" 5 5
158155
cd ..
159156

157+
# Install/upgrade the helm chart for the CRDs
158+
if [ "$INSTALL_CRDS" = true ]; then
159+
echo "Installing/upgrading helm chart for the CRDs..."
160+
$HELM_CMD upgrade --install dynamo-crds crds/ --namespace default --wait --atomic
161+
fi
162+
160163
# Install/upgrade the helm chart
161164
echo "Installing/upgrading helm chart..."
162165
$HELM_CMD upgrade --install $RELEASE_NAME platform/ \

0 commit comments

Comments
 (0)