Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
Show all changes
45 commits
Select commit Hold shift + click to select a range
4b9ca2f
sglang ec2
Jan 21, 2026
c0f056d
add ec2 in docker file
Jan 22, 2026
9ffd708
add ec2 entrypoint
Jan 22, 2026
5818fb4
add buildspec ec2
Jan 22, 2026
f6b9775
add tests
Jan 22, 2026
4e848f8
modify tests
Jan 22, 2026
3d2204f
fix formatting
Jan 22, 2026
341e551
run
Jan 22, 2026
220180a
fix cuda compat
Jan 22, 2026
54cb7f2
add sglang framework
Jan 22, 2026
a0a4e03
fix
Jan 22, 2026
480ed98
skip telemetry
Jan 24, 2026
be65b0e
fix tests
Jan 24, 2026
fa736ac
fix tests
Jan 25, 2026
fa98c05
fix
Jan 25, 2026
7dc98fb
fix tests
Jan 25, 2026
06cb7fc
fix upstream tests
Jan 25, 2026
8f426b1
fix hf token
Jan 28, 2026
0e41e99
fix
Jan 28, 2026
eb7c7a7
fix
Jan 28, 2026
96a7921
fix
Jan 28, 2026
2879dbe
fix
Jan 28, 2026
76555c1
fix
Jan 28, 2026
12c9975
fix
Jan 28, 2026
18808af
rerun sglang ec2 tests
Jan 28, 2026
032bbe3
skip telemetry tests
Jan 29, 2026
2794a34
skip telemetry tests
Jan 29, 2026
e00d836
skip telemetry tests
Jan 29, 2026
7bfba04
skip telemetry tests
Jan 30, 2026
cd59194
skip telemetry tests
Jan 30, 2026
c6461aa
skip telemetry tests
Jan 30, 2026
1552199
skip telemetry tests
Jan 30, 2026
2891306
skip telemetry tests
Jan 30, 2026
8d14b8c
skip telemetry tests
Jan 30, 2026
1598854
skip telemetry tests
Jan 30, 2026
aac8ca2
rerun to debug
Jan 30, 2026
0c9a6cd
skip telemetry tests
Jan 30, 2026
2bdc82e
skip logic for telemetry tests
Jan 30, 2026
2186229
skip logic for telemetry tests
Jan 30, 2026
a2635f3
change skip logic
Feb 3, 2026
8b283f5
change skip logic
Feb 3, 2026
b1df749
change skip logic
Feb 3, 2026
e8bb0ee
add pytest filter to exclude telemetry marked tests in ec2 test suite
Feb 3, 2026
7825388
add pytest filter to exclude telemetry marked tests in ec2 test suite
Feb 3, 2026
2a8460a
raise error for hf_token if not found
Feb 5, 2026
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion dlc_developer_config.toml
Original file line number Diff line number Diff line change
Expand Up @@ -37,7 +37,7 @@ deep_canary_mode = false
[build]
# Add in frameworks you would like to build. By default, builds are disabled unless you specify building an image.
# available frameworks - ["base", "vllm", "sglang", "autogluon", "huggingface_tensorflow", "huggingface_pytorch", "huggingface_tensorflow_trcomp", "huggingface_pytorch_trcomp", "pytorch_trcomp", "tensorflow", "pytorch", "stabilityai_pytorch"]
build_frameworks = []
build_frameworks = ["sglang"]


# By default we build both training and inference containers. Set true/false values to determine which to build.
Expand Down
6 changes: 6 additions & 0 deletions sglang/build_artifacts/dockerd_entrypoint.sh
Original file line number Diff line number Diff line change
@@ -0,0 +1,6 @@
#!/usr/bin/env bash
# Container entrypoint that launches the SGLang server.
#
# Step 1: run the telemetry script on a best-effort basis. Its output is
# discarded and any failure (including the script not being present) is
# ignored via `|| true`, so telemetry can never block server start-up.
bash /usr/local/bin/bash_telemetry.sh >/dev/null 2>&1 || true

# Step 2: start the server, forwarding every container argument unchanged.
# `exec` replaces this wrapper shell with the server process, so signals sent
# to the container (e.g. SIGTERM on `docker stop`) are delivered to the server
# itself and the server's exit status becomes the container's exit status.
exec python3 -m sglang.launch_server "$@"
56 changes: 56 additions & 0 deletions sglang/buildspec-ec2.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,56 @@
# Buildspec for the SGLang EC2 image.
# Top-level scalars are anchored (&NAME) so the sections below can reuse them
# through aliases (*NAME) and the !join tag.
account_id: &ACCOUNT_ID <set-$ACCOUNT_ID-in-environment>
prod_account_id: &PROD_ACCOUNT_ID 763104351884
region: &REGION <set-$REGION-in-environment>
framework: &FRAMEWORK sglang
# Quoted so the versions stay strings instead of being parsed as numbers.
version: &VERSION "0.5.6"
short_version: &SHORT_VERSION "0.5"
arch_type: &ARCH_TYPE x86_64
autopatch_build: "False"

repository_info:
  # Merged into each image entry below via `<<: *BUILD_REPOSITORY`.
  build_repository: &BUILD_REPOSITORY
    image_type: &IMAGE_TYPE gpu
    root: .
    repository_name: &REPOSITORY_NAME !join [ pr, "-", *FRAMEWORK ]
    repository: &REPOSITORY !join [ *ACCOUNT_ID, .dkr.ecr., *REGION, .amazonaws.com/, *REPOSITORY_NAME ]
    release_repository_name: &RELEASE_REPOSITORY_NAME !join [ *FRAMEWORK ]
    release_repository: &RELEASE_REPOSITORY !join [ *PROD_ACCOUNT_ID, .dkr.ecr., *REGION, .amazonaws.com/, *RELEASE_REPOSITORY_NAME ]

context:
  # Files made available to the Docker build; each entry maps a repository
  # path (source) to the name it has inside the build context (target).
  build_context: &BUILD_CONTEXT
    deep_learning_container:
      source: src/deep_learning_container.py
      target: deep_learning_container.py
    install_efa:
      source: scripts/install_efa.sh
      target: install_efa.sh
    start_cuda_compat:
      source: sglang/build_artifacts/start_cuda_compat.sh
      target: start_cuda_compat.sh
    # NOTE(review): the key says "sagemaker" although this is the EC2
    # buildspec; presumably the key is only a label - confirm before renaming.
    sagemaker_entrypoint:
      source: sglang/build_artifacts/dockerd_entrypoint.sh
      target: dockerd_entrypoint.sh

images:
  sglang_ec2:
    <<: *BUILD_REPOSITORY
    context:
      <<: *BUILD_CONTEXT
    image_size_baseline: 26000
    device_type: &DEVICE_TYPE gpu
    cuda_version: &CUDA_VERSION cu129
    python_version: &DOCKER_PYTHON_VERSION py3
    tag_python_version: &TAG_PYTHON_VERSION py312
    os_version: &OS_VERSION ubuntu22.04
    # tag and latest_release_tag are built from the same parts and are
    # currently identical.
    tag: !join [ *VERSION, "-", *DEVICE_TYPE, "-", *TAG_PYTHON_VERSION, "-", *CUDA_VERSION, "-", *OS_VERSION, "-ec2" ]
    latest_release_tag: !join [ *VERSION, "-", *DEVICE_TYPE, "-", *TAG_PYTHON_VERSION, "-", *CUDA_VERSION, "-", *OS_VERSION, "-ec2" ]
    skip_build: "False"
    docker_file: !join [ *FRAMEWORK, /, *ARCH_TYPE, /, *DEVICE_TYPE, /Dockerfile ]
    # Name of the Dockerfile build stage to build for this image.
    target: sglang-ec2
    build: true
    enable_common_stage_build: false
    test_configs:
      test_platforms:
        - sanity
        - security
        - ec2
2 changes: 1 addition & 1 deletion sglang/buildspec.yml
Original file line number Diff line number Diff line change
@@ -1 +1 @@
buildspec_pointer: buildspec-sm.yml
buildspec_pointer: buildspec-ec2.yml
18 changes: 18 additions & 0 deletions sglang/x86_64/gpu/Dockerfile
Original file line number Diff line number Diff line change
Expand Up @@ -83,6 +83,24 @@ RUN echo 'source /usr/local/bin/bash_telemetry.sh' >> /etc/bash.bashrc \
&& rm -rf /var/lib/apt/lists/* \
&& rm -rf /root/.cache | true

# =======================================================
# ====================== EC2 ============================
# =======================================================

FROM base AS sglang-ec2

# Hold every installed CUDA/NVIDIA package at its current version so the
# upgrade below cannot move it, then apply the remaining OS package upgrades.
# `xargs -r` skips `apt-mark hold` when grep matches nothing (without it,
# apt-mark would be invoked with no package names). The apt package lists and
# /tmp are cleaned in the same RUN so files created by this step are not baked
# into the layer.
RUN dpkg -l | grep -E "cuda|nvidia|libnv" | awk '{print $2}' | xargs -r apt-mark hold \
 && apt-get update \
 && apt-get upgrade -y \
 && apt-get clean \
 && rm -rf /var/lib/apt/lists/* /tmp/*

# Install the entrypoint wrapper and make it executable.
COPY dockerd_entrypoint.sh /usr/local/bin/dockerd_entrypoint.sh
RUN chmod +x /usr/local/bin/dockerd_entrypoint.sh

# Exec-form ENTRYPOINT: arguments passed to `docker run` are appended and
# reach the script as "$@".
ENTRYPOINT ["/usr/local/bin/dockerd_entrypoint.sh"]

# =======================================================
# ====================== sagemaker ======================
# =======================================================
Expand Down
2 changes: 2 additions & 0 deletions test/dlc_tests/conftest.py
Original file line number Diff line number Diff line change
Expand Up @@ -109,6 +109,8 @@
"pytorch_trcomp_training",
# Autogluon
"autogluon_training",
# SGLang
"sglang",
# Processor fixtures
"gpu",
"cpu",
Expand Down
Empty file.
Empty file.
Loading