diff --git a/templates/config.json b/templates/config.json
index 00ffb149..e0068876 100644
--- a/templates/config.json
+++ b/templates/config.json
@@ -3748,5 +3748,27 @@
       "diskSize": 20
     },
     "tags": ["LLM Inference & Model Serving", "Developer Tools", "AI Agents"]
-  }
+  },
+  {
+    "id": "deepspeed",
+    "name": "deepspeedai/DeepSpeed",
+    "description": "CPU-safe DeepSpeed source/runtime verifier with health, demo, and model-list endpoints. It verifies upstream launcher/runtime/inference/config files without importing DeepSpeed, downloading models, running training, or requiring GPU access.",
+    "repo": "https://github.com/Phala-Network/phala-cloud/tree/main/templates/prebuilt/deepspeed",
+    "author": "deepspeedai",
+    "icon": "deepspeed.svg",
+    "envs": [
+      {
+        "key": "DEEPSPEED_SOURCE_REF",
+        "required": false,
+        "description": "DeepSpeed Git tag, branch, or commit used for CPU-safe source verification.",
+        "default": "v0.19.1"
+      }
+    ],
+    "defaultResource": {
+      "vCPU": 1,
+      "memory": 2048,
+      "diskSize": 10
+    },
+    "tags": ["LLM Inference & Model Serving", "Developer Tools", "AI Agents"]
+  }
 ]
diff --git a/templates/icons/deepspeed.svg b/templates/icons/deepspeed.svg
new file mode 100644
index 00000000..77a86ace
--- /dev/null
+++ b/templates/icons/deepspeed.svg
@@ -0,0 +1,27 @@
+<svg width="287" height="107" viewBox="0 0 287 107" fill="none" xmlns="http://www.w3.org/2000/svg">
+<g clip-path="url(#clip0)">
+<rect width="287" height="107" fill="white"/>
+<path d="M110.738 65.5H108.096V62.6963H108.031C106.807 64.8232 104.916 65.8867 102.359 65.8867C100.286 65.8867 98.6265 65.1509 97.3804 63.6792C96.145 62.1968 95.5273 60.1826 95.5273 57.6367C95.5273 54.9082 96.2148 52.7222 97.5898 51.0786C98.9648 49.4351 100.796 48.6133 103.084 48.6133C105.351 48.6133 107 49.5049 108.031 51.2881H108.096V41.0723H110.738V65.5ZM108.096 58.0396V55.6064C108.096 54.2744 107.655 53.1465 106.774 52.2227C105.894 51.2988 104.776 50.8369 103.423 50.8369C101.812 50.8369 100.544 51.4277 99.6201 52.6094C98.6963 53.791 98.2344 55.4238 98.2344 57.5078C98.2344 59.4092 98.6748 60.9131 99.5557 62.0195C100.447 63.1152 101.64 63.6631 103.133 63.6631C104.604 63.6631 105.797 63.1313 106.71 62.0679C107.634 61.0044 108.096 59.6616 108.096 58.0396ZM129.349 57.9106H117.699C117.742 59.7476 118.236 61.1655 119.182 62.1646C120.127 63.1636 121.427 63.6631 123.081 63.6631C124.939 63.6631 126.647 63.0508 128.205 61.8262V64.3076C126.755 65.3604 124.837 65.8867 122.453 65.8867C120.122 65.8867 118.29 65.1401 116.958 63.647C115.626 62.1431 114.96 60.0322 114.96 57.3145C114.96 54.7471 115.685 52.6577 117.135 51.0464C118.596 49.4243 120.406 48.6133 122.565 48.6133C124.725 48.6133 126.395 49.3115 127.577 50.708C128.758 52.1045 129.349 54.0435 129.349 56.5249V57.9106ZM126.642 55.6709C126.631 54.1455 126.261 52.9585 125.53 52.1099C124.811 51.2612 123.806 50.8369 122.517 50.8369C121.271 50.8369 120.213 51.2827 119.343 52.1743C118.473 53.0659 117.936 54.2314 117.731 55.6709H126.642ZM146.623 57.9106H134.973C135.016 59.7476 135.51 61.1655 136.455 62.1646C137.4 63.1636 138.7 63.6631 140.354 63.6631C142.213 63.6631 143.921 63.0508 145.479 61.8262V64.3076C144.028 65.3604 142.111 65.8867 139.726 65.8867C137.395 65.8867 135.563 65.1401 134.231 63.647C132.899 62.1431 132.233 60.0322 132.233 57.3145C132.233 54.7471 132.958 52.6577 134.409 51.0464C135.87 49.4243 137.68 48.6133 139.839 48.6133C141.998 48.6133 143.668 49.3115 144.85 50.708C146.032 52.1045 146.623 54.0435 146.623 
56.5249V57.9106ZM143.916 55.6709C143.905 54.1455 143.534 52.9585 142.804 52.1099C142.084 51.2612 141.08 50.8369 139.791 50.8369C138.544 50.8369 137.486 51.2827 136.616 52.1743C135.746 53.0659 135.209 54.2314 135.005 55.6709H143.916ZM153.342 63.1152H153.277V73.0894H150.635V49H153.277V51.9004H153.342C154.642 49.709 156.543 48.6133 159.046 48.6133C161.173 48.6133 162.833 49.3545 164.025 50.8369C165.217 52.3086 165.813 54.2852 165.813 56.7666C165.813 59.5273 165.142 61.7402 163.799 63.4053C162.457 65.0596 160.62 65.8867 158.289 65.8867C156.151 65.8867 154.502 64.9629 153.342 63.1152ZM153.277 56.4604V58.7646C153.277 60.1289 153.718 61.2891 154.599 62.2451C155.49 63.1904 156.618 63.6631 157.982 63.6631C159.583 63.6631 160.834 63.0508 161.737 61.8262C162.65 60.6016 163.106 58.8989 163.106 56.7183C163.106 54.8813 162.682 53.4419 161.833 52.3999C160.985 51.3579 159.835 50.8369 158.385 50.8369C156.849 50.8369 155.614 51.374 154.679 52.4482C153.745 53.5117 153.277 54.8491 153.277 56.4604ZM169.036 64.9038V62.0679C170.476 63.1313 172.06 63.6631 173.79 63.6631C176.11 63.6631 177.27 62.8896 177.27 61.3428C177.27 60.9023 177.168 60.5317 176.964 60.231C176.771 59.9194 176.502 59.6455 176.158 59.4092C175.825 59.1729 175.428 58.9634 174.966 58.7808C174.515 58.5874 174.026 58.3887 173.5 58.1846C172.769 57.8945 172.125 57.6045 171.566 57.3145C171.018 57.0137 170.556 56.6807 170.18 56.3154C169.815 55.9395 169.536 55.5151 169.342 55.0425C169.16 54.5698 169.068 54.0166 169.068 53.3828C169.068 52.6094 169.246 51.9272 169.6 51.3364C169.955 50.7349 170.427 50.2354 171.018 49.8379C171.609 49.4297 172.28 49.1235 173.032 48.9194C173.795 48.7153 174.579 48.6133 175.385 48.6133C176.813 48.6133 178.092 48.8604 179.22 49.3545V52.0293C178.006 51.2344 176.609 50.8369 175.03 50.8369C174.536 50.8369 174.09 50.896 173.693 51.0142C173.295 51.1216 172.952 51.2773 172.662 51.4814C172.382 51.6855 172.162 51.9326 172.001 52.2227C171.851 52.502 171.775 52.8135 171.775 53.1572C171.775 53.5869 171.851 53.9468 
172.001 54.2368C172.162 54.5269 172.393 54.7847 172.694 55.0103C172.995 55.2358 173.36 55.4399 173.79 55.6226C174.219 55.8052 174.708 56.0039 175.256 56.2188C175.986 56.498 176.642 56.7881 177.222 57.0889C177.802 57.3789 178.296 57.7119 178.704 58.0879C179.112 58.4531 179.424 58.8774 179.639 59.3608C179.864 59.8442 179.977 60.4189 179.977 61.085C179.977 61.9014 179.794 62.6104 179.429 63.2119C179.075 63.8135 178.597 64.313 177.995 64.7104C177.394 65.1079 176.701 65.4033 175.917 65.5967C175.132 65.79 174.311 65.8867 173.451 65.8867C171.754 65.8867 170.282 65.5591 169.036 64.9038ZM186.761 63.1152H186.696V73.0894H184.054V49H186.696V51.9004H186.761C188.061 49.709 189.962 48.6133 192.465 48.6133C194.592 48.6133 196.251 49.3545 197.444 50.8369C198.636 52.3086 199.232 54.2852 199.232 56.7666C199.232 59.5273 198.561 61.7402 197.218 63.4053C195.875 65.0596 194.039 65.8867 191.708 65.8867C189.57 65.8867 187.921 64.9629 186.761 63.1152ZM186.696 56.4604V58.7646C186.696 60.1289 187.137 61.2891 188.018 62.2451C188.909 63.1904 190.037 63.6631 191.401 63.6631C193.002 63.6631 194.253 63.0508 195.156 61.8262C196.069 60.6016 196.525 58.8989 196.525 56.7183C196.525 54.8813 196.101 53.4419 195.252 52.3999C194.404 51.3579 193.254 50.8369 191.804 50.8369C190.268 50.8369 189.033 51.374 188.098 52.4482C187.164 53.5117 186.696 54.8491 186.696 56.4604ZM216.715 57.9106H205.065C205.108 59.7476 205.603 61.1655 206.548 62.1646C207.493 63.1636 208.793 63.6631 210.447 63.6631C212.306 63.6631 214.014 63.0508 215.571 61.8262V64.3076C214.121 65.3604 212.204 65.8867 209.819 65.8867C207.488 65.8867 205.656 65.1401 204.324 63.647C202.992 62.1431 202.326 60.0322 202.326 57.3145C202.326 54.7471 203.051 52.6577 204.501 51.0464C205.962 49.4243 207.772 48.6133 209.932 48.6133C212.091 48.6133 213.761 49.3115 214.943 50.708C216.125 52.1045 216.715 54.0435 216.715 56.5249V57.9106ZM214.008 55.6709C213.998 54.1455 213.627 52.9585 212.896 52.1099C212.177 51.2612 211.172 50.8369 209.883 50.8369C208.637 50.8369 
207.579 51.2827 206.709 52.1743C205.839 53.0659 205.302 54.2314 205.098 55.6709H214.008ZM233.989 57.9106H222.339C222.382 59.7476 222.876 61.1655 223.821 62.1646C224.767 63.1636 226.066 63.6631 227.721 63.6631C229.579 63.6631 231.287 63.0508 232.845 61.8262V64.3076C231.395 65.3604 229.477 65.8867 227.092 65.8867C224.761 65.8867 222.93 65.1401 221.598 63.647C220.266 62.1431 219.6 60.0322 219.6 57.3145C219.6 54.7471 220.325 52.6577 221.775 51.0464C223.236 49.4243 225.046 48.6133 227.205 48.6133C229.364 48.6133 231.035 49.3115 232.216 50.708C233.398 52.1045 233.989 54.0435 233.989 56.5249V57.9106ZM231.282 55.6709C231.271 54.1455 230.9 52.9585 230.17 52.1099C229.45 51.2612 228.446 50.8369 227.157 50.8369C225.911 50.8369 224.853 51.2827 223.982 52.1743C223.112 53.0659 222.575 54.2314 222.371 55.6709H231.282ZM252.084 65.5H249.441V62.6963H249.377C248.152 64.8232 246.262 65.8867 243.705 65.8867C241.632 65.8867 239.972 65.1509 238.726 63.6792C237.491 62.1968 236.873 60.1826 236.873 57.6367C236.873 54.9082 237.561 52.7222 238.936 51.0786C240.311 49.4351 242.142 48.6133 244.43 48.6133C246.697 48.6133 248.346 49.5049 249.377 51.2881H249.441V41.0723H252.084V65.5ZM249.441 58.0396V55.6064C249.441 54.2744 249.001 53.1465 248.12 52.2227C247.239 51.2988 246.122 50.8369 244.769 50.8369C243.157 50.8369 241.89 51.4277 240.966 52.6094C240.042 53.791 239.58 55.4238 239.58 57.5078C239.58 59.4092 240.021 60.9131 240.901 62.0195C241.793 63.1152 242.985 63.6631 244.479 63.6631C245.95 63.6631 247.143 63.1313 248.056 62.0679C248.979 61.0044 249.441 59.6616 249.441 58.0396Z" fill="black"/>
+<path d="M34.1305 67.6806C36.4372 65.3739 39.6428 64.8396 41.2905 66.4872C42.9381 68.1349 42.4039 71.3405 40.0971 73.6472C37.7904 75.954 23.9871 83.7906 23.9871 83.7906C23.9871 83.7906 31.8238 69.9873 34.1305 67.6806Z" fill="#FFC60F"/>
+<circle cx="40.0974" cy="37.2509" r="3.79717" transform="rotate(45 40.0974 37.2509)" fill="#F17F00"/>
+<circle cx="55.6108" cy="52.764" r="3.79717" transform="rotate(45 55.6108 52.764)" fill="#F17F00"/>
+<circle cx="78.881" cy="29.494" r="3.79717" transform="rotate(45 78.881 29.494)" fill="#F17F00"/>
+<circle cx="38.3074" cy="56.9408" r="3.79717" transform="rotate(45 38.3074 56.9408)" fill="#F17F00"/>
+<circle cx="70.5278" cy="67.681" r="3.79717" transform="rotate(45 70.5278 67.681)" fill="#F17F00"/>
+<circle cx="50.8379" cy="69.4711" r="3.79717" transform="rotate(45 50.8379 69.4711)" fill="#F17F00"/>
+<line x1="39.947" y1="37.4136" x2="78.8092" y2="29.4793" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="70.3643" y1="68.1263" x2="78.8823" y2="29.3333" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="40.4924" y1="36.7975" x2="38.4654" y2="57.0154" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="38.1289" y1="56.8053" x2="56.0291" y2="52.4134" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="56.148" y1="52.3093" x2="51.1777" y2="69.9078" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="50.7678" y1="69.1781" x2="70.8194" y2="67.3004" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="50.4041" y1="69.6991" x2="39.9762" y2="37.0126" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="70.6683" y1="67.6962" x2="38.0867" y2="57.6573" stroke="#F17F00" stroke-width="1.5"/>
+<line x1="55.3219" y1="52.5941" x2="78.8712" y2="29.3586" stroke="#F17F00" stroke-width="1.5"/>
+</g>
+<defs>
+<clipPath id="clip0">
+<rect width="287" height="107" fill="white"/>
+</clipPath>
+</defs>
+</svg>
diff --git a/templates/prebuilt/deepspeed/README.md b/templates/prebuilt/deepspeed/README.md
new file mode 100644
index 00000000..b6ef31cd
--- /dev/null
+++ b/templates/prebuilt/deepspeed/README.md
@@ -0,0 +1,162 @@
+# deepspeedai/DeepSpeed on Phala Cloud
+
+Deploy a CPU-safe DeepSpeed source/runtime verifier on Phala Cloud.
+
+## Overview
+
+[DeepSpeed](https://github.com/deepspeedai/DeepSpeed) is a GPU-oriented distributed training and inference optimization framework from the DeepSpeed team. Full DeepSpeed workloads normally involve PyTorch, accelerator-specific kernels, distributed launchers, CUDA/ROCm or other accelerator backends, model checkpoints, and training or inference jobs that must be sized for the selected hardware.
+
+This prebuilt template intentionally does not run a full DeepSpeed training or inference server. The default deployment is a minimal HTTP verifier that is safe for a CPU-only Phala Cloud `tdx.small`-style deployment. It downloads selected public DeepSpeed source and documentation files from a pinned upstream Git ref, verifies markers for core concepts, and `py_compile` checks selected Python source files without importing `deepspeed` or `torch`.
+
+The demo does not download model weights, run distributed training, start inference, require CUDA/GPU access, require provider credentials, require Hugging Face tokens, mount host paths, or use privileged container features.
+
+## Metadata
+
+- Template id: `deepspeed`
+- Display name: `deepspeedai/DeepSpeed`
+- Upstream repository: https://github.com/deepspeedai/DeepSpeed
+- Upstream documentation: https://www.deepspeed.ai/
+- Default source ref: `v0.19.1`
+- Icon source: upstream DeepSpeed README logo at `docs/assets/images/DeepSpeed_light.svg`
+- Upstream author: DeepSpeed Team, via the `deepspeedai/DeepSpeed` GitHub repository
+- Phala prebuilt source: https://github.com/Phala-Network/phala-cloud/tree/main/templates/prebuilt/deepspeed
+
+## What This Template Runs
+
+The compose file starts one public HTTP service:
+
+- `app`: A `python:3.12-slim-bookworm` container that runs an inline Python HTTP server on port `8080`.
+
+On startup, the verifier fetches these upstream files from `deepspeedai/DeepSpeed` at `DEEPSPEED_SOURCE_REF`:
+
+- `README.md`
+- `deepspeed/launcher/runner.py`
+- `deepspeed/runtime/engine.py`
+- `deepspeed/runtime/config.py`
+- `deepspeed/inference/engine.py`
+- `docs/_pages/config-json.md`
+- `docs/_pages/inference.md`
+
+The verifier checks for launcher, runtime engine, inference engine, and JSON config documentation markers, then compiles the selected Python source files with `py_compile`. It never imports DeepSpeed at module import time or request time, which avoids Torch/CUDA initialization and extension compilation on small CPU-only CVMs.
+
+## Deploy
+
+1. Deploy the `deepspeed` prebuilt template on Phala Cloud.
+2. Keep the default CPU-only resource profile for the source verifier.
+3. Optionally set `DEEPSPEED_SOURCE_REF` to another public DeepSpeed tag, branch, or commit.
+4. Open the generated public endpoint for port `8080`.
+5. Visit `https://<your-app-domain>/healthz`.
+
+Every container start fetches a small set of public source files from GitHub, because the verifier clears and re-downloads its `/tmp` working directory at startup. No private repositories, model registries, paid provider APIs, GPU devices, host bind mounts, Docker socket access, host networking, external build contexts, `env_file`, or privileged mode are required.
+
+## Environment Variables
+
+No credentials are required for the default verifier.
+
+| Variable | Required | Default | Description |
+| --- | --- | --- | --- |
+| `DEEPSPEED_SOURCE_REF` | No | `v0.19.1` | Public DeepSpeed Git tag, branch, or commit used for source checks. |
+
+If you adapt this template to run real DeepSpeed training or inference, add only the variables required by your selected model, dataset, storage backend, or provider. For gated Hugging Face models, use a required secret or environment variable such as `HF_TOKEN`; do not hardcode real tokens in `docker-compose.yml` or this README.
+
+## Usage Endpoints
+
+The public endpoint exposes JSON on port `8080`:
+
+- `GET /healthz`: Readiness and verifier status. It always returns HTTP `200`; `"ok"` becomes `true` once the source check passes, and an `errors` list is included if a ref, marker, or compile check fails.
+- `GET /demo`: Detailed verifier output, including fetched files, SHA-256 hashes, marker checks, compile checks, and flags confirming that no model, GPU, training, or provider credentials are used.
+- `GET /v1/models`: OpenAI-compatible model-list shape with an empty `data` array because this template does not run an inference server.
+- `GET /`: Same basic payload as `/healthz`.
+
+Example:
+
+```bash
+curl -fsS https://<your-app-domain>/healthz
+curl -fsS https://<your-app-domain>/demo
+curl -fsS https://<your-app-domain>/v1/models
+```
+
+Expected `/demo` fields after the source check completes include:
+
+```json
+{
+  "ok": true,
+  "source_check": {
+    "cpu_only": true,
+    "deepspeed_imported": false,
+    "torch_imported": false,
+    "cuda_required": false,
+    "distributed_training_started": false,
+    "model_downloaded": false,
+    "provider_credentials_required": false
+  }
+}
+```
+
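+The `/v1/models` response intentionally has an empty `data` list (example abridged; the `demo` object also carries `source_ok`, `source_ref`, `model_downloaded`, and `inference_started`):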
+
+```json
+{
+  "object": "list",
+  "data": [],
+  "demo": {
+    "message": "No DeepSpeed model server is running in this CPU-safe source verifier."
+  }
+}
+```
+
+## Verification/Smoke Test
+
+Run from the parent monorepo worktree:
+
+```bash
+python3 templates/validate.py
+git diff --check origin/main...HEAD
+docker compose -f templates/prebuilt/deepspeed/docker-compose.yml config >/dev/null
+```
+
+Optional local runtime check from the parent monorepo worktree:
+
+```bash
+docker compose -f templates/prebuilt/deepspeed/docker-compose.yml up -d
+curl -fsS http://localhost:8080/healthz
+curl -fsS http://localhost:8080/demo
+curl -fsS http://localhost:8080/v1/models
+docker compose -f templates/prebuilt/deepspeed/docker-compose.yml down
+```
+
+A healthy verifier returns `"ok": true` after it downloads the selected files, verifies the expected DeepSpeed markers, and compiles the selected Python files.
+
+## Resource Notes
+
+The default resource profile is intentionally conservative for a Phala Cloud `tdx.small`-style CPU deployment:
+
+- 1 vCPU
+- 2 GiB memory
+- 10 GiB disk
+
+The default container downloads only selected source files into `/tmp` and does not create named volumes. A real DeepSpeed deployment can require substantially more CPU, memory, disk, network bandwidth, GPUs or other accelerators, PyTorch/CUDA-compatible images, distributed job coordination, model checkpoints, and dataset or object-storage access.
+
+## Production Extension Notes
+
+- Replace the verifier with a purpose-built DeepSpeed training, inference, or launcher command only after choosing the model, dataset, checkpoint format, and hardware target.
+- Pin DeepSpeed, PyTorch, CUDA/ROCm, base image, and model versions for reproducibility.
+- Review upstream DeepSpeed installation guidance before enabling ops or JIT extension compilation.
+- Use Phala Cloud secrets or required environment variables for credentials such as `HF_TOKEN`, object storage keys, or provider API keys. Keep placeholder names in examples and never commit real values.
+- Add authentication before exposing real training controls, model inference, logs, or private metadata.
+- Keep host bind mounts, Docker socket mounts, host networking, and privileged mode out of production templates unless there is a reviewed operational reason.
+
+## Security Notes
+
+- The default HTTP verifier is unauthenticated and returns source metadata only.
+- The compose file uses a public image and inline Compose configs only.
+- The compose file does not use host bind mounts, `env_file`, real secrets, privileged mode, host networking, external build contexts, Docker socket access, or GPU device requests.
+- `/v1/models` is a compatibility stub, not proof that a model server is running.
+
+## Upstream Attribution
+
+DeepSpeed is developed by the DeepSpeed Team in the `deepspeedai/DeepSpeed` repository: https://github.com/deepspeedai/DeepSpeed.
+
+This Phala Cloud prebuilt template preserves upstream attribution in the template metadata and README while routing deployable assets through the Phala prebuilt template path: https://github.com/Phala-Network/phala-cloud/tree/main/templates/prebuilt/deepspeed.
+
+The icon saved as `deepspeed.svg` is the upstream DeepSpeed README logo from `docs/assets/images/DeepSpeed_light.svg` in the `deepspeedai/DeepSpeed` repository.
diff --git a/templates/prebuilt/deepspeed/docker-compose.yml b/templates/prebuilt/deepspeed/docker-compose.yml
new file mode 100644
index 00000000..92ec0e05
--- /dev/null
+++ b/templates/prebuilt/deepspeed/docker-compose.yml
@@ -0,0 +1,300 @@
+services:
+  app:
+    image: python:3.12-slim-bookworm
+    ports:
+      - "8080:8080"  # server.py listens on 0.0.0.0:8080
+    environment:
+      DEEPSPEED_SOURCE_REF: ${DEEPSPEED_SOURCE_REF:-v0.19.1}  # fallback matches DEFAULT_REF in server.py
+      PYTHONUNBUFFERED: "1"
+    command:
+      - python
+      - /server.py
+    configs:
+      - source: server_py  # inline script from the top-level configs section
+        target: /server.py
+    healthcheck:
+      test:  # succeeds whenever /healthz answers; that route replies 200 even if the source check failed
+        - CMD
+        - python
+        - -c
+        - import urllib.request; urllib.request.urlopen("http://127.0.0.1:8080/healthz", timeout=5).read()
+      interval: 30s
+      timeout: 10s
+      retries: 3
+      start_period: 30s
+    restart: unless-stopped
+
+configs:
+  server_py:
+    content: |
+      import hashlib
+      import json
+      import os
+      import platform
+      import py_compile
+      import shutil
+      import sys
+      import threading
+      import time
+      import urllib.parse
+      import urllib.request
+      from http.server import BaseHTTPRequestHandler, ThreadingHTTPServer
+      from pathlib import Path
+
+      STARTED_AT = time.time()  # process start; base_payload() derives uptime_seconds from it
+      SOURCE_REPO = "deepspeedai/DeepSpeed"
+      UPSTREAM = f"https://github.com/{SOURCE_REPO}"
+      RAW_BASE = f"https://raw.githubusercontent.com/{SOURCE_REPO}"  # URL prefix used by source_url()
+      DEFAULT_REF = "v0.19.1"
+      SOURCE_REF = os.environ.get("DEEPSPEED_SOURCE_REF", DEFAULT_REF).strip() or DEFAULT_REF  # blank value falls back
+      SOURCE_ROOT = Path("/tmp/deepspeed-source")  # removed and recreated by verify_source()
+      MAX_SOURCE_BYTES = 2 * 1024 * 1024  # 2 MiB per-file cap enforced in fetch_file()
+
+      SOURCE_FILES = [  # per entry: upstream path, purpose text, required marker substrings, py_compile flag
+          {
+              "path": "README.md",
+              "purpose": "Project README and high-level DeepSpeed positioning",
+              "markers": ["Extreme Speed and Scale", "ZeRO", "DeepSpeed"],
+              "compile": False,
+          },
+          {
+              "path": "deepspeed/launcher/runner.py",
+              "purpose": "Distributed launcher front-end source",
+              "markers": ["DeepSpeed runner", "--num_gpus", "PDSHRunner"],
+              "compile": True,
+          },
+          {
+              "path": "deepspeed/runtime/engine.py",
+              "purpose": "DeepSpeed runtime engine source",
+              "markers": ["class DeepSpeedEngine", "def backward", "zero_optimization"],
+              "compile": True,
+          },
+          {
+              "path": "deepspeed/runtime/config.py",
+              "purpose": "DeepSpeed runtime configuration parser source",
+              "markers": ["class DeepSpeedConfig", "train_batch_size", "gradient_accumulation_steps"],
+              "compile": True,
+          },
+          {
+              "path": "deepspeed/inference/engine.py",
+              "purpose": "DeepSpeed inference engine source",
+              "markers": ["class InferenceEngine", "replace_with_kernel_inject", "enable_cuda_graph"],
+              "compile": True,
+          },
+          {
+              "path": "docs/_pages/config-json.md",
+              "purpose": "DeepSpeed JSON configuration documentation",
+              "markers": ["DeepSpeed Configuration JSON", "train_micro_batch_size_per_gpu", "zero_optimization"],
+              "compile": False,
+          },
+          {
+              "path": "docs/_pages/inference.md",
+              "purpose": "DeepSpeed inference documentation",
+              "markers": ["DeepSpeed-Inference", "model parallelism", "inference-customized kernels"],
+              "compile": False,
+          },
+      ]
+
+      STATE_LOCK = threading.Lock()  # guards reads and replacement of CHECK_STATE
+      CHECK_STATE = {  # placeholder served until verify_source() publishes its result
+          "ok": False,
+          "status": "starting",
+          "message": "Source verification has not completed yet.",
+          "ref": SOURCE_REF,
+      }
+
+
+      def source_url(path):
+          # Percent-encode the whole ref, and the path except "/", before joining onto RAW_BASE.
+          ref_part, path_part = urllib.parse.quote(SOURCE_REF, safe=""), urllib.parse.quote(path, safe="/")
+          return "/".join((RAW_BASE, ref_part, path_part))
+
+
+      def fetch_file(spec):
+          """Download one SOURCE_FILES entry into SOURCE_ROOT and describe it.
+
+          Returns size, SHA-256, and marker hits; raises RuntimeError past MAX_SOURCE_BYTES."""
+          rel_path = spec["path"]
+          destination = SOURCE_ROOT / rel_path
+          destination.parent.mkdir(parents=True, exist_ok=True)
+          url = source_url(rel_path)
+          request = urllib.request.Request(url, headers={"User-Agent": "phala-cloud-deepspeed-template/1.0"})
+          with urllib.request.urlopen(request, timeout=30) as reply:
+              payload = reply.read(MAX_SOURCE_BYTES + 1)  # one extra byte exposes an oversized body
+          if len(payload) > MAX_SOURCE_BYTES:
+              raise RuntimeError(f"{rel_path} exceeds {MAX_SOURCE_BYTES} bytes")
+          destination.write_bytes(payload)
+          decoded = payload.decode("utf-8", errors="replace")
+          found = {needle: needle in decoded for needle in spec["markers"]}
+          return {
+              "path": rel_path,
+              "purpose": spec["purpose"],
+              "url": url,
+              "bytes": len(payload),
+              "sha256": hashlib.sha256(payload).hexdigest(),
+              "markers": found,
+              "missing_markers": [needle for needle, hit in found.items() if not hit],
+              "compile": spec["compile"],
+          }
+
+
+      def verify_source():
+          """Run the one-shot source check and publish the result as CHECK_STATE.
+
+          Per-file failures are collected in state["errors"]; the message follows state["ok"].
+          """
+          state = {
+              "ok": False,
+              "status": "checking",
+              "source_repo": SOURCE_REPO,
+              "upstream": UPSTREAM,
+              "ref": SOURCE_REF,
+              "files": [],
+              "compiled": [],
+              "errors": [],
+              "cpu_only": True,
+              "deepspeed_imported": False,
+              "torch_imported": False,
+              "cuda_required": False,
+              "distributed_training_started": False,
+              "model_downloaded": False,
+              "provider_credentials_required": False,
+          }
+          failure_message = (
+              "The HTTP verifier is running, but upstream source verification failed. "
+              "Retry later or set DEEPSPEED_SOURCE_REF to a reachable branch, tag, or commit."
+          )
+
+          try:
+              shutil.rmtree(SOURCE_ROOT, ignore_errors=True)
+              SOURCE_ROOT.mkdir(parents=True, exist_ok=True)
+              for spec in SOURCE_FILES:
+                  try:
+                      result = fetch_file(spec)
+                      state["files"].append(result)
+                      if result["missing_markers"]:
+                          state["errors"].append({
+                              "path": spec["path"],
+                              "error": "Expected source markers were not found",
+                              "missing_markers": result["missing_markers"],
+                          })
+                      if spec["compile"]:
+                          py_compile.compile(str(SOURCE_ROOT / spec["path"]), doraise=True)
+                          state["compiled"].append(spec["path"])
+                  except Exception as exc:  # record the failure and keep checking the remaining files
+                      state["errors"].append({"path": spec["path"], "error": f"{type(exc).__name__}: {exc}"})
+              state["ok"] = not state["errors"]
+              state["status"] = "ready" if state["ok"] else "source_check_failed"
+              state["message"] = failure_message if not state["ok"] else (
+                  "Downloaded selected upstream DeepSpeed source and documentation files, "
+                  "verified launcher/runtime/inference/config markers, and py_compile checked "
+                  "selected Python source files. The demo did not import deepspeed, import torch, "
+                  "download model weights, start distributed training, or request CUDA/GPU access."
+              )
+          except Exception as exc:
+              state["status"] = "source_check_failed"
+              state["errors"].append({"error": f"{type(exc).__name__}: {exc}"})
+              state["message"] = failure_message
+
+          with STATE_LOCK:
+              global CHECK_STATE
+              CHECK_STATE = state
+
+
+      def current_state():
+          with STATE_LOCK:  # hold the lock only while copying
+              return json.loads(json.dumps(CHECK_STATE))  # JSON round-trip returns a detached copy
+
+
+      def base_payload():
+          """Return the identity and runtime fields shared by the /healthz and /demo payloads."""
+          scope_note = (
+              "CPU-safe source/runtime verifier. It is not a DeepSpeed training, "
+              "inference, or distributed launcher server."
+          )
+          common = dict(service="deepspeed-source-verifier", display_name="deepspeedai/DeepSpeed")
+          common["upstream"] = UPSTREAM
+          common["python"] = sys.version.split()[0]
+          common["platform"] = platform.platform()
+          common["uptime_seconds"] = round(time.time() - STARTED_AT, 3)
+          common["demo_scope"] = scope_note
+          return common
+
+
+      class Handler(BaseHTTPRequestHandler):
+          """GET-only JSON handler for the verifier endpoints.
+
+          Serves /, /healthz, /demo, and /v1/models; every other path gets a JSON 404.
+          """
+
+          server_version = "deepspeed-source-verifier/1.0"
+
+          def log_message(self, fmt, *args):
+              print("%s - %s" % (self.address_string(), fmt % args), flush=True)
+
+          def respond_json(self, status, payload):
+              """Send payload as key-sorted JSON with an explicit Content-Length."""
+              encoded = json.dumps(payload, sort_keys=True).encode("utf-8")
+              self.send_response(status)
+              self.send_header("Content-Type", "application/json")
+              self.send_header("Content-Length", str(len(encoded)))
+              self.end_headers()
+              self.wfile.write(encoded)
+
+          def do_GET(self):
+              """Build the payload for the requested route from one snapshot of the verifier state."""
+              route = urllib.parse.urlparse(self.path).path.rstrip("/") or "/"
+              snapshot = current_state()
+              source_ok = snapshot.get("ok") is True
+              source_ref = snapshot.get("ref", SOURCE_REF)
+
+              if route in ("/", "/healthz"):
+                  status, payload = 200, base_payload()
+                  payload.update({
+                      "ok": source_ok,
+                      "status": snapshot.get("status", "unknown"),
+                      "source_ref": source_ref,
+                      "cpu_only": True,
+                      "cuda_required": False,
+                      "model_downloaded": False,
+                      "distributed_training_started": False,
+                      "provider_credentials_required": False,
+                      "deepspeed_imported": False,
+                      "endpoints": ["/healthz", "/demo", "/v1/models"],
+                  })
+                  if snapshot.get("errors"):
+                      payload["errors"] = snapshot["errors"]
+              elif route == "/demo":
+                  status, payload = 200, base_payload()
+                  payload["ok"] = source_ok
+                  payload["check"] = (
+                      "Fetch a pinned DeepSpeed ref from GitHub, verify source markers "
+                      "for launcher/runtime/inference/config concepts, and compile selected "
+                      "Python source files without importing DeepSpeed."
+                  )
+                  payload["source_check"] = snapshot
+              elif route == "/v1/models":
+                  status = 200
+                  payload = {
+                      "object": "list",
+                      "data": [],
+                      "demo": {
+                          "message": "No DeepSpeed model server is running in this CPU-safe source verifier.",
+                          "source_ok": source_ok,
+                          "source_ref": source_ref,
+                          "model_downloaded": False,
+                          "inference_started": False,
+                      },
+                  }
+                  if snapshot.get("errors"):
+                      payload["errors"] = snapshot["errors"]
+              else:
+                  status, payload = 404, {"ok": False, "error": "not found"}
+
+              self.respond_json(status, payload)
+
+
+      threading.Thread(target=verify_source, daemon=True).start()  # run the source check in the background
+      server = ThreadingHTTPServer(("0.0.0.0", 8080), Handler)  # created before the "listening" line is printed
+      print("deepspeed source verifier listening on 0.0.0.0:8080", flush=True)
+      server.serve_forever()