Skip to content

Commit 134446a

Browse files
committed
Add FP8 disaggregated-serving test for DeepSeek-V3-Lite (context TP2, generation TP1/CP2 with Helix)
1 parent 50436a1 commit 134446a

File tree

2 files changed

+44
-0
lines changed

2 files changed

+44
-0
lines changed
Lines changed: 40 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,40 @@
1+
hostname: localhost
2+
port: 8000
3+
model: DeepSeek-V3-Lite/fp8
4+
free_gpu_memory_fraction: 0.25
5+
backend: "pytorch"
6+
disable_overlap_scheduler: True
7+
cuda_graph_config: null
8+
context_servers:
9+
num_instances: 1
10+
enable_chunked_prefill: False
11+
kv_cache_config:
12+
enable_block_reuse: False
13+
enable_partial_reuse: False
14+
moe_config:
15+
backend: DEEPGEMM
16+
tensor_parallel_size: 2
17+
pipeline_parallel_size: 1
18+
cache_transceiver_config:
19+
backend: "UCX"
20+
max_tokens_in_buffer: 4096
21+
urls:
22+
- "localhost:8001"
23+
generation_servers:
24+
num_instances: 1
25+
tensor_parallel_size: 1
26+
pipeline_parallel_size: 1
27+
context_parallel_size: 2
28+
cp_config:
29+
cp_type: helix
30+
enable_chunked_prefill: False
31+
kv_cache_config:
32+
enable_block_reuse: False
33+
enable_partial_reuse: False
34+
cache_transceiver_config:
35+
backend: "UCX"
36+
max_tokens_in_buffer: 4096
37+
moe_config:
38+
backend: DEEPGEMM
39+
urls:
40+
- "localhost:8002"

tests/integration/defs/disaggregated/test_disaggregated.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -271,6 +271,10 @@ def get_test_config(test_desc, example_dir, test_root):
271271
(4,
272272
f"{test_configs_root}/disagg_config_ctxtp2_gentp1cp2_deepseek_v3_lite_bf16_tllm_gen.yaml"
273273
),
274+
"deepseek_v3_lite_fp8_tllm_gen_helix":
275+
(4,
276+
f"{test_configs_root}/disagg_config_ctxtp2_gentp1cp2_deepseek_v3_lite_fp8_tllm_gen.yaml"
277+
),
274278
}
275279

276280
if test_desc not in config_map:

0 commit comments

Comments
 (0)