Skip to content

Commit 4062b5f

Browse files
committed
Slurm jobs are working well.
1 parent fe2dab8 commit 4062b5f

File tree

2 files changed

+20
-14
lines changed

2 files changed

+20
-14
lines changed

llumnix_slurm_job.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55
#SBATCH --time=02:00:00
66
#SBATCH --array=0-119
77
#SBATCH --cpus-per-task=4
8-
#SBATCH --mem=32G
8+
#SBATCH --mem=24G
99
#SBATCH --output=logs/test_%A_%a.out
1010
#SBATCH --error=logs/test_%A_%a.err
1111

vidur/metrics/latency_config.py

Lines changed: 19 additions & 13 deletions
Original file line numberDiff line numberDiff line change
@@ -25,7 +25,7 @@
2525
"--zipf_request_length_generator_config_min_tokens 64",
2626
"--zipf_request_length_generator_config_prefill_to_decode_ratio 2.0",
2727
"--interval_generator_config_type poisson",
28-
"--poisson_request_interval_generator_config_qps 100",
28+
"--poisson_request_interval_generator_config_qps 1250",
2929
"--llumlet_scheduler_config_num_blocks 128",
3030
"--llumlet_scheduler_config_block_size 16",
3131
"--llumlet_scheduler_config_batch_size_cap 64",
@@ -55,12 +55,13 @@ def cmd_with_overrides(*overrides: str) -> str:
5555
"description": "Baseline with migration enabled at nominal 100 QPS.",
5656
"cmd": cmd_with_overrides(),
5757
},
58-
5958
# Test Type 1: Migration & Load Balancing Sensitivity
6059
{
6160
"name": "migration_disabled",
6261
"description": "Migration disabled to evaluate imbalance and preemption without rescheduling.",
63-
"cmd": cmd_with_overrides("--no-llumnix_global_scheduler_config_enable_migration"),
62+
"cmd": cmd_with_overrides(
63+
"--no-llumnix_global_scheduler_config_enable_migration"
64+
),
6465
},
6566
{
6667
"name": "rebalance_aggressive",
@@ -70,7 +71,6 @@ def cmd_with_overrides(*overrides: str) -> str:
7071
"--llumnix_global_scheduler_config_load_imbalance_threshold 0.1",
7172
),
7273
},
73-
7474
# Test Type 2: KV Capacity & Fragmentation Stress
7575
{
7676
"name": "kv_capacity_tight",
@@ -83,18 +83,18 @@ def cmd_with_overrides(*overrides: str) -> str:
8383
]
8484

8585
PRIORITY_DISTRIBUTIONS = [
86-
#{"type": 1, "slug": "round_robin", "name": "ROUND_ROBIN"},
86+
# {"type": 1, "slug": "round_robin", "name": "ROUND_ROBIN"},
8787
{"type": 2, "slug": "uniform", "name": "UNIFORM"},
8888
{"type": 3, "slug": "normal", "name": "NORMAL"},
8989
{"type": 4, "slug": "power_law", "name": "POWER_LAW"},
90-
#{"type": 5, "slug": "enterprise", "name": "ENTERPRISE"},
91-
#{"type": 6, "slug": "burstier", "name": "BURSTIER"},
92-
#{"type": 7, "slug": "time_of_day", "name": "TIME_OF_DAY"},
93-
#{"type": 8, "slug": "traffic_class", "name": "TRAFFIC_CLASS"},
90+
# {"type": 5, "slug": "enterprise", "name": "ENTERPRISE"},
91+
# {"type": 6, "slug": "burstier", "name": "BURSTIER"},
92+
# {"type": 7, "slug": "time_of_day", "name": "TIME_OF_DAY"},
93+
# {"type": 8, "slug": "traffic_class", "name": "TRAFFIC_CLASS"},
9494
]
9595

9696
PRIORITY_LEVELS = [1, 2, 3, 4, 5]
97-
REQUEST_COUNTS = [500, 2000]
97+
REQUEST_COUNTS = [10000, 15000]
9898

9999

100100
def _apply_priority_distribution(cmd: str, dist_type: int) -> str:
@@ -110,7 +110,9 @@ def _apply_priority_distribution(cmd: str, dist_type: int) -> str:
110110
skip = True
111111
continue
112112
filtered.append(tok)
113-
filtered.append(f"--synthetic_request_generator_config_priority_distribution_type {dist_type}")
113+
filtered.append(
114+
f"--synthetic_request_generator_config_priority_distribution_type {dist_type}"
115+
)
114116
return " ".join(filtered)
115117

116118

@@ -130,8 +132,12 @@ def _apply_priority_levels(cmd: str, num_levels: int) -> str:
130132
skip = True
131133
continue
132134
filtered.append(tok)
133-
filtered.append(f"--llumnix_global_scheduler_config_num_priority_levels {num_levels}")
134-
filtered.append(f"--synthetic_request_generator_config_num_priority_levels {num_levels}")
135+
filtered.append(
136+
f"--llumnix_global_scheduler_config_num_priority_levels {num_levels}"
137+
)
138+
filtered.append(
139+
f"--synthetic_request_generator_config_num_priority_levels {num_levels}"
140+
)
135141
return " ".join(filtered)
136142

137143

0 commit comments

Comments
 (0)