2525 "--zipf_request_length_generator_config_min_tokens 64" ,
2626 "--zipf_request_length_generator_config_prefill_to_decode_ratio 2.0" ,
2727 "--interval_generator_config_type poisson" ,
28- "--poisson_request_interval_generator_config_qps 100 " ,
28+ "--poisson_request_interval_generator_config_qps 1250 " ,
2929 "--llumlet_scheduler_config_num_blocks 128" ,
3030 "--llumlet_scheduler_config_block_size 16" ,
3131 "--llumlet_scheduler_config_batch_size_cap 64" ,
@@ -55,12 +55,13 @@ def cmd_with_overrides(*overrides: str) -> str:
5555 "description" : "Baseline with migration enabled at nominal 100 QPS." ,
5656 "cmd" : cmd_with_overrides (),
5757 },
58-
5958 # Test Type 1: Migration & Load Balancing Sensitivity
6059 {
6160 "name" : "migration_disabled" ,
6261 "description" : "Migration disabled to evaluate imbalance and preemption without rescheduling." ,
63- "cmd" : cmd_with_overrides ("--no-llumnix_global_scheduler_config_enable_migration" ),
62+ "cmd" : cmd_with_overrides (
63+ "--no-llumnix_global_scheduler_config_enable_migration"
64+ ),
6465 },
6566 {
6667 "name" : "rebalance_aggressive" ,
@@ -70,7 +71,6 @@ def cmd_with_overrides(*overrides: str) -> str:
7071 "--llumnix_global_scheduler_config_load_imbalance_threshold 0.1" ,
7172 ),
7273 },
73-
7474 # Test Type 2: KV Capacity & Fragmentation Stress
7575 {
7676 "name" : "kv_capacity_tight" ,
@@ -83,18 +83,18 @@ def cmd_with_overrides(*overrides: str) -> str:
8383]
8484
# Priority distributions included in the sweep. Each entry is a dict with a
# numeric "type", a lowercase "slug", and an uppercase "name".
# Only types 2 (uniform), 3 (normal) and 4 (power_law) are active; the entries
# for types 1 and 5-8 are commented out.
# NOTE(review): "type" is presumably the value passed as `dist_type` to
# _apply_priority_distribution, and "slug" presumably names output artifacts —
# confirm against the code that iterates this list.
8585PRIORITY_DISTRIBUTIONS = [
86- #{"type": 1, "slug": "round_robin", "name": "ROUND_ROBIN"},
86+ # {"type": 1, "slug": "round_robin", "name": "ROUND_ROBIN"},
8787 {"type" : 2 , "slug" : "uniform" , "name" : "UNIFORM" },
8888 {"type" : 3 , "slug" : "normal" , "name" : "NORMAL" },
8989 {"type" : 4 , "slug" : "power_law" , "name" : "POWER_LAW" },
90- #{"type": 5, "slug": "enterprise", "name": "ENTERPRISE"},
91- #{"type": 6, "slug": "burstier", "name": "BURSTIER"},
92- #{"type": 7, "slug": "time_of_day", "name": "TIME_OF_DAY"},
93- #{"type": 8, "slug": "traffic_class", "name": "TRAFFIC_CLASS"},
90+ # {"type": 5, "slug": "enterprise", "name": "ENTERPRISE"},
91+ # {"type": 6, "slug": "burstier", "name": "BURSTIER"},
92+ # {"type": 7, "slug": "time_of_day", "name": "TIME_OF_DAY"},
93+ # {"type": 8, "slug": "traffic_class", "name": "TRAFFIC_CLASS"},
9494]
9595
# Sweep axes defined as module-level lists.
# NOTE(review): PRIORITY_LEVELS values are presumably passed as `num_levels`
# to _apply_priority_levels, and REQUEST_COUNTS presumably sets the number of
# requests per run — confirm against the code that consumes these lists.
# REQUEST_COUNTS appears twice because this text is a diff: the `-` line is
# the previous value and the `+` line is the new one.
9696PRIORITY_LEVELS = [1 , 2 , 3 , 4 , 5 ]
97- REQUEST_COUNTS = [500 , 2000 ]
97+ REQUEST_COUNTS = [10000 , 15000 ]
9898
9999
100100def _apply_priority_distribution (cmd : str , dist_type : int ) -> str :
@@ -110,7 +110,9 @@ def _apply_priority_distribution(cmd: str, dist_type: int) -> str:
110110 skip = True
111111 continue
112112 filtered .append (tok )
113- filtered .append (f"--synthetic_request_generator_config_priority_distribution_type { dist_type } " )
113+ filtered .append (
114+ f"--synthetic_request_generator_config_priority_distribution_type { dist_type } "
115+ )
114116 return " " .join (filtered )
115117
116118
@@ -130,8 +132,12 @@ def _apply_priority_levels(cmd: str, num_levels: int) -> str:
130132 skip = True
131133 continue
132134 filtered .append (tok )
133- filtered .append (f"--llumnix_global_scheduler_config_num_priority_levels { num_levels } " )
134- filtered .append (f"--synthetic_request_generator_config_num_priority_levels { num_levels } " )
135+ filtered .append (
136+ f"--llumnix_global_scheduler_config_num_priority_levels { num_levels } "
137+ )
138+ filtered .append (
139+ f"--synthetic_request_generator_config_num_priority_levels { num_levels } "
140+ )
135141 return " " .join (filtered )
136142
137143
0 commit comments