@@ -110,7 +110,7 @@ def __init__(self,
110
110
ttl : int = 900 ,
111
111
min_load_score : float = 3 ,
112
112
max_model_len : int = 8192 ,
113
- load_shrads_num : int = 1 ,
113
+ load_shards_num : int = 1 ,
114
114
enable_chunked_prefill : bool = False ,
115
115
max_num_partial_prefills : int = 1 ,
116
116
max_long_partial_prefills : int = 1 ,
@@ -129,7 +129,7 @@ def __init__(self,
129
129
ttl: Time-to-live in seconds for Redis keys (default 900s)
130
130
min_load_score: Minimum load score for task assignment (default 3)
131
131
max_model_len: Maximum model context length in tokens
132
- load_shrads_num : Number of load balancing shards
132
+ load_shards_num: Number of load balancing shards
133
133
enable_chunked_prefill: Whether to enable chunked prefill processing
134
134
max_num_partial_prefills: Max partial prefill operations allowed
135
135
max_long_partial_prefills: Max long-running partial prefill ops
@@ -147,7 +147,7 @@ def __init__(self,
147
147
self .topic = topic
148
148
self .ttl = ttl
149
149
self .min_load_score = min_load_score
150
- self .load_shrads_num = load_shrads_num
150
+ self .load_shards_num = load_shards_num
151
151
152
152
self .max_model_len = max_model_len
153
153
self .enable_chunked_prefill = enable_chunked_prefill
@@ -169,8 +169,8 @@ def check(self):
169
169
raise ValueError ("ttl should be greater than 60" )
170
170
if self .min_load_score < 1 :
171
171
raise ValueError ("min_load_score should be greater than 0" )
172
- if self .load_shrads_num < 1 :
173
- raise ValueError ("load_shrads_num should be greater than 0" )
172
+ if self .load_shards_num < 1 :
173
+ raise ValueError ("load_shards_num should be greater than 0" )
174
174
175
175
r = redis .Redis (self .host , self .port , self .db , self .password )
176
176
try :
@@ -262,7 +262,7 @@ def scheduler(self):
262
262
topic = self .config .topic ,
263
263
ttl = self .config .ttl ,
264
264
min_load_score = self .config .min_load_score ,
265
- load_shrads_num = self .config .load_shrads_num ,
265
+ load_shards_num = self .config .load_shards_num ,
266
266
enable_chunked_prefill = self .config .enable_chunked_prefill ,
267
267
max_num_partial_prefills = self .config .max_num_partial_prefills ,
268
268
max_long_partial_prefills = self .config .max_long_partial_prefills ,
0 commit comments