File tree Expand file tree Collapse file tree 2 files changed +12
-3
lines changed Expand file tree Collapse file tree 2 files changed +12
-3
lines changed Original file line number Diff line number Diff line change 1
1
[tool .poetry ]
2
2
name = " truss"
3
- version = " 0.9.81rc001 "
3
+ version = " 0.9.81rc003 "
4
4
description = " A seamless bridge from model development to model delivery"
5
5
license = " MIT"
6
6
readme = " README.md"
Original file line number Diff line number Diff line change @@ -600,11 +600,20 @@ def trt_llm_validation(config: "TrussConfig") -> "TrussConfig":
600
600
"FP8 quantization is only supported on L4, H100, H200 "
601
601
"accelerators or newer (CUDA_COMPUTE>=89)"
602
602
)
603
- tensor_parallel_count = config .trt_llm .build .tensor_parallel_count
603
+ world_size = (
604
+ config .trt_llm .build .tensor_parallel_count
605
+ * config .trt_llm .build .pipeline_parallel_count
606
+ * config .trt_llm .build .sequence_parallel_count
607
+ )
604
608
605
- if tensor_parallel_count != config .resources .accelerator .count :
609
+ if world_size != config .resources .accelerator .count :
606
610
raise ValueError (
607
611
"Tensor parallelism and GPU count must be the same for TRT-LLM. "
612
+ f"You have set tensor_parallel_count={ config .trt_llm .build .tensor_parallel_count } , "
613
+ f"pipeline_parallel_count={ config .trt_llm .build .pipeline_parallel_count } , "
614
+ f"sequence_parallel_count={ config .trt_llm .build .sequence_parallel_count } "
615
+ f"== world_size->{ world_size } "
616
+ f"and accelerator.count={ config .resources .accelerator .count } . "
608
617
)
609
618
610
619
return config
You can’t perform that action at this time.
0 commit comments