@@ -3577,26 +3577,28 @@ def onready_subprocess():
3577
3577
s_pp = float (benchmaxctx - benchlen )/ t_pp
3578
3578
s_gen = float (benchlen )/ t_gen
3579
3579
datetimestamp = datetime .now (timezone .utc )
3580
+ benchflagstr = f"NoAVX2={ args .noavx2 } Threads={ args .threads } HighPriority={ args .highpriority } NoBlas={ args .noblas } Cublas_Args={ args .usecublas } Tensor_Split={ args .tensor_split } BlasThreads={ args .blasthreads } BlasBatchSize={ args .blasbatchsize } FlashAttention={ args .flashattention } KvCache={ args .quantkv } "
3580
3581
print (f"\n Benchmark Completed - v{ KcppVersion } Results:\n ======" )
3582
+ print (f"Flags: { benchflagstr } " )
3581
3583
print (f"Timestamp: { datetimestamp } " )
3582
3584
print (f"Backend: { libname } " )
3583
3585
print (f"Layers: { args .gpulayers } " )
3584
3586
print (f"Model: { benchmodel } " )
3585
3587
print (f"MaxCtx: { benchmaxctx } " )
3586
3588
print (f"GenAmount: { benchlen } \n -----" )
3587
- print (f"ProcessingTime: { t_pp :.2f } s" )
3589
+ print (f"ProcessingTime: { t_pp :.3f } s" )
3588
3590
print (f"ProcessingSpeed: { s_pp :.2f} T/s" )
3589
- print (f"GenerationTime: { t_gen :.2f } s" )
3591
+ print (f"GenerationTime: { t_gen :.3f } s" )
3590
3592
print (f"GenerationSpeed: { s_gen :.2f} T/s" )
3591
- print (f"TotalTime: { (t_pp + t_gen ):.2f } s" )
3593
+ print (f"TotalTime: { (t_pp + t_gen ):.3f } s" )
3592
3594
print (f"Output: { result } \n -----" )
3593
3595
if save_to_file :
3594
3596
try :
3595
3597
with open (args .benchmark , "a" ) as file :
3596
3598
file .seek (0 , 2 )
3597
3599
if file .tell () == 0 : #empty file
3598
- file .write (f"Timestamp,Backend,Layers,Model,MaxCtx,GenAmount,ProcessingTime,ProcessingSpeed,GenerationTime,GenerationSpeed,TotalTime,Output" )
3599
- file .write (f"\n { datetimestamp } ,{ libname } ,{ args .gpulayers } ,{ benchmodel } ,{ benchmaxctx } ,{ benchlen } ,{ t_pp :.2f} ,{ s_pp :.2f} ,{ t_gen :.2f} ,{ s_gen :.2f} ,{ (t_pp + t_gen ):.2f} ,{ result } " )
3600
+ file .write (f"Timestamp,Backend,Layers,Model,MaxCtx,GenAmount,ProcessingTime,ProcessingSpeed,GenerationTime,GenerationSpeed,TotalTime,Output,Flags " )
3601
+ file .write (f"\n { datetimestamp } ,{ libname } ,{ args .gpulayers } ,{ benchmodel } ,{ benchmaxctx } ,{ benchlen } ,{ t_pp :.2f} ,{ s_pp :.2f} ,{ t_gen :.2f} ,{ s_gen :.2f} ,{ (t_pp + t_gen ):.2f} ,{ result } , { benchflagstr } " )
3600
3602
except Exception as e :
3601
3603
print (f"Error writing benchmark to file: { e } " )
3602
3604
global using_gui_launcher
0 commit comments