File tree Expand file tree Collapse file tree 3 files changed +7
-5
lines changed Expand file tree Collapse file tree 3 files changed +7
-5
lines changed Original file line number Diff line number Diff line change @@ -20,6 +20,6 @@ public class InferenceOptions
20
20
public IReadOnlyList < string > AntiPrompts { get ; set ; } = Array . Empty < string > ( ) ;
21
21
22
22
/// <inheritdoc />
23
- public required ISamplingPipeline SamplingPipeline { get ; set ; }
23
+ public ISamplingPipeline SamplingPipeline { get ; set ; } = new DefaultSamplingPipeline ( ) ;
24
24
}
25
25
}
Original file line number Diff line number Diff line change 3
3
"Logging" : {
4
4
"LogLevel" : {
5
5
"Default" : " Information" ,
6
- "Microsoft.AspNetCore" : " Warning"
6
+ "Microsoft.AspNetCore" : " Warning" ,
7
+ "Microsoft.AspNetCore.SignalR" : " Debug" ,
8
+ "Microsoft.AspNetCore.Http.Connections" : " Debug"
7
9
}
8
10
}
9
11
}
Original file line number Diff line number Diff line change 10
10
"ModelLoadType" : 0 ,
11
11
"Models" : [
12
12
{
13
- "Name" : " Example LLama2-7b-Chat " ,
13
+ "Name" : " Example LLava-v1.6-mistral " ,
14
14
"MaxInstances" : 20 ,
15
- "ModelPath" : " ..\\ LLama.Unittest\\ Models\\ llama-2-7b-chat.Q4_0 .gguf" ,
15
+ "ModelPath" : " ..\\ LLama.Unittest\\ Models\\ llava-v1.6-mistral-7b.Q3_K_XS .gguf" ,
16
16
"ContextSize" : 2048 ,
17
17
"BatchSize" : 2048 ,
18
18
"Threads" : 4 ,
19
- "GpuLayerCount" : 6 ,
19
+ "GpuLayerCount" : 32 ,
20
20
"UseMemorymap" : true ,
21
21
"UseMemoryLock" : false ,
22
22
"MainGpu" : 0 ,
You can’t perform that action at this time.
0 commit comments