lmstudio-ai
diff --git a/src/lmstudio/async_api.py b/src/lmstudio/async_api.py
Lines changed: 24 additions & 0 deletions
diff --git a/src/lmstudio/json_api.py b/src/lmstudio/json_api.py
Lines changed: 13 additions & 0 deletions
@@ -1018,6 +1018,7 @@ async def _complete_stream(
         *,
         response_format: Literal[None] = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1031,6 +1032,7 @@ async def _complete_stream(
         *,
         response_format: Type[ModelSchema] | DictSchema = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1043,6 +1045,7 @@ async def _complete_stream(
         *,
         response_format: Type[ModelSchema] | DictSchema | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset: str | None = None,
         on_message: PredictionMessageCallback | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
@@ -1057,6 +1060,7 @@ async def _complete_stream(
             prompt,
             response_format,
             config,
+            preset,
             on_message,
             on_first_token,
             on_prediction_fragment,
@@ -1074,6 +1078,7 @@ async def _respond_stream(
         *,
         response_format: Literal[None] = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1087,6 +1092,7 @@ async def _respond_stream(
         *,
         response_format: Type[ModelSchema] | DictSchema = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1100,6 +1106,7 @@ async def _respond_stream(
         response_format: Type[ModelSchema] | DictSchema | None = None,
         on_message: PredictionMessageCallback | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset: str | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
         on_prompt_processing_progress: PromptProcessingCallback | None = None,
@@ -1115,6 +1122,7 @@ async def _respond_stream(
             history,
             response_format,
             config,
+            preset,
             on_message,
             on_first_token,
             on_prediction_fragment,
@@ -1248,6 +1256,7 @@ async def complete_stream(
         *,
         response_format: Literal[None] = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1260,6 +1269,7 @@ async def complete_stream(
         *,
         response_format: Type[ModelSchema] | DictSchema = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1272,6 +1282,7 @@ async def complete_stream(
         *,
         response_format: Type[ModelSchema] | DictSchema | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset: str | None = None,
         on_message: PredictionMessageCallback | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
@@ -1286,6 +1297,7 @@ async def complete_stream(
             prompt,
             response_format=response_format,
             config=config,
+            preset=preset,
             on_message=on_message,
             on_first_token=on_first_token,
             on_prediction_fragment=on_prediction_fragment,
@@ -1299,6 +1311,7 @@ async def complete(
         *,
         response_format: Literal[None] = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1311,6 +1324,7 @@ async def complete(
         *,
         response_format: Type[ModelSchema] | DictSchema = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1323,6 +1337,7 @@ async def complete(
         *,
         response_format: Type[ModelSchema] | DictSchema | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset: str | None = None,
         on_message: PredictionMessageCallback | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
@@ -1337,6 +1352,7 @@ async def complete(
             prompt,
             response_format=response_format,
             config=config,
+            preset=preset,
             on_message=on_message,
             on_first_token=on_first_token,
             on_prediction_fragment=on_prediction_fragment,
@@ -1355,6 +1371,7 @@ async def respond_stream(
         *,
         response_format: Literal[None] = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1367,6 +1384,7 @@ async def respond_stream(
         *,
         response_format: Type[ModelSchema] | DictSchema = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1379,6 +1397,7 @@ async def respond_stream(
         *,
         response_format: Type[ModelSchema] | DictSchema | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset: str | None = None,
         on_message: PredictionMessageCallback | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
@@ -1393,6 +1412,7 @@ async def respond_stream(
             history,
             response_format=response_format,
             config=config,
+            preset=preset,
             on_message=on_message,
             on_first_token=on_first_token,
             on_prediction_fragment=on_prediction_fragment,
@@ -1406,6 +1426,7 @@ async def respond(
         *,
         response_format: Literal[None] = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1418,6 +1439,7 @@ async def respond(
         *,
         response_format: Type[ModelSchema] | DictSchema = ...,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = ...,
+        preset: str | None = ...,
         on_message: PredictionMessageCallback | None = ...,
         on_first_token: PredictionFirstTokenCallback | None = ...,
         on_prediction_fragment: PredictionFragmentCallback | None = ...,
@@ -1430,6 +1452,7 @@ async def respond(
         *,
         response_format: Type[ModelSchema] | DictSchema | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset: str | None = None,
         on_message: PredictionMessageCallback | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
@@ -1444,6 +1467,7 @@ async def respond(
             history,
             response_format=response_format,
             config=config,
+            preset=preset,
             on_message=on_message,
             on_first_token=on_first_token,
             on_prediction_fragment=on_prediction_fragment,
 
@@ -151,6 +151,7 @@
     "LMStudioChannelClosedError",
     "LMStudioModelNotFoundError",
     "LMStudioPredictionError",
+    "LMStudioPresetNotFoundError",
     "LMStudioServerError",
     "LMStudioUnknownMessageError",
     "LMStudioWebsocketError",
@@ -371,6 +372,8 @@ def from_details(message: str, details: DictObject) -> "LMStudioServerError":
             match display_data:
                 case {"code": "generic.noModelMatchingQuery"}:
                     specific_error = LMStudioModelNotFoundError(str(default_error))
+                case {"code": "generic.presetNotFound"}:
+                    specific_error = LMStudioPresetNotFoundError(str(default_error))
             if specific_error is not None:
                 specific_error._raw_error = default_error._raw_error
                 specific_error.server_error = default_error.server_error
@@ -383,6 +386,11 @@ class LMStudioModelNotFoundError(LMStudioServerError):
     """No model matching the given specifier could be located on the server."""
 
 
+@sdk_public_type
+class LMStudioPresetNotFoundError(LMStudioServerError):
+    """No preset config matching the given identifier could be located on the server."""
+
+
 @sdk_public_type
 class LMStudioChannelClosedError(LMStudioServerError):
     """Streaming channel unexpectedly closed by the LM Studio instance."""
@@ -1116,6 +1124,7 @@ def __init__(
         history: Chat,
         response_format: Type[ModelSchema] | DictSchema | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset_config: str | None = None,
         on_message: PredictionMessageCallback | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
@@ -1152,6 +1161,8 @@ def __init__(
                 "predictionConfigStack": config_stack.to_dict(),
             }
         )
+        if preset_config is not None:
+            params.fuzzy_preset_identifier = preset_config
         super().__init__(params)
         # Status tracking for the prediction progress and result reporting
         self._is_cancelled = False
@@ -1376,6 +1387,7 @@ def __init__(
         prompt: str,
         response_format: Type[ModelSchema] | DictSchema | None = None,
         config: LlmPredictionConfig | LlmPredictionConfigDict | None = None,
+        preset_config: str | None = None,
         on_message: PredictionMessageCallback | None = None,
         on_first_token: PredictionFirstTokenCallback | None = None,
         on_prediction_fragment: PredictionFragmentCallback | None = None,
@@ -1389,6 +1401,7 @@ def __init__(
             history,
             response_format,
             config,
+            preset_config,
             on_message,
             on_first_token,
             on_prediction_fragment,