added "minimal" reasoning option (better for coding)
This commit is contained in:
@@ -93,7 +93,7 @@ curl http://127.0.0.1:8000/v1/chat/completions \
|
|||||||
|
|
||||||
### Thinking effort
|
### Thinking effort
|
||||||
|
|
||||||
- `--reasoning-effort` (choice of low,medium,high)<br>
|
- `--reasoning-effort` (choice of minimal,low,medium,high)<br>
|
||||||
GPT-5 has a configurable amount of "effort" it can put into thinking, which may cause it to take more time for a response to return, but may overall give a smarter answer. Applying this parameter after `serve` forces the server to use this reasoning effort by default, unless overridden by the API request with a different effort set. The default reasoning effort without setting this parameter is `medium`.
|
GPT-5 has a configurable amount of "effort" it can put into thinking, which may cause it to take more time for a response to return, but may overall give a smarter answer. Applying this parameter after `serve` forces the server to use this reasoning effort by default, unless overridden by the API request with a different effort set. The default reasoning effort without setting this parameter is `medium`.
|
||||||
|
|
||||||
### Thinking summaries
|
### Thinking summaries
|
||||||
|
|||||||
@@ -85,7 +85,7 @@ def main() -> None:
|
|||||||
)
|
)
|
||||||
p_serve.add_argument(
|
p_serve.add_argument(
|
||||||
"--reasoning-effort",
|
"--reasoning-effort",
|
||||||
choices=["low", "medium", "high", "none"],
|
choices=["minimal", "low", "medium", "high"],
|
||||||
default=os.getenv("CHATGPT_LOCAL_REASONING_EFFORT", "medium").lower(),
|
default=os.getenv("CHATGPT_LOCAL_REASONING_EFFORT", "medium").lower(),
|
||||||
help="Reasoning effort level for Responses API (default: medium)",
|
help="Reasoning effort level for Responses API (default: medium)",
|
||||||
)
|
)
|
||||||
|
|||||||
@@ -9,7 +9,7 @@ def build_reasoning_param(
|
|||||||
effort = (base_effort or "").strip().lower()
|
effort = (base_effort or "").strip().lower()
|
||||||
summary = (base_summary or "").strip().lower()
|
summary = (base_summary or "").strip().lower()
|
||||||
|
|
||||||
valid_efforts = {"low", "medium", "high", "none"}
|
valid_efforts = {"minimal", "low", "medium", "high"}
|
||||||
valid_summaries = {"auto", "concise", "detailed", "none"}
|
valid_summaries = {"auto", "concise", "detailed", "none"}
|
||||||
|
|
||||||
if isinstance(overrides, dict):
|
if isinstance(overrides, dict):
|
||||||
|
|||||||
@@ -58,7 +58,7 @@ def start_upstream_request(
|
|||||||
return None, resp
|
return None, resp
|
||||||
|
|
||||||
include: List[str] = []
|
include: List[str] = []
|
||||||
if isinstance(reasoning_param, dict) and reasoning_param.get("effort") != "none":
|
if isinstance(reasoning_param, dict):
|
||||||
include.append("reasoning.encrypted_content")
|
include.append("reasoning.encrypted_content")
|
||||||
|
|
||||||
client_session_id = None
|
client_session_id = None
|
||||||
|
|||||||
2
gui.py
2
gui.py
@@ -298,7 +298,7 @@ class MainWindow(QtWidgets.QMainWindow):
|
|||||||
opts.setVerticalSpacing(8)
|
opts.setVerticalSpacing(8)
|
||||||
opts.addWidget(QtWidgets.QLabel("Reasoning Effort"), 0, 0)
|
opts.addWidget(QtWidgets.QLabel("Reasoning Effort"), 0, 0)
|
||||||
self.effort = QtWidgets.QComboBox()
|
self.effort = QtWidgets.QComboBox()
|
||||||
self.effort.addItems(["low", "medium", "high", "none"]) # default medium
|
self.effort.addItems(["minimal", "low", "medium", "high"]) # default medium
|
||||||
self.effort.setCurrentText("medium")
|
self.effort.setCurrentText("medium")
|
||||||
self.effort.setSizeAdjustPolicy(QtWidgets.QComboBox.AdjustToContents)
|
self.effort.setSizeAdjustPolicy(QtWidgets.QComboBox.AdjustToContents)
|
||||||
self.effort.setMinimumContentsLength(7)
|
self.effort.setMinimumContentsLength(7)
|
||||||
|
|||||||
Reference in New Issue
Block a user