feat(config): default reasoning effort to max (#36)
parent
4eebf78351
commit
3ed8da6307
|
|
@ -20,7 +20,7 @@ DEFAULT_PORT = 9000
|
||||||
DEFAULT_UPSTREAM_BASE_URL = "https://api.deepseek.com"
|
DEFAULT_UPSTREAM_BASE_URL = "https://api.deepseek.com"
|
||||||
DEFAULT_UPSTREAM_MODEL = "deepseek-v4-pro"
|
DEFAULT_UPSTREAM_MODEL = "deepseek-v4-pro"
|
||||||
DEFAULT_THINKING = "enabled"
|
DEFAULT_THINKING = "enabled"
|
||||||
DEFAULT_REASONING_EFFORT = "high"
|
DEFAULT_REASONING_EFFORT = "max"
|
||||||
DEFAULT_DISPLAY_REASONING = True
|
DEFAULT_DISPLAY_REASONING = True
|
||||||
DEFAULT_COLLAPSIBLE_REASONING = True
|
DEFAULT_COLLAPSIBLE_REASONING = True
|
||||||
DEFAULT_NGROK = True
|
DEFAULT_NGROK = True
|
||||||
|
|
|
||||||
|
|
@ -861,7 +861,7 @@ def build_arg_parser() -> argparse.ArgumentParser:
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--reasoning-effort",
|
"--reasoning-effort",
|
||||||
choices=["low", "medium", "high", "max", "xhigh"],
|
choices=["low", "medium", "high", "max", "xhigh"],
|
||||||
help="DeepSeek reasoning effort, default from config or high",
|
help="DeepSeek reasoning effort, default from config or max",
|
||||||
)
|
)
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--reasoning-content-path",
|
"--reasoning-content-path",
|
||||||
|
|
@ -997,8 +997,9 @@ def log_cursor_request(
|
||||||
) -> None:
|
) -> None:
|
||||||
model = str(payload.get("model") or config.upstream_model)
|
model = str(payload.get("model") or config.upstream_model)
|
||||||
LOG.info(
|
LOG.info(
|
||||||
"┌ cursor model=%s messages=%s tools=%s",
|
"┌ cursor model=%s effort=%s messages=%s tools=%s",
|
||||||
model,
|
model,
|
||||||
|
config.reasoning_effort,
|
||||||
format_count(message_count(payload)),
|
format_count(message_count(payload)),
|
||||||
format_count(tool_count(payload)),
|
format_count(tool_count(payload)),
|
||||||
)
|
)
|
||||||
|
|
@ -1332,7 +1333,7 @@ def main(argv: list[str] | None = None) -> int:
|
||||||
store.close()
|
store.close()
|
||||||
return 2
|
return 2
|
||||||
LOG.info("ngrok tunnel forwarding %s -> %s", public_url, target_url)
|
LOG.info("ngrok tunnel forwarding %s -> %s", public_url, target_url)
|
||||||
LOG.info("Cursor Base URL: %s/v1", public_url.rstrip("/"))
|
LOG.info("api base url: %s/v1", public_url.rstrip("/"))
|
||||||
try:
|
try:
|
||||||
server.serve_forever()
|
server.serve_forever()
|
||||||
except KeyboardInterrupt:
|
except KeyboardInterrupt:
|
||||||
|
|
|
||||||
|
|
@ -795,7 +795,7 @@ def prepare_upstream_request(
|
||||||
thinking_disabled = config.thinking == "disabled"
|
thinking_disabled = config.thinking == "disabled"
|
||||||
if thinking_enabled:
|
if thinking_enabled:
|
||||||
prepared["reasoning_effort"] = normalize_reasoning_effort(
|
prepared["reasoning_effort"] = normalize_reasoning_effort(
|
||||||
prepared.get("reasoning_effort") or config.reasoning_effort
|
config.reasoning_effort
|
||||||
)
|
)
|
||||||
|
|
||||||
cache_namespace = reasoning_cache_namespace(
|
cache_namespace = reasoning_cache_namespace(
|
||||||
|
|
|
||||||
|
|
@ -35,7 +35,7 @@ def _default_cache_namespace() -> str:
|
||||||
ProxyConfig(),
|
ProxyConfig(),
|
||||||
"deepseek-v4-pro",
|
"deepseek-v4-pro",
|
||||||
{"type": "enabled"},
|
{"type": "enabled"},
|
||||||
"high",
|
"max",
|
||||||
)
|
)
|
||||||
|
|
||||||
|
|
||||||
|
|
@ -366,14 +366,14 @@ class CrossModeAndModelTests(unittest.TestCase):
|
||||||
config,
|
config,
|
||||||
"deepseek-v4-pro",
|
"deepseek-v4-pro",
|
||||||
{"type": "enabled"},
|
{"type": "enabled"},
|
||||||
"high",
|
"max",
|
||||||
"Bearer key-a",
|
"Bearer key-a",
|
||||||
)
|
)
|
||||||
namespace_flash = reasoning_cache_namespace(
|
namespace_flash = reasoning_cache_namespace(
|
||||||
config,
|
config,
|
||||||
"deepseek-v4-flash",
|
"deepseek-v4-flash",
|
||||||
{"type": "enabled"},
|
{"type": "enabled"},
|
||||||
"high",
|
"max",
|
||||||
"Bearer key-a",
|
"Bearer key-a",
|
||||||
)
|
)
|
||||||
self.assertEqual(namespace_pro, namespace_flash)
|
self.assertEqual(namespace_pro, namespace_flash)
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue