mirror of
https://github.com/langbot-app/LangBot.git
synced 2026-06-02 03:55:55 +00:00
* feat(provider): add rerank model management as a core model type * feat(provider): add rerank support to existing requesters and new rerank providers * feat(web): add rerank model management UI and pipeline config * fix(provider): correct rerank support_type after verification - Add rerank to OpenRouter (confirmed /api/v1/rerank endpoint) - Remove rerank from Ollama (no native support, PR #7219 unmerged) - Remove rerank from JiekouAI (no rerank docs found, URL path mismatch) * fix(provider): remove alru_cache from model getters and add rerank param hints * fix: resolve lint errors - Remove unused alru_cache import from modelmgr.py - Remove unused error_message variable in invoke_rerank - Fix prettier formatting in frontend files Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com> * fix: remove unused exception variable - Change `except Exception as e:` to `except Exception:` since e is not used - Fix prettier formatting in ProviderCard.tsx Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com> * fix: apply ruff format Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com> * feat(template): add rerank config fields to default pipeline config Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com> * chore: remove PR.md Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com> * fix(ui): remove duplicate rerank model form in AddModelPopover The form was being rendered twice: once in TabsContent manual mode and again in a separate conditional block for rerank tab. Co-Authored-By: Claude Opus 4.7 <noreply@anthropic.com> --------- Co-authored-by: Claude Opus 4.7 <noreply@anthropic.com>
57 lines
2.9 KiB
Python
57 lines
2.9 KiB
Python
import quart
|
|
|
|
from ... import group
|
|
|
|
|
|
@group.group_class('models/providers', '/api/v1/provider/providers')
|
|
class ModelProvidersRouterGroup(group.RouterGroup):
|
|
async def initialize(self) -> None:
|
|
@self.route('', methods=['GET', 'POST'], auth_type=group.AuthType.USER_TOKEN_OR_API_KEY)
|
|
async def _() -> str:
|
|
if quart.request.method == 'GET':
|
|
providers = await self.ap.provider_service.get_providers()
|
|
# Add model counts
|
|
for provider in providers:
|
|
counts = await self.ap.provider_service.get_provider_model_counts(provider['uuid'])
|
|
provider['llm_count'] = counts['llm_count']
|
|
provider['embedding_count'] = counts['embedding_count']
|
|
provider['rerank_count'] = counts['rerank_count']
|
|
return self.success(data={'providers': providers})
|
|
elif quart.request.method == 'POST':
|
|
json_data = await quart.request.json
|
|
provider_uuid = await self.ap.provider_service.create_provider(json_data)
|
|
return self.success(data={'uuid': provider_uuid})
|
|
|
|
@self.route(
|
|
'/<provider_uuid>', methods=['GET', 'PUT', 'DELETE'], auth_type=group.AuthType.USER_TOKEN_OR_API_KEY
|
|
)
|
|
async def _(provider_uuid: str) -> str:
|
|
if quart.request.method == 'GET':
|
|
provider = await self.ap.provider_service.get_provider(provider_uuid)
|
|
if provider is None:
|
|
return self.http_status(404, -1, 'provider not found')
|
|
counts = await self.ap.provider_service.get_provider_model_counts(provider_uuid)
|
|
provider['llm_count'] = counts['llm_count']
|
|
provider['embedding_count'] = counts['embedding_count']
|
|
provider['rerank_count'] = counts['rerank_count']
|
|
return self.success(data={'provider': provider})
|
|
elif quart.request.method == 'PUT':
|
|
json_data = await quart.request.json
|
|
await self.ap.provider_service.update_provider(provider_uuid, json_data)
|
|
return self.success()
|
|
elif quart.request.method == 'DELETE':
|
|
try:
|
|
await self.ap.provider_service.delete_provider(provider_uuid)
|
|
return self.success()
|
|
except ValueError as e:
|
|
return self.http_status(400, -1, str(e))
|
|
|
|
@self.route('/<provider_uuid>/scan-models', methods=['GET'], auth_type=group.AuthType.USER_TOKEN_OR_API_KEY)
|
|
async def _(provider_uuid: str) -> str:
|
|
try:
|
|
model_type = quart.request.args.get('type')
|
|
result = await self.ap.provider_service.scan_provider_models(provider_uuid, model_type)
|
|
return self.success(data=result)
|
|
except ValueError as e:
|
|
return self.http_status(400, -1, str(e))
|