mirror of
https://github.com/1Panel-dev/MaxKB.git
synced 2025-12-27 20:42:52 +00:00
73 lines
3.5 KiB
Python
73 lines
3.5 KiB
Python
# coding=utf-8
|
|
from typing import Dict
|
|
|
|
from django.utils.translation import gettext_lazy as _, gettext
|
|
from langchain_core.messages import HumanMessage
|
|
|
|
from common import forms
|
|
from common.exception.app_exception import AppApiException
|
|
from common.forms import BaseForm, TooltipLabel
|
|
from models_provider.base_model_provider import BaseModelCredential, ValidCode
|
|
from common.utils.logger import maxkb_logger
|
|
|
|
class VLLMModelParams(BaseForm):
    """Form describing the tunable generation parameters of a vLLM model.

    Two slider fields are declared: ``temperature`` and ``max_tokens``.
    """

    # Sampling temperature: slider over [0.1, 1.0] in 0.01 steps, default 0.7.
    temperature = forms.SliderField(
        TooltipLabel(
            _('Temperature'),
            _('Higher values make the output more random, while lower values make it more focused and deterministic'),
        ),
        required=True,
        default_value=0.7,
        _min=0.1,
        _max=1.0,
        _step=0.01,
        precision=2,
    )

    # Generation length cap: integer slider over [1, 100000], default 800.
    max_tokens = forms.SliderField(
        TooltipLabel(
            _('Output the maximum Tokens'),
            _('Specify the maximum number of tokens that the model can generate'),
        ),
        required=True,
        default_value=800,
        _min=1,
        _max=100000,
        _step=1,
        precision=0,
    )
|
|
|
|
|
|
class VLLMModelCredential(BaseForm, BaseModelCredential):
    """Credential form and validator for a model served through vLLM.

    Declares the ``api_base`` / ``api_key`` input fields and implements the
    validation, encryption and parameter-form hooks used for this provider.
    """

    def is_valid(self, model_type: str, model_name, model_credential: Dict[str, object], model_params, provider,
                 raise_exception=False):
        """Validate the credential by querying the endpoint and sending a test prompt.

        Steps, in order:
          1. ``model_type`` must match the ``'value'`` of an entry returned by
             ``provider.get_model_type_list()``.
          2. ``provider.get_base_model_list`` must succeed for the given
             ``api_base`` / ``api_key``.
          3. ``provider.get_model_info_by_name`` must find ``model_name`` in
             that list.
          4. A model built via ``provider.get_model`` must answer a single
             ``'Hello'`` human message without raising.

        :param model_type: model type identifier to validate.
        :param model_name: name of the model expected on the endpoint.
        :param model_credential: mapping read for ``'api_base'`` and ``'api_key'``.
        :param model_params: extra keyword arguments forwarded to ``provider.get_model``.
        :param provider: provider object supplying the lookup/build helpers above.
        :param raise_exception: accepted for interface compatibility; this
            implementation does not consult it and raises on every failure.
        :return: ``True`` when every step succeeds.
        :raises AppApiException: with ``ValidCode.valid_error`` when any step fails.
        """
        model_type_list = provider.get_model_type_list()
        # Test the predicate itself rather than the truthiness of the matched entries.
        if not any(mt.get('value') == model_type for mt in model_type_list):
            raise AppApiException(ValidCode.valid_error.value,
                                  gettext('{model_type} Model type is not supported').format(model_type=model_type))

        try:
            model_list = provider.get_base_model_list(model_credential.get('api_base'), model_credential.get('api_key'))
        except Exception as e:
            # Chain the original error so the root cause stays visible in tracebacks.
            raise AppApiException(ValidCode.valid_error.value, gettext('API domain name is invalid')) from e

        exist = provider.get_model_info_by_name(model_list, model_name)
        # Truthiness check covers an empty result as well as None.
        if not exist:
            raise AppApiException(ValidCode.valid_error.value,
                                  gettext('The model does not exist, please download the model first'))

        model = provider.get_model(model_type, model_name, model_credential, **model_params)
        try:
            # Only success/failure of the call matters; the reply is discarded.
            model.invoke([HumanMessage(content=gettext('Hello'))])
        except Exception as e:
            maxkb_logger.error(f'Exception: {e}', exc_info=True)
            raise AppApiException(ValidCode.valid_error.value,
                                  gettext(
                                      'Verification failed, please check whether the parameters are correct: {error}').format(
                                      error=str(e))) from e
        return True

    def encryption_dict(self, model_info: Dict[str, object]):
        """Return a copy of ``model_info`` whose ``'api_key'`` is passed through ``encryption``.

        A missing ``'api_key'`` is treated as an empty string.
        """
        return {**model_info, 'api_key': super().encryption(model_info.get('api_key', ''))}

    def build_model(self, model_info: Dict[str, object]):
        """Check required keys in ``model_info``, store the API key and return ``self``.

        :raises AppApiException: code 500 when ``'api_key'`` or ``'model'`` is absent.
        """
        # NOTE(review): 'model' is required but never stored, and 'api_base' is
        # neither checked nor stored here - confirm this is intentional.
        for key in ['api_key', 'model']:
            if key not in model_info:
                raise AppApiException(500, gettext('{key} is required').format(key=key))
        self.api_key = model_info.get('api_key')
        return self

    # Form inputs for the credential (both required).
    api_base = forms.TextInputField('API URL', required=True)
    api_key = forms.PasswordInputField('API Key', required=True)

    def get_model_params_setting_form(self, model_name):
        """Return a fresh ``VLLMModelParams`` form; ``model_name`` is not used."""
        return VLLMModelParams()
|