# -*- coding:utf-8 -*-
import json
import logging
from typing import Generator, Union

import flask_login
from flask import Response, stream_with_context
from core.login.login import login_required
from werkzeug.exceptions import InternalServerError, NotFound

import services
from controllers.console import api
from controllers.console.app import _get_app
from controllers.console.app.error import ConversationCompletedError, AppUnavailableError, \
    ProviderNotInitializeError, CompletionRequestError, ProviderQuotaExceededError, \
    ProviderModelCurrentlyNotSupportError
from controllers.console.setup import setup_required
from controllers.console.wraps import account_initialization_required
from core.conversation_message_task import PubHandler
from core.model_providers.error import LLMBadRequestError, LLMAPIUnavailableError, LLMAuthorizationError, LLMAPIConnectionError, \
    LLMRateLimitError, ProviderTokenNotInitError, QuotaExceededError, ModelCurrentlyNotSupportError
from libs.helper import uuid_value
from flask_restful import Resource, reqparse

from services.completion_service import CompletionService


def _invoke_completion(app_model, args) -> Response:
    """Run a console completion request and translate service errors.

    Shared by the completion and chat endpoints so both map service-layer
    exceptions to the same console HTTP errors.

    :param app_model: the app object returned by ``_get_app``.
    :param args: parsed request arguments; ``args['response_mode']`` selects
        blocking vs. streaming.
    :return: the Flask response built by ``compact_response``.
    :raises NotFound: the conversation does not exist.
    :raises ConversationCompletedError: the conversation is already completed.
    :raises AppUnavailableError: the app model config is broken.
    :raises ProviderNotInitializeError: the provider token is not initialised.
    :raises ProviderQuotaExceededError: the provider quota is exhausted.
    :raises ProviderModelCurrentlyNotSupportError: the model is unsupported.
    :raises CompletionRequestError: the LLM call itself failed.
    :raises ValueError: propagated unchanged from the service.
    :raises InternalServerError: any other unexpected failure.
    """
    # Anything other than an explicit 'blocking' is treated as streaming
    # (this includes a missing response_mode, whatever value the parser
    # stores for it).
    streaming = args['response_mode'] != 'blocking'
    account = flask_login.current_user

    try:
        response = CompletionService.completion(
            app_model=app_model,
            user=account,
            args=args,
            from_source='console',
            streaming=streaming,
            is_model_config_override=True
        )

        return compact_response(response)
    except services.errors.conversation.ConversationNotExistsError:
        raise NotFound("Conversation Not Exists.")
    except services.errors.conversation.ConversationCompletedError:
        raise ConversationCompletedError()
    except services.errors.app_model_config.AppModelConfigBrokenError:
        logging.exception("App model config broken.")
        raise AppUnavailableError()
    except ProviderTokenNotInitError as ex:
        raise ProviderNotInitializeError(ex.description)
    except QuotaExceededError:
        raise ProviderQuotaExceededError()
    except ModelCurrentlyNotSupportError:
        raise ProviderModelCurrentlyNotSupportError()
    except (LLMBadRequestError, LLMAPIConnectionError, LLMAPIUnavailableError,
            LLMRateLimitError, LLMAuthorizationError) as e:
        raise CompletionRequestError(str(e))
    except ValueError:
        # Let ValueError through untouched so the catch-all below does not
        # turn it into a 500.
        raise
    except Exception:
        logging.exception("internal server error.")
        raise InternalServerError()


# define completion message api for user
class CompletionMessageApi(Resource):
    """Console endpoint that runs a completion-mode app with an overridden model config."""

    @setup_required
    @login_required
    @account_initialization_required
    def post(self, app_id):
        """Parse the JSON body and run a completion for the app ``app_id``."""
        app_id = str(app_id)

        # get app info
        app_model = _get_app(app_id, 'completion')

        parser = reqparse.RequestParser()
        parser.add_argument('inputs', type=dict, required=True, location='json')
        parser.add_argument('query', type=str, location='json', default='')
        parser.add_argument('model_config', type=dict, required=True, location='json')
        parser.add_argument('response_mode', type=str, choices=['blocking', 'streaming'], location='json')
        parser.add_argument('retriever_from', type=str, required=False, default='dev', location='json')
        args = parser.parse_args()

        return _invoke_completion(app_model, args)


class CompletionMessageStopApi(Resource):
    """Console endpoint that stops a running completion task."""

    @setup_required
    @login_required
    @account_initialization_required
    def post(self, app_id, task_id):
        """Ask ``PubHandler`` to stop task ``task_id`` for the current user."""
        app_id = str(app_id)

        # get app info
        # (result unused; presumably called to validate the app - confirm in _get_app)
        _get_app(app_id, 'completion')

        account = flask_login.current_user

        PubHandler.stop(account, task_id)

        return {'result': 'success'}, 200


class ChatMessageApi(Resource):
    """Console endpoint that runs a chat-mode app with an overridden model config."""

    @setup_required
    @login_required
    @account_initialization_required
    def post(self, app_id):
        """Parse the JSON body and run a chat completion for the app ``app_id``."""
        app_id = str(app_id)

        # get app info
        app_model = _get_app(app_id, 'chat')

        parser = reqparse.RequestParser()
        parser.add_argument('inputs', type=dict, required=True, location='json')
        parser.add_argument('query', type=str, required=True, location='json')
        parser.add_argument('model_config', type=dict, required=True, location='json')
        parser.add_argument('conversation_id', type=uuid_value, location='json')
        parser.add_argument('response_mode', type=str, choices=['blocking', 'streaming'], location='json')
        parser.add_argument('retriever_from', type=str, required=False, default='dev', location='json')
        args = parser.parse_args()

        return _invoke_completion(app_model, args)


def _sse_error_event(error: Exception) -> str:
    """Render ``error`` as one ``data:`` event using the API's error handler."""
    return "data: " + json.dumps(api.handle_error(error).get_json()) + "\n\n"


def compact_response(response: Union[dict, Generator]) -> Response:
    """Wrap a completion result in a Flask response.

    :param response: a dict for a blocking result, otherwise an iterable of
        already-formatted stream chunks.
    :return: a JSON response for a dict, or a ``text/event-stream`` response
        that relays the chunks.

    Errors raised while iterating the stream cannot change the HTTP status
    any more (it is sent as 200 up front), so they are emitted as a final
    ``data:`` event carrying the same payload the API error handler would
    have produced.
    """
    if isinstance(response, dict):
        return Response(response=json.dumps(response), status=200, mimetype='application/json')

    def generate() -> Generator:
        try:
            for chunk in response:
                yield chunk
        except services.errors.conversation.ConversationNotExistsError:
            yield _sse_error_event(NotFound("Conversation Not Exists."))
        except services.errors.conversation.ConversationCompletedError:
            yield _sse_error_event(ConversationCompletedError())
        except services.errors.app_model_config.AppModelConfigBrokenError:
            logging.exception("App model config broken.")
            yield _sse_error_event(AppUnavailableError())
        except ProviderTokenNotInitError as ex:
            yield _sse_error_event(ProviderNotInitializeError(ex.description))
        except QuotaExceededError:
            yield _sse_error_event(ProviderQuotaExceededError())
        except ModelCurrentlyNotSupportError:
            yield _sse_error_event(ProviderModelCurrentlyNotSupportError())
        except (LLMBadRequestError, LLMAPIConnectionError, LLMAPIUnavailableError,
                LLMRateLimitError, LLMAuthorizationError) as e:
            yield _sse_error_event(CompletionRequestError(str(e)))
        except ValueError as e:
            yield _sse_error_event(e)
        except Exception:
            logging.exception("internal server error.")
            yield _sse_error_event(InternalServerError())

    return Response(stream_with_context(generate()), status=200,
                    mimetype='text/event-stream')


class ChatMessageStopApi(Resource):
    """Console endpoint that stops a running chat task."""

    @setup_required
    @login_required
    @account_initialization_required
    def post(self, app_id, task_id):
        """Ask ``PubHandler`` to stop task ``task_id`` for the current user."""
        app_id = str(app_id)

        # get app info
        # (result unused; presumably called to validate the app - confirm in _get_app)
        _get_app(app_id, 'chat')

        account = flask_login.current_user

        PubHandler.stop(account, task_id)

        return {'result': 'success'}, 200


api.add_resource(CompletionMessageApi, '/apps/<uuid:app_id>/completion-messages')
api.add_resource(CompletionMessageStopApi, '/apps/<uuid:app_id>/completion-messages/<string:task_id>/stop')
api.add_resource(ChatMessageApi, '/apps/<uuid:app_id>/chat-messages')
api.add_resource(ChatMessageStopApi, '/apps/<uuid:app_id>/chat-messages/<string:task_id>/stop')