| 
									
										
										
										
											2024-09-09 17:18:08 +08:00
										 |  |  |  | # | 
					
						
							|  |  |  |  | #  Copyright 2024 The InfiniFlow Authors. All Rights Reserved. | 
					
						
							|  |  |  |  | # | 
					
						
							|  |  |  |  | #  Licensed under the Apache License, Version 2.0 (the "License"); | 
					
						
							|  |  |  |  | #  you may not use this file except in compliance with the License. | 
					
						
							|  |  |  |  | #  You may obtain a copy of the License at | 
					
						
							|  |  |  |  | # | 
					
						
							|  |  |  |  | #      http://www.apache.org/licenses/LICENSE-2.0 | 
					
						
							|  |  |  |  | # | 
					
						
							|  |  |  |  | #  Unless required by applicable law or agreed to in writing, software | 
					
						
							|  |  |  |  | #  distributed under the License is distributed on an "AS IS" BASIS, | 
					
						
							|  |  |  |  | #  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | 
					
						
							|  |  |  |  | #  See the License for the specific language governing permissions and | 
					
						
							|  |  |  |  | #  limitations under the License. | 
					
						
							|  |  |  |  | # | 
					
						
							|  |  |  |  | import json | 
					
						
							|  |  |  |  | from uuid import uuid4 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | from flask import request, Response | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | from api.db import StatusEnum | 
					
						
							|  |  |  |  | from api.db.services.dialog_service import DialogService, ConversationService, chat | 
					
						
							| 
									
										
										
										
											2024-09-11 12:03:55 +08:00
										 |  |  |  | from api.settings import RetCode | 
					
						
							| 
									
										
										
										
											2024-09-09 17:18:08 +08:00
										 |  |  |  | from api.utils import get_uuid | 
					
						
							|  |  |  |  | from api.utils.api_utils import get_data_error_result | 
					
						
							|  |  |  |  | from api.utils.api_utils import get_json_result, token_required | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | @manager.route('/save', methods=['POST']) | 
					
						
							|  |  |  |  | @token_required | 
					
						
							|  |  |  |  | def set_conversation(tenant_id): | 
					
						
							|  |  |  |  |     req = request.json | 
					
						
							|  |  |  |  |     conv_id = req.get("id") | 
					
						
							|  |  |  |  |     if "assistant_id" in req: | 
					
						
							|  |  |  |  |         req["dialog_id"] = req.pop("assistant_id") | 
					
						
							|  |  |  |  |     if "id" in req: | 
					
						
							|  |  |  |  |         del req["id"] | 
					
						
							|  |  |  |  |         conv = ConversationService.query(id=conv_id) | 
					
						
							|  |  |  |  |         if not conv: | 
					
						
							|  |  |  |  |             return get_data_error_result(retmsg="Session does not exist") | 
					
						
							|  |  |  |  |         if not DialogService.query(id=conv[0].dialog_id, tenant_id=tenant_id, status=StatusEnum.VALID.value): | 
					
						
							|  |  |  |  |             return get_data_error_result(retmsg="You do not own the session") | 
					
						
							|  |  |  |  |         if req.get("dialog_id"): | 
					
						
							|  |  |  |  |             dia = DialogService.query(tenant_id=tenant_id, id=req["dialog_id"], status=StatusEnum.VALID.value) | 
					
						
							|  |  |  |  |             if not dia: | 
					
						
							|  |  |  |  |                 return get_data_error_result(retmsg="You do not own the assistant") | 
					
						
							|  |  |  |  |         if "dialog_id" in req and not req.get("dialog_id"): | 
					
						
							|  |  |  |  |             return get_data_error_result(retmsg="assistant_id can not be empty.") | 
					
						
							| 
									
										
										
										
											2024-09-11 12:03:55 +08:00
										 |  |  |  |         if "message" in req: | 
					
						
							|  |  |  |  |             return get_data_error_result(retmsg="message can not be change") | 
					
						
							|  |  |  |  |         if "reference" in req: | 
					
						
							|  |  |  |  |             return get_data_error_result(retmsg="reference can not be change") | 
					
						
							| 
									
										
										
										
											2024-09-09 17:18:08 +08:00
										 |  |  |  |         if "name" in req and not req.get("name"): | 
					
						
							|  |  |  |  |             return get_data_error_result(retmsg="name can not be empty.") | 
					
						
							|  |  |  |  |         if not ConversationService.update_by_id(conv_id, req): | 
					
						
							|  |  |  |  |             return get_data_error_result(retmsg="Session updates error") | 
					
						
							|  |  |  |  |         return get_json_result(data=True) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     if not req.get("dialog_id"): | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="assistant_id is required.") | 
					
						
							|  |  |  |  |     dia = DialogService.query(tenant_id=tenant_id, id=req["dialog_id"], status=StatusEnum.VALID.value) | 
					
						
							|  |  |  |  |     if not dia: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="You do not own the assistant") | 
					
						
							|  |  |  |  |     conv = { | 
					
						
							|  |  |  |  |         "id": get_uuid(), | 
					
						
							|  |  |  |  |         "dialog_id": req["dialog_id"], | 
					
						
							|  |  |  |  |         "name": req.get("name", "New session"), | 
					
						
							| 
									
										
										
										
											2024-09-11 12:03:55 +08:00
										 |  |  |  |         "message": [{"role": "assistant", "content": "Hi! I am your assistant,can I help you?"}] | 
					
						
							| 
									
										
										
										
											2024-09-09 17:18:08 +08:00
										 |  |  |  |     } | 
					
						
							|  |  |  |  |     if not conv.get("name"): | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="name can not be empty.") | 
					
						
							|  |  |  |  |     ConversationService.save(**conv) | 
					
						
							|  |  |  |  |     e, conv = ConversationService.get_by_id(conv["id"]) | 
					
						
							|  |  |  |  |     if not e: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="Fail to new session!") | 
					
						
							|  |  |  |  |     conv = conv.to_dict() | 
					
						
							| 
									
										
										
										
											2024-09-11 12:03:55 +08:00
										 |  |  |  |     conv['messages'] = conv.pop("message") | 
					
						
							| 
									
										
										
										
											2024-09-09 17:18:08 +08:00
										 |  |  |  |     conv["assistant_id"] = conv.pop("dialog_id") | 
					
						
							|  |  |  |  |     del conv["reference"] | 
					
						
							|  |  |  |  |     return get_json_result(data=conv) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | @manager.route('/completion', methods=['POST']) | 
					
						
							|  |  |  |  | @token_required | 
					
						
							|  |  |  |  | def completion(tenant_id): | 
					
						
							|  |  |  |  |     req = request.json | 
					
						
							|  |  |  |  |     # req = {"conversation_id": "9aaaca4c11d311efa461fa163e197198", "messages": [ | 
					
						
							|  |  |  |  |     #    {"role": "user", "content": "上海有吗?"} | 
					
						
							|  |  |  |  |     # ]} | 
					
						
							| 
									
										
										
										
											2024-09-11 12:03:55 +08:00
										 |  |  |  |     if "id" not in req: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="id is required") | 
					
						
							|  |  |  |  |     conv = ConversationService.query(id=req["id"]) | 
					
						
							|  |  |  |  |     if not conv: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="Session does not exist") | 
					
						
							|  |  |  |  |     conv = conv[0] | 
					
						
							|  |  |  |  |     if not DialogService.query(id=conv.dialog_id, tenant_id=tenant_id, status=StatusEnum.VALID.value): | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="You do not own the session") | 
					
						
							| 
									
										
										
										
											2024-09-09 17:18:08 +08:00
										 |  |  |  |     msg = [] | 
					
						
							|  |  |  |  |     question = { | 
					
						
							|  |  |  |  |         "content": req.get("question"), | 
					
						
							|  |  |  |  |         "role": "user", | 
					
						
							|  |  |  |  |         "id": str(uuid4()) | 
					
						
							|  |  |  |  |     } | 
					
						
							| 
									
										
										
										
											2024-09-11 12:03:55 +08:00
										 |  |  |  |     conv.message.append(question) | 
					
						
							|  |  |  |  |     for m in conv.message: | 
					
						
							| 
									
										
										
										
											2024-09-09 17:18:08 +08:00
										 |  |  |  |         if m["role"] == "system": continue | 
					
						
							|  |  |  |  |         if m["role"] == "assistant" and not msg: continue | 
					
						
							|  |  |  |  |         msg.append(m) | 
					
						
							|  |  |  |  |     message_id = msg[-1].get("id") | 
					
						
							|  |  |  |  |     e, dia = DialogService.get_by_id(conv.dialog_id) | 
					
						
							|  |  |  |  |     del req["id"] | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     if not conv.reference: | 
					
						
							|  |  |  |  |         conv.reference = [] | 
					
						
							|  |  |  |  |     conv.message.append({"role": "assistant", "content": "", "id": message_id}) | 
					
						
							|  |  |  |  |     conv.reference.append({"chunks": [], "doc_aggs": []}) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     def fillin_conv(ans): | 
					
						
							|  |  |  |  |         nonlocal conv, message_id | 
					
						
							|  |  |  |  |         if not conv.reference: | 
					
						
							|  |  |  |  |             conv.reference.append(ans["reference"]) | 
					
						
							|  |  |  |  |         else: | 
					
						
							|  |  |  |  |             conv.reference[-1] = ans["reference"] | 
					
						
							|  |  |  |  |         conv.message[-1] = {"role": "assistant", "content": ans["answer"], | 
					
						
							|  |  |  |  |                             "id": message_id, "prompt": ans.get("prompt", "")} | 
					
						
							|  |  |  |  |         ans["id"] = message_id | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     def stream(): | 
					
						
							|  |  |  |  |         nonlocal dia, msg, req, conv | 
					
						
							|  |  |  |  |         try: | 
					
						
							|  |  |  |  |             for ans in chat(dia, msg, **req): | 
					
						
							|  |  |  |  |                 fillin_conv(ans) | 
					
						
							|  |  |  |  |                 yield "data:" + json.dumps({"retcode": 0, "retmsg": "", "data": ans}, ensure_ascii=False) + "\n\n" | 
					
						
							|  |  |  |  |             ConversationService.update_by_id(conv.id, conv.to_dict()) | 
					
						
							|  |  |  |  |         except Exception as e: | 
					
						
							|  |  |  |  |             yield "data:" + json.dumps({"retcode": 500, "retmsg": str(e), | 
					
						
							|  |  |  |  |                                         "data": {"answer": "**ERROR**: " + str(e), "reference": []}}, | 
					
						
							|  |  |  |  |                                        ensure_ascii=False) + "\n\n" | 
					
						
							|  |  |  |  |         yield "data:" + json.dumps({"retcode": 0, "retmsg": "", "data": True}, ensure_ascii=False) + "\n\n" | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     if req.get("stream", True): | 
					
						
							|  |  |  |  |         resp = Response(stream(), mimetype="text/event-stream") | 
					
						
							|  |  |  |  |         resp.headers.add_header("Cache-control", "no-cache") | 
					
						
							|  |  |  |  |         resp.headers.add_header("Connection", "keep-alive") | 
					
						
							|  |  |  |  |         resp.headers.add_header("X-Accel-Buffering", "no") | 
					
						
							|  |  |  |  |         resp.headers.add_header("Content-Type", "text/event-stream; charset=utf-8") | 
					
						
							|  |  |  |  |         return resp | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  |     else: | 
					
						
							|  |  |  |  |         answer = None | 
					
						
							|  |  |  |  |         for ans in chat(dia, msg, **req): | 
					
						
							|  |  |  |  |             answer = ans | 
					
						
							|  |  |  |  |             fillin_conv(ans) | 
					
						
							|  |  |  |  |             ConversationService.update_by_id(conv.id, conv.to_dict()) | 
					
						
							|  |  |  |  |             break | 
					
						
							|  |  |  |  |         return get_json_result(data=answer) | 
					
						
							| 
									
										
										
										
											2024-09-11 12:03:55 +08:00
										 |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | @manager.route('/get', methods=['GET']) | 
					
						
							|  |  |  |  | @token_required | 
					
						
							|  |  |  |  | def get(tenant_id): | 
					
						
							|  |  |  |  |     req = request.args | 
					
						
							|  |  |  |  |     if "id" not in req: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="id is required") | 
					
						
							|  |  |  |  |     conv_id = req["id"] | 
					
						
							|  |  |  |  |     conv = ConversationService.query(id=conv_id) | 
					
						
							|  |  |  |  |     if not conv: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="Session does not exist") | 
					
						
							|  |  |  |  |     if not DialogService.query(id=conv[0].dialog_id, tenant_id=tenant_id, status=StatusEnum.VALID.value): | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="You do not own the session") | 
					
						
							|  |  |  |  |     conv = conv[0].to_dict() | 
					
						
							|  |  |  |  |     conv['messages'] = conv.pop("message") | 
					
						
							|  |  |  |  |     conv["assistant_id"] = conv.pop("dialog_id") | 
					
						
							|  |  |  |  |     if conv["reference"]: | 
					
						
							|  |  |  |  |         messages = conv["messages"] | 
					
						
							|  |  |  |  |         message_num = 0 | 
					
						
							|  |  |  |  |         chunk_num = 0 | 
					
						
							|  |  |  |  |         while message_num < len(messages): | 
					
						
							|  |  |  |  |             if message_num != 0 and messages[message_num]["role"] != "user": | 
					
						
							|  |  |  |  |                 chunk_list = [] | 
					
						
							|  |  |  |  |                 if "chunks" in conv["reference"][chunk_num]: | 
					
						
							|  |  |  |  |                     chunks = conv["reference"][chunk_num]["chunks"] | 
					
						
							|  |  |  |  |                     for chunk in chunks: | 
					
						
							|  |  |  |  |                         new_chunk = { | 
					
						
							|  |  |  |  |                             "id": chunk["chunk_id"], | 
					
						
							|  |  |  |  |                             "content": chunk["content_with_weight"], | 
					
						
							|  |  |  |  |                             "document_id": chunk["doc_id"], | 
					
						
							|  |  |  |  |                             "document_name": chunk["docnm_kwd"], | 
					
						
							|  |  |  |  |                             "knowledgebase_id": chunk["kb_id"], | 
					
						
							|  |  |  |  |                             "image_id": chunk["img_id"], | 
					
						
							|  |  |  |  |                             "similarity": chunk["similarity"], | 
					
						
							|  |  |  |  |                             "vector_similarity": chunk["vector_similarity"], | 
					
						
							|  |  |  |  |                             "term_similarity": chunk["term_similarity"], | 
					
						
							|  |  |  |  |                             "positions": chunk["positions"], | 
					
						
							|  |  |  |  |                         } | 
					
						
							|  |  |  |  |                         chunk_list.append(new_chunk) | 
					
						
							|  |  |  |  |                 chunk_num += 1 | 
					
						
							|  |  |  |  |                 messages[message_num]["reference"] = chunk_list | 
					
						
							|  |  |  |  |             message_num += 1 | 
					
						
							|  |  |  |  |     del conv["reference"] | 
					
						
							|  |  |  |  |     return get_json_result(data=conv) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | @manager.route('/list', methods=["GET"]) | 
					
						
							|  |  |  |  | @token_required | 
					
						
							|  |  |  |  | def list(tenant_id): | 
					
						
							|  |  |  |  |     assistant_id = request.args["assistant_id"] | 
					
						
							|  |  |  |  |     if not DialogService.query(tenant_id=tenant_id, id=assistant_id, status=StatusEnum.VALID.value): | 
					
						
							|  |  |  |  |         return get_json_result( | 
					
						
							|  |  |  |  |             data=False, retmsg=f'Only owner of the assistant is authorized for this operation.', | 
					
						
							|  |  |  |  |             retcode=RetCode.OPERATING_ERROR) | 
					
						
							|  |  |  |  |     convs = ConversationService.query( | 
					
						
							|  |  |  |  |         dialog_id=assistant_id, | 
					
						
							|  |  |  |  |         order_by=ConversationService.model.create_time, | 
					
						
							|  |  |  |  |         reverse=True) | 
					
						
							|  |  |  |  |     convs = [d.to_dict() for d in convs] | 
					
						
							|  |  |  |  |     for conv in convs: | 
					
						
							|  |  |  |  |         conv['messages'] = conv.pop("message") | 
					
						
							|  |  |  |  |         conv["assistant_id"] = conv.pop("dialog_id") | 
					
						
							|  |  |  |  |         if conv["reference"]: | 
					
						
							|  |  |  |  |             messages = conv["messages"] | 
					
						
							|  |  |  |  |             message_num = 0 | 
					
						
							|  |  |  |  |             chunk_num = 0 | 
					
						
							|  |  |  |  |             while message_num < len(messages): | 
					
						
							|  |  |  |  |                 if message_num != 0 and messages[message_num]["role"] != "user": | 
					
						
							|  |  |  |  |                     chunk_list = [] | 
					
						
							|  |  |  |  |                     if "chunks" in conv["reference"][chunk_num]: | 
					
						
							|  |  |  |  |                         chunks = conv["reference"][chunk_num]["chunks"] | 
					
						
							|  |  |  |  |                         for chunk in chunks: | 
					
						
							|  |  |  |  |                             new_chunk = { | 
					
						
							|  |  |  |  |                                 "id": chunk["chunk_id"], | 
					
						
							|  |  |  |  |                                 "content": chunk["content_with_weight"], | 
					
						
							|  |  |  |  |                                 "document_id": chunk["doc_id"], | 
					
						
							|  |  |  |  |                                 "document_name": chunk["docnm_kwd"], | 
					
						
							|  |  |  |  |                                 "knowledgebase_id": chunk["kb_id"], | 
					
						
							|  |  |  |  |                                 "image_id": chunk["img_id"], | 
					
						
							|  |  |  |  |                                 "similarity": chunk["similarity"], | 
					
						
							|  |  |  |  |                                 "vector_similarity": chunk["vector_similarity"], | 
					
						
							|  |  |  |  |                                 "term_similarity": chunk["term_similarity"], | 
					
						
							|  |  |  |  |                                 "positions": chunk["positions"], | 
					
						
							|  |  |  |  |                             } | 
					
						
							|  |  |  |  |                             chunk_list.append(new_chunk) | 
					
						
							|  |  |  |  |                     chunk_num += 1 | 
					
						
							|  |  |  |  |                     messages[message_num]["reference"] = chunk_list | 
					
						
							|  |  |  |  |                 message_num += 1 | 
					
						
							|  |  |  |  |         del conv["reference"] | 
					
						
							|  |  |  |  |     return get_json_result(data=convs) | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | 
 | 
					
						
							|  |  |  |  | @manager.route('/delete', methods=["DELETE"]) | 
					
						
							|  |  |  |  | @token_required | 
					
						
							|  |  |  |  | def delete(tenant_id): | 
					
						
							|  |  |  |  |     id = request.args.get("id") | 
					
						
							|  |  |  |  |     if not id: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="`id` is required in deleting operation") | 
					
						
							|  |  |  |  |     conv = ConversationService.query(id=id) | 
					
						
							|  |  |  |  |     if not conv: | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="Session doesn't exist") | 
					
						
							|  |  |  |  |     conv = conv[0] | 
					
						
							|  |  |  |  |     if not DialogService.query(id=conv.dialog_id, tenant_id=tenant_id, status=StatusEnum.VALID.value): | 
					
						
							|  |  |  |  |         return get_data_error_result(retmsg="You don't own the session") | 
					
						
							|  |  |  |  |     ConversationService.delete_by_id(id) | 
					
						
							|  |  |  |  |     return get_json_result(data=True) |