2024-08-15 09:17:36 +08:00
#
# Copyright 2024 The InfiniFlow Authors. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
2024-09-03 19:49:14 +08:00
import binascii
2025-03-24 13:18:47 +08:00
import logging
2024-08-15 09:17:36 +08:00
import re
2025-03-24 13:18:47 +08:00
import time
2024-08-15 09:17:36 +08:00
from copy import deepcopy
2025-05-19 19:34:05 +08:00
from datetime import datetime
2025-03-24 13:18:47 +08:00
from functools import partial
2024-09-09 12:08:50 +08:00
from timeit import default_timer as timer
2025-08-19 17:25:44 +08:00
import trio
2025-03-24 13:18:47 +08:00
from langfuse import Langfuse
2025-08-06 10:33:52 +08:00
from peewee import fn
2025-02-26 15:40:52 +08:00
from agentic_reasoning import DeepResearcher
2025-11-05 08:01:39 +08:00
from common . constants import LLMType , ParserType , StatusEnum
2025-03-24 13:18:47 +08:00
from api . db . db_models import DB , Dialog
2024-08-15 09:17:36 +08:00
from api . db . services . common_service import CommonService
2025-08-12 14:12:56 +08:00
from api . db . services . document_service import DocumentService
2024-08-15 09:17:36 +08:00
from api . db . services . knowledgebase_service import KnowledgebaseService
2025-03-24 13:18:47 +08:00
from api . db . services . langfuse_service import TenantLangfuseService
2025-08-13 16:41:01 +08:00
from api . db . services . llm_service import LLMBundle
from api . db . services . tenant_llm_service import TenantLLMService
2025-10-28 19:09:14 +08:00
from common . time_utils import current_timestamp , datetime_format
2025-08-19 17:25:44 +08:00
from graphrag . general . mind_map_extractor import MindMapExtractor
2024-08-15 09:17:36 +08:00
from rag . app . resume import forbidden_select_fields4resume
2025-02-26 15:40:52 +08:00
from rag . app . tag import label_question
2024-08-15 09:17:36 +08:00
from rag . nlp . search import index_name
2025-09-23 10:19:25 +08:00
from rag . prompts . generator import chunks_format , citation_prompt , cross_languages , full_question , kb_prompt , keyword_extraction , message_fit_in , \
gen_meta_filter , PROMPT_JINJA_ENV , ASK_SUMMARY
2025-11-03 08:50:05 +08:00
from common . token_utils import num_tokens_from_string
2025-02-26 10:21:04 +08:00
from rag . utils . tavily_conn import Tavily
2025-10-28 09:46:32 +08:00
from common . string_utils import remove_redundant_spaces
2025-11-06 09:36:38 +08:00
from common import settings
2024-08-15 09:17:36 +08:00
class DialogService(CommonService):
    """Service layer for ``Dialog`` records (chat-assistant configurations)."""

    model = Dialog

    @classmethod
    def save(cls, **kwargs):
        """Insert a new dialog record.

        Forces an INSERT (never an UPDATE), so ``kwargs`` must contain a
        fresh primary key.

        Args:
            **kwargs: Field values for the new record.

        Returns:
            Whatever peewee's ``Model.save`` returns (the number of rows
            modified), NOT the model instance.
        """
        sample_obj = cls.model(**kwargs).save(force_insert=True)
        return sample_obj

    @classmethod
    def update_many_by_id(cls, data_list):
        """Update multiple dialog rows atomically, one UPDATE per entry.

        Refreshes ``update_time``/``update_date`` on every entry before
        writing. NOTE: the dicts in ``data_list`` are mutated in place.

        Args:
            data_list (list): Dicts of field values; each must contain ``id``.
        """
        with DB.atomic():
            for data in data_list:
                data["update_time"] = current_timestamp()
                data["update_date"] = datetime_format(datetime.now())
                cls.model.update(data).where(cls.model.id == data["id"]).execute()

    @classmethod
    @DB.connection_context()
    def get_list(cls, tenant_id, page_number, items_per_page, orderby, desc, id, name):
        """Page through a tenant's VALID dialogs, optionally filtered by id/name.

        Returns:
            list[dict]: One page of dialog rows.
        """
        chats = cls.model.select()
        if id:
            chats = chats.where(cls.model.id == id)
        if name:
            chats = chats.where(cls.model.name == name)
        chats = chats.where((cls.model.tenant_id == tenant_id) & (cls.model.status == StatusEnum.VALID.value))
        if desc:
            chats = chats.order_by(cls.model.getter_by(orderby).desc())
        else:
            chats = chats.order_by(cls.model.getter_by(orderby).asc())
        chats = chats.paginate(page_number, items_per_page)
        return list(chats.dicts())

    @classmethod
    @DB.connection_context()
    def get_by_tenant_ids(cls, joined_tenant_ids, user_id, page_number, items_per_page, orderby, desc, keywords, parser_id=None):
        """List VALID dialogs visible to *user_id* across its joined tenants.

        Args:
            joined_tenant_ids: Tenant ids the user has joined.
            user_id: The user's own tenant id.
            page_number / items_per_page: Pagination; when either is falsy the
                full result set is returned.
            orderby / desc: Sort column name and direction.
            keywords: Case-insensitive substring filter on the dialog name.
            parser_id: Optional parser filter.

        Returns:
            tuple[list[dict], int]: Rows (including owner nickname and avatar
            aliased as ``tenant_avatar``) and the total matching count.
        """
        from api.db.db_models import User

        fields = [
            cls.model.id,
            cls.model.tenant_id,
            cls.model.name,
            cls.model.description,
            cls.model.language,
            cls.model.llm_id,
            cls.model.llm_setting,
            cls.model.prompt_type,
            cls.model.prompt_config,
            cls.model.similarity_threshold,
            cls.model.vector_similarity_weight,
            cls.model.top_n,
            cls.model.top_k,
            cls.model.do_refer,
            cls.model.rerank_id,
            cls.model.kb_ids,
            cls.model.icon,
            cls.model.status,
            User.nickname,
            User.avatar.alias("tenant_avatar"),
            cls.model.update_time,
            cls.model.create_time,
        ]
        # Build the common visibility filter once; layer the optional keyword
        # filter on top instead of duplicating the whole query expression.
        dialogs = (
            cls.model.select(*fields)
            .join(User, on=(cls.model.tenant_id == User.id))
            .where(
                (cls.model.tenant_id.in_(joined_tenant_ids) | (cls.model.tenant_id == user_id)) & (cls.model.status == StatusEnum.VALID.value),
            )
        )
        if keywords:
            dialogs = dialogs.where(fn.LOWER(cls.model.name).contains(keywords.lower()))
        if parser_id:
            dialogs = dialogs.where(cls.model.parser_id == parser_id)
        if desc:
            dialogs = dialogs.order_by(cls.model.getter_by(orderby).desc())
        else:
            dialogs = dialogs.order_by(cls.model.getter_by(orderby).asc())

        count = dialogs.count()
        if page_number and items_per_page:
            dialogs = dialogs.paginate(page_number, items_per_page)
        return list(dialogs.dicts()), count

    @classmethod
    @DB.connection_context()
    def get_all_dialogs_by_tenant_id(cls, tenant_id):
        """Fetch the ids of ALL dialogs owned by *tenant_id*, in batches of 100.

        Returns:
            list[dict]: ``{"id": ...}`` rows ordered by creation time.
        """
        fields = [cls.model.id]
        dialogs = cls.model.select(*fields).where(cls.model.tenant_id == tenant_id)
        # BUGFIX: peewee queries are immutable — the previous code discarded
        # the result of order_by(), so rows came back in unspecified order.
        dialogs = dialogs.order_by(cls.model.create_time.asc())
        offset, limit = 0, 100
        res = []
        while True:
            d_batch = dialogs.offset(offset).limit(limit)
            _temp = list(d_batch.dicts())
            if not _temp:
                break
            res.extend(_temp)
            offset += limit
        return res
2025-08-06 10:33:52 +08:00
2025-02-21 12:24:02 +08:00
def chat_solo(dialog, messages, stream=True):
    """Chat directly with the LLM — no retrieval, no references.

    Generator. Yields dicts of the form
    ``{"answer", "reference", "audio_binary", "prompt", "created_at"}``;
    ``reference`` is always empty here since no knowledge base is consulted.

    Args:
        dialog: Dialog configuration row (tenant_id, llm_id, prompt_config,
            llm_setting).
        messages: Chat history; "system" entries are dropped and the dialog's
            own configured system prompt is used instead.
        stream: When True, yield incremental partial answers.
    """
    # Vision-capable models are bound through the IMAGE2TEXT type.
    if TenantLLMService.llm_id2llm_type(dialog.llm_id) == "image2text":
        chat_mdl = LLMBundle(dialog.tenant_id, LLMType.IMAGE2TEXT, dialog.llm_id)
    else:
        chat_mdl = LLMBundle(dialog.tenant_id, LLMType.CHAT, dialog.llm_id)

    prompt_config = dialog.prompt_config
    tts_mdl = None
    if prompt_config.get("tts"):
        tts_mdl = LLMBundle(dialog.tenant_id, LLMType.TTS)
    # Strip stale citation markers (##n$$) from the history before sending.
    msg = [{"role": m["role"], "content": re.sub(r"##\d+\$\$", "", m["content"])} for m in messages if m["role"] != "system"]
    if stream:
        last_ans = ""
        delta_ans = ""
        for ans in chat_mdl.chat_streamly(prompt_config.get("system", ""), msg, dialog.llm_setting):
            # The stream yields cumulative text; emit only once the pending
            # delta is at least ~16 tokens to avoid chatty tiny updates.
            answer = ans
            delta_ans = ans[len(last_ans):]
            if num_tokens_from_string(delta_ans) < 16:
                continue
            last_ans = answer
            yield {"answer": answer, "reference": {}, "audio_binary": tts(tts_mdl, delta_ans), "prompt": "", "created_at": time.time()}
            delta_ans = ""
        # Flush whatever remained below the 16-token threshold.
        if delta_ans:
            yield {"answer": answer, "reference": {}, "audio_binary": tts(tts_mdl, delta_ans), "prompt": "", "created_at": time.time()}
    else:
        answer = chat_mdl.chat(prompt_config.get("system", ""), msg, dialog.llm_setting)
        user_content = msg[-1].get("content", "[content not available]")
        logging.debug("User: {}|Assistant: {}".format(user_content, answer))
        yield {"answer": answer, "reference": {}, "audio_binary": tts(tts_mdl, answer), "prompt": "", "created_at": time.time()}
2025-06-05 13:00:43 +08:00
def get_models(dialog):
    """Resolve every model bundle this dialog needs.

    Returns:
        tuple: ``(kbs, embd_mdl, rerank_mdl, chat_mdl, tts_mdl)`` — any model
        that is not configured for the dialog is ``None``.

    Raises:
        Exception: when the linked knowledge bases disagree on the embedding model.
        LookupError: when the shared embedding model cannot be loaded.
    """
    embd_mdl = rerank_mdl = tts_mdl = None

    kbs = KnowledgebaseService.get_by_ids(dialog.kb_ids)
    embedding_ids = list({kb.embd_id for kb in kbs})
    if len(embedding_ids) > 1:
        raise Exception("**ERROR**: Knowledge bases use different embedding models.")
    if embedding_ids:
        embd_mdl = LLMBundle(dialog.tenant_id, LLMType.EMBEDDING, embedding_ids[0])
        if not embd_mdl:
            raise LookupError("Embedding model(%s) not found" % embedding_ids[0])

    # Vision-capable chat models are bound through the IMAGE2TEXT type.
    if TenantLLMService.llm_id2llm_type(dialog.llm_id) == "image2text":
        chat_type = LLMType.IMAGE2TEXT
    else:
        chat_type = LLMType.CHAT
    chat_mdl = LLMBundle(dialog.tenant_id, chat_type, dialog.llm_id)

    if dialog.rerank_id:
        rerank_mdl = LLMBundle(dialog.tenant_id, LLMType.RERANK, dialog.rerank_id)
    if dialog.prompt_config.get("tts"):
        tts_mdl = LLMBundle(dialog.tenant_id, LLMType.TTS)
    return kbs, embd_mdl, rerank_mdl, chat_mdl, tts_mdl
2025-05-29 10:03:51 +08:00
# Malformed citation markers occasionally emitted by LLMs, each capturing the
# referenced chunk index as group 1.
BAD_CITATION_PATTERNS = [
    re.compile(r"\(\s*ID\s*[: ]*\s*(\d+)\s*\)"),  # (ID: 12)
    re.compile(r"\[\s*ID\s*[: ]*\s*(\d+)\s*\]"),  # [ID: 12]
    re.compile(r"【\s*ID\s*[: ]*\s*(\d+)\s*】"),  # 【ID: 12】
    re.compile(r"ref\s*(\d+)", flags=re.IGNORECASE),  # ref12、REF 12
]


def repair_bad_citation_formats(answer: str, kbinfos: dict, idx: set):
    """Normalize malformed citation markers in *answer* to canonical ``[ID:n]``.

    Every marker matching one of ``BAD_CITATION_PATTERNS`` whose index refers
    to an existing chunk in ``kbinfos["chunks"]`` is rewritten and its index
    added to *idx* (mutated in place). Out-of-range markers are left verbatim.

    Returns:
        tuple: the repaired answer string and the updated index set.
    """
    chunk_count = len(kbinfos["chunks"])

    def _rewrite(match):
        # Rewrite one marker; keep it untouched on any failure or when the
        # referenced chunk does not exist.
        try:
            chunk_i = int(match.group(1))
        except Exception:
            return match.group(0)
        if 0 <= chunk_i < chunk_count:
            idx.add(chunk_i)
            return f"[ID:{chunk_i}]"
        return match.group(0)

    for pattern in BAD_CITATION_PATTERNS:
        answer = pattern.sub(_rewrite, answer)
    return answer, idx
2025-05-29 10:03:51 +08:00
2025-09-05 19:26:15 +08:00
def convert_conditions(metadata_condition):
    """Translate UI metadata-condition dicts into retriever filter dicts.

    The comparison operators ``"is"``/``"not is"`` are mapped onto ``"="``/
    ``"≠"``; any other operator string passes through unchanged. ``None``
    input yields an empty filter list.

    Returns:
        list[dict]: filters shaped ``{"op", "key", "value"}``.
    """
    if metadata_condition is None:
        metadata_condition = {}

    translated = []
    for cond in metadata_condition.get("conditions", []):
        operator = cond["comparison_operator"]
        if operator == "is":
            operator = "="
        elif operator == "not is":
            operator = "≠"
        translated.append({"op": operator, "key": cond["name"], "value": cond["value"]})
    return translated
2025-09-05 19:26:15 +08:00
2025-08-12 14:12:56 +08:00
def meta_filter(metas: dict, filters: list[dict]):
    """Return doc ids whose metadata satisfies ALL filters (set intersection).

    Args:
        metas: Mapping of metadata key -> {metadata value -> [doc_id, ...]}.
        filters: Conditions shaped ``{"key", "op", "value"}`` (see
            ``convert_conditions`` for the operator vocabulary).

    Returns:
        list: Doc ids matching every applicable filter; empty as soon as the
        intersection becomes empty. Filters whose key never appears in
        *metas* are ignored.
    """
    doc_ids = set([])

    def _match(operator, doc_value, filter_value):
        # Evaluate ONE metadata value against ONE condition.
        # For relational operators, compare numerically when both sides parse
        # as floats, otherwise compare their string forms.
        # BUGFIX: each value is normalized independently — previously the
        # float-converted filter value leaked into later iterations, so a
        # non-numeric entry was compared against e.g. "2.0" instead of "2".
        if operator in ("=", "≠", ">", "<", "≥", "≤"):
            try:
                left, right = float(doc_value), float(filter_value)
            except (TypeError, ValueError):
                left, right = str(doc_value), str(filter_value)
        else:
            left, right = doc_value, filter_value
        # BUGFIX: evaluate only the selected operator's predicate, inside the
        # try — previously every comparison was evaluated eagerly outside the
        # try, so a non-string metadata key crashed even for "contains".
        try:
            if operator == "contains":
                return str(right).lower() in str(left).lower()
            if operator == "not contains":
                return str(right).lower() not in str(left).lower()
            if operator == "start with":
                return str(left).lower().startswith(str(right).lower())
            if operator == "end with":
                return str(left).lower().endswith(str(right).lower())
            if operator == "empty":
                return not left
            if operator == "not empty":
                return bool(left)
            if operator == "=":
                return left == right
            if operator == "≠":
                return left != right
            if operator == ">":
                return left > right
            if operator == "<":
                return left < right
            if operator == "≥":
                return left >= right
            if operator == "≤":
                return left <= right
        except Exception:
            # Incomparable types count as "no match" instead of crashing.
            return False
        return False  # unknown operator matches nothing

    def filter_out(v2docs, operator, value):
        # Collect doc ids of every metadata value satisfying the condition.
        ids = []
        for doc_value, docids in v2docs.items():
            if _match(operator, doc_value, value):
                ids.extend(docids)
        return ids

    for k, v2docs in metas.items():
        for f in filters:
            if k != f["key"]:
                continue
            ids = filter_out(v2docs, f["op"], f["value"])
            if not doc_ids:
                doc_ids = set(ids)
            else:
                doc_ids = doc_ids & set(ids)
            if not doc_ids:
                return []
    return list(doc_ids)
2025-08-12 14:12:56 +08:00
2024-08-15 09:17:36 +08:00
def chat(dialog, messages, stream=True, **kwargs):
    """Answer the latest user message with retrieval-augmented generation.

    Generator. Yields dicts shaped ``{"answer", "reference", ...}``:
    intermediate partial answers while streaming, then one final answer
    decorated with citations, references and timing diagnostics.

    Args:
        dialog: Dialog configuration row (kb_ids, llm_id, prompt_config,
            llm_setting, similarity/rerank settings, meta_data_filter, ...).
        messages: Chat history; the last entry must have role "user".
        stream: When True, yield incremental partial answers.
        **kwargs: Prompt variables declared in ``prompt_config["parameters"]``
            plus optional "doc_ids" (comma-separated), "toolcall_session",
            "tools" and "quote".
    """
    assert messages[-1]["role"] == "user", "The last content of this conversation is not from user."

    # No knowledge base and no web search configured: plain LLM chat.
    if not dialog.kb_ids and not dialog.prompt_config.get("tavily_api_key"):
        for ans in chat_solo(dialog, messages, stream):
            yield ans
        return None

    chat_start_ts = timer()

    # Resolve the model config to learn the context window size (default 8192).
    if TenantLLMService.llm_id2llm_type(dialog.llm_id) == "image2text":
        llm_model_config = TenantLLMService.get_model_config(dialog.tenant_id, LLMType.IMAGE2TEXT, dialog.llm_id)
    else:
        llm_model_config = TenantLLMService.get_model_config(dialog.tenant_id, LLMType.CHAT, dialog.llm_id)
    max_tokens = llm_model_config.get("max_tokens", 8192)

    check_llm_ts = timer()

    # Optional Langfuse tracing — only enabled when the tenant's keys validate.
    langfuse_tracer = None
    trace_context = {}
    langfuse_keys = TenantLangfuseService.filter_by_tenant(tenant_id=dialog.tenant_id)
    if langfuse_keys:
        langfuse = Langfuse(public_key=langfuse_keys.public_key, secret_key=langfuse_keys.secret_key, host=langfuse_keys.host)
        if langfuse.auth_check():
            langfuse_tracer = langfuse
            trace_id = langfuse_tracer.create_trace_id()
            trace_context = {"trace_id": trace_id}

    check_langfuse_tracer_ts = timer()

    kbs, embd_mdl, rerank_mdl, chat_mdl, tts_mdl = get_models(dialog)
    toolcall_session, tools = kwargs.get("toolcall_session"), kwargs.get("tools")
    if toolcall_session and tools:
        chat_mdl.bind_tools(toolcall_session, tools)
    bind_models_ts = timer()

    retriever = settings.retriever

    # Use at most the last 3 user turns as the retrieval query basis.
    questions = [m["content"] for m in messages if m["role"] == "user"][-3:]
    attachments = kwargs["doc_ids"].split(",") if "doc_ids" in kwargs else []
    if "doc_ids" in messages[-1]:
        attachments = messages[-1]["doc_ids"]

    prompt_config = dialog.prompt_config
    field_map = KnowledgebaseService.get_field_map(dialog.kb_ids)
    # try to use sql if field mapping is good to go
    if field_map:
        logging.debug("Use SQL to retrieval:{}".format(questions[-1]))
        ans = use_sql(questions[-1], field_map, dialog.tenant_id, chat_mdl, prompt_config.get("quote", True), dialog.kb_ids)
        if ans:
            yield ans
            return None

    # Validate prompt variables; blank out optional ones that were not supplied.
    for p in prompt_config["parameters"]:
        if p["key"] == "knowledge":
            continue
        if p["key"] not in kwargs and not p["optional"]:
            raise KeyError("Miss parameter: " + p["key"])
        if p["key"] not in kwargs:
            prompt_config["system"] = prompt_config["system"].replace("{%s}" % p["key"], " ")

    # Multi-turn refinement: condense the history into one standalone question.
    if len(questions) > 1 and prompt_config.get("refine_multiturn"):
        questions = [full_question(dialog.tenant_id, dialog.llm_id, messages)]
    else:
        questions = questions[-1:]

    if prompt_config.get("cross_languages"):
        questions = [cross_languages(dialog.tenant_id, dialog.llm_id, questions[0], prompt_config["cross_languages"])]

    # Metadata filtering narrows retrieval to matching doc ids; an empty match
    # sets attachments to None, which skips retrieval entirely below.
    if dialog.meta_data_filter:
        metas = DocumentService.get_meta_by_kbs(dialog.kb_ids)
        if dialog.meta_data_filter.get("method") == "auto":
            filters = gen_meta_filter(chat_mdl, metas, questions[-1])
            attachments.extend(meta_filter(metas, filters))
            if not attachments:
                attachments = None
        elif dialog.meta_data_filter.get("method") == "manual":
            attachments.extend(meta_filter(metas, dialog.meta_data_filter["manual"]))
            if not attachments:
                attachments = None

    if prompt_config.get("keyword", False):
        questions[-1] += keyword_extraction(chat_mdl, questions[-1])

    refine_question_ts = timer()

    thought = ""
    kbinfos = {"total": 0, "chunks": [], "doc_aggs": []}
    knowledges = []

    if attachments is not None and "knowledge" in [p["key"] for p in prompt_config["parameters"]]:
        tenant_ids = list(set([kb.tenant_id for kb in kbs]))
        knowledges = []
        if prompt_config.get("reasoning", False):
            # Deep-research mode: the reasoner drives retrieval itself and
            # streams its intermediate "thinking" steps to the client.
            reasoner = DeepResearcher(
                chat_mdl,
                prompt_config,
                partial(
                    retriever.retrieval,
                    embd_mdl=embd_mdl,
                    tenant_ids=tenant_ids,
                    kb_ids=dialog.kb_ids,
                    page=1,
                    page_size=dialog.top_n,
                    similarity_threshold=0.2,
                    vector_similarity_weight=0.3,
                    doc_ids=attachments,
                ),
            )

            for think in reasoner.thinking(kbinfos, " ".join(questions)):
                if isinstance(think, str):
                    # Final thought: its non-empty lines become the knowledge.
                    thought = think
                    knowledges = [t for t in think.split("\n") if t]
                elif stream:
                    yield think
        else:
            # Standard retrieval path: vector search, then optional TOC
            # enhancement, Tavily web search and knowledge-graph results.
            if embd_mdl:
                kbinfos = retriever.retrieval(
                    " ".join(questions),
                    embd_mdl,
                    tenant_ids,
                    dialog.kb_ids,
                    1,
                    dialog.top_n,
                    dialog.similarity_threshold,
                    dialog.vector_similarity_weight,
                    doc_ids=attachments,
                    top=dialog.top_k,
                    aggs=False,
                    rerank_mdl=rerank_mdl,
                    rank_feature=label_question(" ".join(questions), kbs),
                )
                if prompt_config.get("toc_enhance"):
                    cks = retriever.retrieval_by_toc(" ".join(questions), kbinfos["chunks"], tenant_ids, chat_mdl, dialog.top_n)
                    if cks:
                        cks = cks if isinstance(cks, list) else cks
                        kbinfos["chunks"] = cks
            if prompt_config.get("tavily_api_key"):
                tav = Tavily(prompt_config["tavily_api_key"])
                tav_res = tav.retrieve_chunks(" ".join(questions))
                kbinfos["chunks"].extend(tav_res["chunks"])
                kbinfos["doc_aggs"].extend(tav_res["doc_aggs"])
            if prompt_config.get("use_kg"):
                ck = settings.kg_retriever.retrieval(" ".join(questions), tenant_ids, dialog.kb_ids, embd_mdl,
                                                     LLMBundle(dialog.tenant_id, LLMType.CHAT))
                if ck["content_with_weight"]:
                    # Knowledge-graph context is prepended so it ranks first.
                    kbinfos["chunks"].insert(0, ck)
            knowledges = kb_prompt(kbinfos, max_tokens)

    logging.debug("{}->{}".format(" ".join(questions), "\n->".join(knowledges)))

    retrieval_ts = timer()
    if not knowledges and prompt_config.get("empty_response"):
        # Nothing retrieved: reply with the configured canned response.
        empty_res = prompt_config["empty_response"]
        yield {"answer": empty_res, "reference": kbinfos, "prompt": "\n\n### Query:\n%s" % " ".join(questions),
               "audio_binary": tts(tts_mdl, empty_res)}
        return {"answer": prompt_config["empty_response"], "reference": kbinfos}

    kwargs["knowledge"] = "\n------\n" + "\n\n------\n\n".join(knowledges)
    gen_conf = dialog.llm_setting

    msg = [{"role": "system", "content": prompt_config["system"].format(**kwargs)}]
    prompt4citation = ""
    if knowledges and (prompt_config.get("quote", True) and kwargs.get("quote", True)):
        prompt4citation = citation_prompt()
    # Strip any stale citation markers (##n$$) from the history.
    msg.extend([{"role": m["role"], "content": re.sub(r"##\d+\$\$", "", m["content"])} for m in messages if m["role"] != "system"])
    used_token_count, msg = message_fit_in(msg, int(max_tokens * 0.95))
    assert len(msg) >= 2, f"message_fit_in has bug: {msg}"
    prompt = msg[0]["content"]

    if "max_tokens" in gen_conf:
        # Leave room in the context window for what the prompt already uses.
        gen_conf["max_tokens"] = min(gen_conf["max_tokens"], max_tokens - used_token_count)

    def decorate_answer(answer):
        """Attach citations, references and timing diagnostics to the final answer."""
        nonlocal embd_mdl, prompt_config, knowledges, kwargs, kbinfos, prompt, retrieval_ts, questions, langfuse_tracer

        refs = []
        # Split off a leading <think>...</think> reasoning section, if any.
        ans = answer.split("</think>")
        think = ""
        if len(ans) == 2:
            think = ans[0] + "</think>"
            answer = ans[1]

        if knowledges and (prompt_config.get("quote", True) and kwargs.get("quote", True)):
            idx = set([])
            # If the LLM emitted no [ID:n] markers itself, infer citations by
            # similarity; otherwise collect the chunk indices it referenced.
            if embd_mdl and not re.search(r"\[ID:([0-9]+)\]", answer):
                answer, idx = retriever.insert_citations(
                    answer,
                    [ck["content_ltks"] for ck in kbinfos["chunks"]],
                    [ck["vector"] for ck in kbinfos["chunks"]],
                    embd_mdl,
                    tkweight=1 - dialog.vector_similarity_weight,
                    vtweight=dialog.vector_similarity_weight,
                )
            else:
                for match in re.finditer(r"\[ID:([0-9]+)\]", answer):
                    i = int(match.group(1))
                    if i < len(kbinfos["chunks"]):
                        idx.add(i)

            # Normalize malformed citation markers like (ID: 3) or ref3.
            answer, idx = repair_bad_citation_formats(answer, kbinfos, idx)

            # Keep only the documents actually cited; fall back to all of them.
            idx = set([kbinfos["chunks"][int(i)]["doc_id"] for i in idx])
            recall_docs = [d for d in kbinfos["doc_aggs"] if d["doc_id"] in idx]
            if not recall_docs:
                recall_docs = kbinfos["doc_aggs"]
            kbinfos["doc_aggs"] = recall_docs
            refs = deepcopy(kbinfos)
            for c in refs["chunks"]:
                if c.get("vector"):
                    del c["vector"]

        if answer.lower().find("invalid key") >= 0 or answer.lower().find("invalid api") >= 0:
            answer += " Please set LLM API-Key in 'User Setting -> Model providers -> API-Key'"
        finish_chat_ts = timer()

        # Per-stage wall-clock costs in milliseconds, appended to the prompt
        # for diagnostics display.
        total_time_cost = (finish_chat_ts - chat_start_ts) * 1000
        check_llm_time_cost = (check_llm_ts - chat_start_ts) * 1000
        check_langfuse_tracer_cost = (check_langfuse_tracer_ts - check_llm_ts) * 1000
        bind_embedding_time_cost = (bind_models_ts - check_langfuse_tracer_ts) * 1000
        refine_question_time_cost = (refine_question_ts - bind_models_ts) * 1000
        retrieval_time_cost = (retrieval_ts - refine_question_ts) * 1000
        generate_result_time_cost = (finish_chat_ts - retrieval_ts) * 1000

        tk_num = num_tokens_from_string(think + answer)
        prompt += "\n\n### Query:\n%s" % " ".join(questions)
        prompt = (
            f"{prompt}\n\n"
            "## Time elapsed:\n"
            f"  - Total: {total_time_cost:.1f}ms\n"
            f"  - Check LLM: {check_llm_time_cost:.1f}ms\n"
            f"  - Check Langfuse tracer: {check_langfuse_tracer_cost:.1f}ms\n"
            f"  - Bind models: {bind_embedding_time_cost:.1f}ms\n"
            f"  - Query refinement(LLM): {refine_question_time_cost:.1f}ms\n"
            f"  - Retrieval: {retrieval_time_cost:.1f}ms\n"
            f"  - Generate answer: {generate_result_time_cost:.1f}ms\n\n"
            "## Token usage:\n"
            f"  - Generated tokens(approximately): {tk_num}\n"
            f"  - Token speed: {int(tk_num / (generate_result_time_cost / 1000.0))}/s"
        )

        # Close the Langfuse generation only when tracing is active AND the
        # generation was actually started below (checked via locals()).
        if langfuse_tracer and "langfuse_generation" in locals():
            langfuse_output = "\n" + re.sub(r"^.*?(### Query:.*)", r"\1", prompt, flags=re.DOTALL)
            langfuse_output = {"time_elapsed:": re.sub(r"\n", "  \n", langfuse_output), "created_at": time.time()}
            langfuse_generation.update(output=langfuse_output)
            langfuse_generation.end()

        return {"answer": think + answer, "reference": refs, "prompt": re.sub(r"\n", "  \n", prompt), "created_at": time.time()}

    if langfuse_tracer:
        langfuse_generation = langfuse_tracer.start_generation(
            trace_context=trace_context, name="chat", model=llm_model_config["llm_name"],
            input={"prompt": prompt, "prompt4citation": prompt4citation, "messages": msg}
        )

    if stream:
        last_ans = ""
        answer = ""
        for ans in chat_mdl.chat_streamly(prompt + prompt4citation, msg[1:], gen_conf):
            if thought:
                # The reasoner already streamed the thinking; drop it here.
                ans = re.sub(r"^.*</think>", "", ans, flags=re.DOTALL)
            answer = ans
            # The stream yields cumulative text; emit only once the pending
            # delta is at least ~16 tokens to avoid chatty tiny updates.
            delta_ans = ans[len(last_ans):]
            if num_tokens_from_string(delta_ans) < 16:
                continue
            last_ans = answer
            yield {"answer": thought + answer, "reference": {}, "audio_binary": tts(tts_mdl, delta_ans)}
        # Flush whatever remained below the 16-token threshold.
        delta_ans = answer[len(last_ans):]
        if delta_ans:
            yield {"answer": thought + answer, "reference": {}, "audio_binary": tts(tts_mdl, delta_ans)}
        yield decorate_answer(thought + answer)
    else:
        answer = chat_mdl.chat(prompt + prompt4citation, msg[1:], gen_conf)
        user_content = msg[-1].get("content", "[content not available]")
        logging.debug("User: {}|Assistant: {}".format(user_content, answer))
        res = decorate_answer(answer)
        res["audio_binary"] = tts(tts_mdl, answer)
        yield res

    return None
2024-08-15 09:17:36 +08:00
2025-09-04 16:51:13 +08:00
def use_sql(question, field_map, tenant_id, chat_mdl, quota=True, kb_ids=None):
    """Answer a question by generating and executing SQL over the tenant's table index.

    Asks the chat model to write SQL for `question` against the fields in
    `field_map`, executes it through the retriever, retries once on a database
    error, and renders the result as a Markdown table with per-row citation
    markers.

    Args:
        question: Natural-language question to translate into SQL.
        field_map: Mapping of column name -> human-readable field description.
        tenant_id: Tenant whose index (``index_name(tenant_id)``) is queried.
        chat_mdl: Chat LLM used to generate (and repair) the SQL.
        quota: Kept for interface compatibility; currently has no effect
            (both historical branches produced identical output).
        kb_ids: Optional knowledge-base ids used to append a ``kb_id`` filter.

    Returns:
        A dict with ``answer`` (Markdown table), ``reference`` and ``prompt``
        keys, or None when no valid SQL / no rows could be produced.
    """
    sys_prompt = """
You are a Database Administrator. You need to check the fields of the following tables based on the user's list of questions and write the SQL corresponding to the last question.
Ensure that:
1. Field names should not start with a digit. If any field name starts with a digit, use double quotes around it.
2. Write only the SQL, no explanations or additional text.
"""
    user_prompt = """
Table name: {};
Table of database fields are as follows:
{}

Question are as follows:
{}
Please write the SQL, only SQL, without any other explanations or text.
""".format(index_name(tenant_id), "\n".join([f"{k}: {v}" for k, v in field_map.items()]), question)
    tried_times = 0

    def get_table():
        # Generates SQL via the LLM, normalizes it, forces citation-friendly
        # columns (doc_id, docnm_kwd), applies the kb filter, and executes it.
        nonlocal sys_prompt, user_prompt, question, tried_times
        sql = chat_mdl.chat(sys_prompt, [{"role": "user", "content": user_prompt}], {"temperature": 0.06})
        # Strip any chain-of-thought block emitted by reasoning models.
        sql = re.sub(r"^.*</think>", "", sql, flags=re.DOTALL)
        logging.debug(f"{question} ==> {user_prompt} get SQL: {sql}")
        sql = re.sub(r"[\r\n]+", " ", sql.lower())
        sql = re.sub(r".*select ", "select ", sql.lower())
        sql = re.sub(r" +", " ", sql)
        # Drop everything after a terminator (ASCII/fullwidth semicolon or a code fence).
        sql = re.sub(r"([;；]|```).*", "", sql)
        sql = re.sub(r"&", "and", sql)
        if sql[: len("select ")] != "select ":
            return None, None
        if not re.search(r"((sum|avg|max|min)\(|group by )", sql.lower()):
            if sql[: len("select *")] != "select *":
                # Prepend citation columns so rows can be traced back to documents.
                sql = "select doc_id,docnm_kwd," + sql[6:]
            else:
                # Expand "select *" into an explicit, bounded column list.
                flds = []
                for k in field_map.keys():
                    if k in forbidden_select_fields4resume:
                        continue
                    if len(flds) > 11:
                        break
                    flds.append(k)
                sql = "select doc_id,docnm_kwd," + ",".join(flds) + sql[8:]
        if kb_ids:
            # NOTE(review): kb_ids are interpolated directly into the SQL string;
            # they come from internal services, but confirm they can never carry
            # user-controlled content before trusting this concatenation.
            kb_filter = "(" + " OR ".join([f"kb_id='{kb_id}'" for kb_id in kb_ids]) + ")"
            if "where" not in sql.lower():
                sql += f" WHERE {kb_filter}"
            else:
                sql += f" AND {kb_filter}"
        logging.debug(f"{question} get SQL(refined): {sql}")
        tried_times += 1
        return settings.retriever.sql_retrieval(sql, format="json"), sql

    tbl, sql = get_table()
    if tbl is None:
        return None
    if tbl.get("error") and tried_times <= 2:
        # One repair round: feed the failing SQL and the DB error back to the LLM.
        user_prompt = """
Table name: {};
Table of database fields are as follows:
{}

Question are as follows:
{}
Please write the SQL, only SQL, without any other explanations or text.


The SQL error you provided last time is as follows:
{}

Error issued by database as follows:
{}

Please correct the error and write SQL again, only SQL, without any other explanations or text.
""".format(index_name(tenant_id), "\n".join([f"{k}: {v}" for k, v in field_map.items()]), question, sql, tbl["error"])
        tbl, sql = get_table()
        # Fix: the retry can also yield (None, None); previously tbl.get() below
        # would raise AttributeError on None.
        if tbl is None:
            return None
        logging.debug("TRY it again: {}".format(sql))

    logging.debug("GET table: {}".format(tbl))
    if tbl.get("error") or len(tbl["rows"]) == 0:
        return None

    docid_idx = set([ii for ii, c in enumerate(tbl["columns"]) if c["name"] == "doc_id"])
    doc_name_idx = set([ii for ii, c in enumerate(tbl["columns"]) if c["name"] == "docnm_kwd"])
    column_idx = [ii for ii in range(len(tbl["columns"])) if ii not in (docid_idx | doc_name_idx)]

    # compose Markdown table
    # Fix: the header/separator conditions previously tested `docid_idx and docid_idx`
    # (a tautology on docid_idx); the "Source" column only makes sense when both
    # doc_id and docnm_kwd columns are present, matching the early return below.
    columns = (
        "|"
        + "|".join([re.sub(r"(/.*|（[^（）]+）)", "", field_map.get(tbl["columns"][i]["name"], tbl["columns"][i]["name"])) for i in column_idx])
        + ("|Source|" if docid_idx and doc_name_idx else "|")
    )

    line = "|" + "|".join(["------" for _ in range(len(column_idx))]) + ("|------|" if docid_idx and doc_name_idx else "")

    rows = ["|" + "|".join([remove_redundant_spaces(str(r[i])) for i in column_idx]).replace("None", " ") + "|" for r in tbl["rows"]]
    # Drop rows that are entirely blank after formatting.
    rows = [r for r in rows if re.sub(r"[ |]+", "", r)]
    # Fix: the former `if quota:` had two byte-identical branches, so the
    # conditional was dead; a single statement preserves behavior exactly.
    rows = "\n".join([r + f" ##{ii}$$ |" for ii, r in enumerate(rows)])
    # Strip time-of-day suffixes from ISO timestamps so cells show dates only.
    rows = re.sub(r"T[0-9]{2}:[0-9]{2}:[0-9]{2}(\.[0-9]+Z)?\|", "|", rows)

    if not docid_idx or not doc_name_idx:
        logging.warning("SQL missing field: " + sql)
        return {"answer": "\n".join([columns, line, rows]), "reference": {"chunks": [], "doc_aggs": []}, "prompt": sys_prompt}

    docid_idx = list(docid_idx)[0]
    doc_name_idx = list(doc_name_idx)[0]
    doc_aggs = {}
    for r in tbl["rows"]:
        if r[docid_idx] not in doc_aggs:
            doc_aggs[r[docid_idx]] = {"doc_name": r[doc_name_idx], "count": 0}
        doc_aggs[r[docid_idx]]["count"] += 1
    return {
        "answer": "\n".join([columns, line, rows]),
        "reference": {
            "chunks": [{"doc_id": r[docid_idx], "docnm_kwd": r[doc_name_idx]} for r in tbl["rows"]],
            "doc_aggs": [{"doc_id": did, "doc_name": d["doc_name"], "count": d["count"]} for did, d in doc_aggs.items()],
        },
        "prompt": sys_prompt,
    }
2024-09-03 19:49:14 +08:00
def tts(tts_mdl, text):
    """Synthesize `text` with `tts_mdl` and return the audio as a hex string.

    Args:
        tts_mdl: TTS model exposing ``tts(text)`` that yields audio byte chunks.
        text: Text to synthesize.

    Returns:
        Hex-encoded audio string, or None when no model is configured or the
        text is empty.
    """
    if not tts_mdl or not text:
        return None
    # b"".join avoids the quadratic bytes-+= pattern and no longer shadows
    # the builtin `bin`.
    audio = b"".join(chunk for chunk in tts_mdl.tts(text))
    return binascii.hexlify(audio).decode("utf-8")
2025-08-19 09:33:33 +08:00
def ask(question, kb_ids, tenant_id, chat_llm_name=None, search_config=None):
    """Stream an answer to `question` grounded in the given knowledge bases.

    Retrieves relevant chunks (optionally filtered by document metadata and
    re-ranked), streams the LLM answer, then yields one final message with
    citations inserted and references attached.

    Args:
        question: User question.
        kb_ids: Knowledge-base ids to search (may be overridden by
            ``search_config["kb_ids"]``).
        tenant_id: Tenant owning the models.
        chat_llm_name: Chat model name (overridden by ``search_config["chat_id"]``).
        search_config: Optional dict of retrieval settings (doc_ids, rerank_id,
            meta_data_filter, similarity_threshold, vector_similarity_weight,
            top_k, ...).

    Yields:
        Dicts of the form ``{"answer": ..., "reference": ...}``; the last one
        carries the citation-decorated answer and full references.
    """
    # Fix: avoid the mutable default argument ({}) shared across calls.
    if search_config is None:
        search_config = {}
    # Fix: copy so extending with meta-filter hits below does not mutate the
    # caller's search_config["doc_ids"] list in place.
    doc_ids = list(search_config.get("doc_ids", []))
    rerank_mdl = None
    kb_ids = search_config.get("kb_ids", kb_ids)
    chat_llm_name = search_config.get("chat_id", chat_llm_name)
    rerank_id = search_config.get("rerank_id", "")
    meta_data_filter = search_config.get("meta_data_filter")

    kbs = KnowledgebaseService.get_by_ids(kb_ids)
    # NOTE(review): assumes at least one KB exists; embedding_list[0] raises
    # IndexError otherwise — confirm callers validate kb_ids.
    embedding_list = list(set([kb.embd_id for kb in kbs]))

    # Use the knowledge-graph retriever only when every KB is KG-parsed.
    is_knowledge_graph = all([kb.parser_id == ParserType.KG for kb in kbs])
    retriever = settings.retriever if not is_knowledge_graph else settings.kg_retriever

    embd_mdl = LLMBundle(tenant_id, LLMType.EMBEDDING, embedding_list[0])
    chat_mdl = LLMBundle(tenant_id, LLMType.CHAT, chat_llm_name)
    if rerank_id:
        rerank_mdl = LLMBundle(tenant_id, LLMType.RERANK, rerank_id)
    max_tokens = chat_mdl.max_length
    tenant_ids = list(set([kb.tenant_id for kb in kbs]))

    if meta_data_filter:
        metas = DocumentService.get_meta_by_kbs(kb_ids)
        if meta_data_filter.get("method") == "auto":
            # LLM derives metadata filters from the question itself.
            filters = gen_meta_filter(chat_mdl, metas, question)
            doc_ids.extend(meta_filter(metas, filters))
            if not doc_ids:
                # None disables doc filtering entirely (vs. [] matching nothing).
                doc_ids = None
        elif meta_data_filter.get("method") == "manual":
            doc_ids.extend(meta_filter(metas, meta_data_filter["manual"]))
            if not doc_ids:
                doc_ids = None

    kbinfos = retriever.retrieval(
        question=question,
        embd_mdl=embd_mdl,
        tenant_ids=tenant_ids,
        kb_ids=kb_ids,
        page=1,
        page_size=12,
        similarity_threshold=search_config.get("similarity_threshold", 0.1),
        vector_similarity_weight=search_config.get("vector_similarity_weight", 0.3),
        top=search_config.get("top_k", 1024),
        doc_ids=doc_ids,
        aggs=False,
        rerank_mdl=rerank_mdl,
        rank_feature=label_question(question, kbs)
    )
    knowledges = kb_prompt(kbinfos, max_tokens)
    sys_prompt = PROMPT_JINJA_ENV.from_string(ASK_SUMMARY).render(knowledge="\n".join(knowledges))
    msg = [{"role": "user", "content": question}]

    def decorate_answer(answer):
        # Inserts citation markers and restricts doc_aggs to cited documents.
        nonlocal knowledges, kbinfos, sys_prompt
        answer, idx = retriever.insert_citations(answer, [ck["content_ltks"] for ck in kbinfos["chunks"]], [ck["vector"] for ck in kbinfos["chunks"]],
                                                 embd_mdl, tkweight=0.7, vtweight=0.3)
        idx = set([kbinfos["chunks"][int(i)]["doc_id"] for i in idx])
        recall_docs = [d for d in kbinfos["doc_aggs"] if d["doc_id"] in idx]
        if not recall_docs:
            recall_docs = kbinfos["doc_aggs"]
        kbinfos["doc_aggs"] = recall_docs
        refs = deepcopy(kbinfos)
        for c in refs["chunks"]:
            if c.get("vector"):
                # Vectors are large and useless to the client; strip them.
                del c["vector"]
        if answer.lower().find("invalid key") >= 0 or answer.lower().find("invalid api") >= 0:
            answer += " Please set LLM API-Key in 'User Setting -> Model Providers -> API-Key'"
        refs["chunks"] = chunks_format(refs)
        return {"answer": answer, "reference": refs}

    answer = ""
    for ans in chat_mdl.chat_streamly(sys_prompt, msg, {"temperature": 0.1}):
        answer = ans
        yield {"answer": answer, "reference": {}}
    yield decorate_answer(answer)
2025-08-19 17:25:44 +08:00
def gen_mindmap(question, kb_ids, tenant_id, search_config=None):
    """Build a mind map from chunks retrieved for `question` in the given KBs.

    Args:
        question: Topic/question driving retrieval.
        kb_ids: Knowledge-base ids to search.
        tenant_id: Tenant owning the models.
        search_config: Optional dict of retrieval settings (doc_ids, chat_id,
            rerank_id, meta_data_filter, similarity_threshold,
            vector_similarity_weight, top_k, ...).

    Returns:
        The mind-map extractor output, or ``{"error": "No KB selected"}`` when
        no knowledge base matches `kb_ids`.
    """
    # Fix: avoid the mutable default argument ({}) shared across calls.
    if search_config is None:
        search_config = {}
    meta_data_filter = search_config.get("meta_data_filter", {})
    # Fix: copy so the extend() calls below don't mutate the caller's list.
    doc_ids = list(search_config.get("doc_ids", []))
    rerank_id = search_config.get("rerank_id", "")
    rerank_mdl = None
    kbs = KnowledgebaseService.get_by_ids(kb_ids)
    if not kbs:
        return {"error": "No KB selected"}
    embedding_list = list(set([kb.embd_id for kb in kbs]))
    tenant_ids = list(set([kb.tenant_id for kb in kbs]))
    embd_mdl = LLMBundle(tenant_id, LLMType.EMBEDDING, llm_name=embedding_list[0])
    chat_mdl = LLMBundle(tenant_id, LLMType.CHAT, llm_name=search_config.get("chat_id", ""))
    if rerank_id:
        rerank_mdl = LLMBundle(tenant_id, LLMType.RERANK, rerank_id)
    if meta_data_filter:
        metas = DocumentService.get_meta_by_kbs(kb_ids)
        if meta_data_filter.get("method") == "auto":
            # LLM derives metadata filters from the question itself.
            filters = gen_meta_filter(chat_mdl, metas, question)
            doc_ids.extend(meta_filter(metas, filters))
            if not doc_ids:
                # None disables doc filtering entirely (vs. [] matching nothing).
                doc_ids = None
        elif meta_data_filter.get("method") == "manual":
            doc_ids.extend(meta_filter(metas, meta_data_filter["manual"]))
            if not doc_ids:
                doc_ids = None
    ranks = settings.retriever.retrieval(
        question=question,
        embd_mdl=embd_mdl,
        tenant_ids=tenant_ids,
        kb_ids=kb_ids,
        page=1,
        page_size=12,
        similarity_threshold=search_config.get("similarity_threshold", 0.2),
        vector_similarity_weight=search_config.get("vector_similarity_weight", 0.3),
        top=search_config.get("top_k", 1024),
        doc_ids=doc_ids,
        aggs=False,
        rerank_mdl=rerank_mdl,
        rank_feature=label_question(question, kbs),
    )
    mindmap = MindMapExtractor(chat_mdl)
    # MindMapExtractor is async; trio.run drives it to completion synchronously.
    mind_map = trio.run(mindmap, [c["content_with_weight"] for c in ranks["chunks"]])
    return mind_map.output