Small UI and REST API fixes (#1223)

* small fixes

* change default question
Malte Pietsch 2021-06-24 09:53:08 +02:00 committed by GitHub
parent 17dcb8c23e
commit 2caeea000e
3 changed files with 39 additions and 14 deletions


@@ -20,6 +20,9 @@ router = APIRouter()
 class Request(BaseModel):
     query: str
     filters: Optional[Dict[str, Optional[Union[str, List[str]]]]] = None
+    top_k_retriever: Optional[int] = None
+    top_k_reader: Optional[int] = None
 class Answer(BaseModel):
@@ -66,7 +69,10 @@ def _process_request(pipeline, request) -> Response:
                 values = [values]
             filters[key] = values
-    result = pipeline.run(query=request.query, filters=filters)
+    result = pipeline.run(query=request.query,
+                          filters=filters,
+                          top_k_retriever=request.top_k_retriever,
+                          top_k_reader=request.top_k_reader)
     end_time = time.time()
     logger.info(json.dumps({"request": request.dict(), "response": result, "time": f"{(end_time - start_time):.2f}"}))
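With the two new optional fields on the Request model, API clients can decide per query how many documents the retriever fetches and how many answers the reader returns. A minimal client sketch follows; the route ("/query"), host, and port are assumptions about the deployment rather than part of this diff, and the filter key is purely illustrative.

# Hypothetical client call exercising the new parameters (sketch, not from this diff).
import requests

payload = {
    "query": "Who is the father of Arya Stark?",
    "filters": {"name": ["arya_stark.txt"]},  # illustrative filter; key and value are made up
    "top_k_retriever": 10,  # documents the retriever should fetch
    "top_k_reader": 3,      # answers the reader should return
}

# Route and port are assumptions about how the REST API is served.
response = requests.post("http://localhost:8000/query", json=payload)
print(response.json())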


@@ -4,16 +4,16 @@ WORKDIR /home/user
 RUN apt-get update && apt-get install -y curl git pkg-config cmake
+# install as a package
+COPY requirements.txt /home/user/
+RUN pip install -r requirements.txt
 # copy code
 COPY utils.py /home/user/
 COPY webapp.py /home/user/
 COPY eval_labels_example.csv /home/user/
 COPY SessionState.py /home/user/
-# install as a package
-COPY requirements.txt /home/user/
-RUN pip install -r requirements.txt
 EXPOSE 8501
 # cmd for running the API


@@ -13,14 +13,30 @@ from utils import feedback_doc
 from utils import retrieve_doc
 from utils import upload_doc
+# Adjust to a question that you would like users to see in the search bar when they load the UI:
+DEFAULT_QUESTION_AT_STARTUP = "Who is the father of Arya Stark?"
 def annotate_answer(answer, context):
+    """ If we are using an extractive QA pipeline, we'll get answers
+    from the API that we highlight in the given context"""
     start_idx = context.find(answer)
     end_idx = start_idx + len(answer)
     annotated_text(context[:start_idx], (answer, "ANSWER", "#8ef"), context[end_idx:])
+def show_plain_documents(text):
+    """ If we are using a plain document search pipeline, i.e. only retriever, we'll get plain documents
+    from the API that we just show without any highlighting"""
+    st.markdown(text)
 def random_questions(df):
+    """
+    Helper to get one random question + gold random_answer from the user's CSV 'eval_labels_example'.
+    This can then be shown in the UI when the evaluation mode is selected. Users can easily give feedback on the
+    model's results and "enrich" the eval dataset with more acceptable labels
+    """
     random_row = df.sample(1)
     random_question = random_row["Question Text"].values[0]
     random_answer = random_row["Answer"].values[0]
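random_questions() is what feeds the evaluation mode its prompts. The hunk cuts off before the function's return statement, so the sketch below only replays the selection logic that is visible; the semicolon separator for the CSV is an assumption, while the EVAL_FILE default and the "Question Text"/"Answer" column names come from the code itself.

# Sketch of drawing one random question/gold answer pair from the eval CSV.
import os
import pandas as pd

eval_labels = os.getenv("EVAL_FILE", "eval_labels_example.csv")
df = pd.read_csv(eval_labels, sep=";")  # separator is an assumption, not shown in this diff

random_row = df.sample(1)
random_question = random_row["Question Text"].values[0]
random_answer = random_row["Answer"].values[0]
print(f"{random_question} -> {random_answer}")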
@@ -29,12 +45,12 @@ def random_questions(df):
 # Define state
 state_question = SessionState.get(
-    random_question="Who is the father of Arya Starck?", random_answer="", next_question="false", run_query="false"
+    random_question=DEFAULT_QUESTION_AT_STARTUP, random_answer="", next_question="false", run_query="false"
 )
 # Initialize variables
 eval_mode = False
-random_question = "Who is the father of Arya Starck?"
+random_question = DEFAULT_QUESTION_AT_STARTUP
 eval_labels = os.getenv("EVAL_FILE", "eval_labels_example.csv")
 # UI search bar and sidebar
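The SessionState helper (copied into the image next to webapp.py in the Dockerfile above) is what keeps the default question from being lost on every Streamlit rerun. A short sketch of the pattern, based only on the calls visible in this file:

# Streamlit reruns the whole script on every interaction; SessionState.get(...)
# returns an object whose attributes persist across those reruns.
import SessionState  # gist-based helper shipped alongside webapp.py

DEFAULT_QUESTION_AT_STARTUP = "Who is the father of Arya Stark?"

state_question = SessionState.get(
    random_question=DEFAULT_QUESTION_AT_STARTUP, random_answer="", next_question="false", run_query="false"
)

# Later, e.g. after the "Load new question" button fires, the new pair is stored
# on the state object so it survives the next rerun:
# state_question.random_question = random_question
# state_question.random_answer = random_answer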
@@ -76,7 +92,7 @@ if eval_mode:
         state_question.random_question = random_question
         state_question.random_answer = random_answer
-# Generate new random question
+# Get next random question from the CSV
 if eval_mode:
     next_question = st.button("Load new question")
     if next_question:
@@ -113,23 +129,26 @@ if run_query:
         st.write("## Correct answers:")
         random_answer
-    st.write("## Retrieved answers:")
+    st.write("## Results:")
     # Make every button key unique
     count = 0
     for result in results:
-        annotate_answer(result["answer"], result["context"])
-        "**Relevance:** ", result["relevance"], "**Source:** ", result["source"]
+        if result["answer"]:
+            annotate_answer(result["answer"], result["context"])
+        else:
+            show_plain_documents(result["context"])
+        st.write("**Relevance:** ", result["relevance"], "**Source:** ", result["source"])
         if eval_mode:
             # Define columns for buttons
             button_col1, button_col2, button_col3, button_col4 = st.beta_columns([1, 1, 1, 6])
-            if button_col1.button("👍", key=(result["answer"] + str(count)), help="Correct answer"):
+            if button_col1.button("👍", key=(result["context"] + str(count)), help="Correct answer"):
                 raw_json_feedback = feedback_doc(
                     question, "true", result["document_id"], 1, "true", result["answer"], result["offset_start_in_doc"]
                 )
                 st.success("Thanks for your feedback")
-            if button_col2.button("👎", key=(result["answer"] + str(count)), help="Wrong answer and wrong passage"):
+            if button_col2.button("👎", key=(result["context"] + str(count)), help="Wrong answer and wrong passage"):
                 raw_json_feedback = feedback_doc(
                     question,
                     "false",
@@ -140,7 +159,7 @@ if run_query:
                     result["offset_start_in_doc"],
                 )
                 st.success("Thanks for your feedback!")
-            if button_col3.button("👎👍", key=(result["answer"] + str(count)), help="Wrong answer, but correct passage"):
+            if button_col3.button("👎👍", key=(result["context"] + str(count)), help="Wrong answer, but correct passage"):
                 raw_json_feedback = feedback_doc(
                     question, "false", result["document_id"], 1, "true", result["answer"], result["offset_start_in_doc"]
                 )
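For reference, the loop above only ever reads a handful of keys from each result returned by retrieve_doc. A hedged sketch of that shape follows; the key names are taken from the diff, while the example values are invented.

# Keys read by the UI loop: "answer", "context", "relevance", "source",
# "document_id", "offset_start_in_doc". The values below are made-up examples.
example_result = {
    "answer": "Eddard Stark",  # empty for a retriever-only (document search) pipeline
    "context": "... Arya Stark is the daughter of Eddard Stark ...",
    "relevance": 9.87,
    "source": "wiki_arya_stark.txt",
    "document_id": "a1b2c3d4",
    "offset_start_in_doc": 42,
}

# Extractive QA: annotate_answer(example_result["answer"], example_result["context"])
# Document search only: show_plain_documents(example_result["context"])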