From 2caeea000ea3525130086e76384d6134b8216557 Mon Sep 17 00:00:00 2001
From: Malte Pietsch
Date: Thu, 24 Jun 2021 09:53:08 +0200
Subject: [PATCH] Small UI and REST API fixes (#1223)

* small fixes

* change default question
---
 rest_api/controller/search.py |  8 +++++++-
 ui/Dockerfile                 |  8 ++++----
 ui/webapp.py                  | 37 ++++++++++++++++++++++++++---------
 3 files changed, 39 insertions(+), 14 deletions(-)

diff --git a/rest_api/controller/search.py b/rest_api/controller/search.py
index eb3644d03..53eb3919c 100644
--- a/rest_api/controller/search.py
+++ b/rest_api/controller/search.py
@@ -20,6 +20,9 @@ router = APIRouter()
 class Request(BaseModel):
     query: str
     filters: Optional[Dict[str, Optional[Union[str, List[str]]]]] = None
+    top_k_retriever: Optional[int] = None
+    top_k_reader: Optional[int] = None
+
 
 
 class Answer(BaseModel):
@@ -66,7 +69,10 @@ def _process_request(pipeline, request) -> Response:
                 values = [values]
             filters[key] = values
 
-    result = pipeline.run(query=request.query, filters=filters)
+    result = pipeline.run(query=request.query,
+                          filters=filters,
+                          top_k_retriever=request.top_k_retriever,
+                          top_k_reader=request.top_k_reader)
     end_time = time.time()
     logger.info(json.dumps({"request": request.dict(), "response": result, "time": f"{(end_time - start_time):.2f}"}))
 
diff --git a/ui/Dockerfile b/ui/Dockerfile
index 71357aebf..bce12a4fc 100644
--- a/ui/Dockerfile
+++ b/ui/Dockerfile
@@ -4,16 +4,16 @@ WORKDIR /home/user
 
 RUN apt-get update && apt-get install -y curl git pkg-config cmake
 
+# install as a package
+COPY requirements.txt /home/user/
+RUN pip install -r requirements.txt
+
 # copy code
 COPY utils.py /home/user/
 COPY webapp.py /home/user/
 COPY eval_labels_example.csv /home/user/
 COPY SessionState.py /home/user/
 
-# install as a package
-COPY requirements.txt /home/user/
-RUN pip install -r requirements.txt
-
 EXPOSE 8501
 
 # cmd for running the API
diff --git a/ui/webapp.py b/ui/webapp.py
index 0cf5b4fa3..ceb2d7908 100644
--- a/ui/webapp.py
+++ b/ui/webapp.py
@@ -13,14 +13,30 @@ from utils import feedback_doc
 from utils import retrieve_doc
 from utils import upload_doc
 
+# Adjust to a question that you would like users to see in the search bar when they load the UI:
+DEFAULT_QUESTION_AT_STARTUP = "Who is the father of Arya Stark?"
+
 
 def annotate_answer(answer, context):
+    """ If we are using an extractive QA pipeline, we'll get answers
+    from the API that we highlight in the given context"""
     start_idx = context.find(answer)
     end_idx = start_idx + len(answer)
     annotated_text(context[:start_idx], (answer, "ANSWER", "#8ef"), context[end_idx:])
 
 
+def show_plain_documents(text):
+    """ If we are using a plain document search pipeline, i.e. only retriever, we'll get plain documents
+    from the API that we just show without any highlighting"""
+    st.markdown(text)
+
+
 def random_questions(df):
+    """
+    Helper to get one random question + gold random_answer from the user's CSV 'eval_labels_example'.
+    This can then be shown in the UI when the evaluation mode is selected. Users can easily give feedback on the
+    model's results and "enrich" the eval dataset with more acceptable labels
+    """
     random_row = df.sample(1)
     random_question = random_row["Question Text"].values[0]
     random_answer = random_row["Answer"].values[0]
@@ -29,12 +45,12 @@ def random_questions(df):
 
 # Define state
 state_question = SessionState.get(
-    random_question="Who is the father of Arya Starck?", random_answer="", next_question="false", run_query="false"
+    random_question=DEFAULT_QUESTION_AT_STARTUP, random_answer="", next_question="false", run_query="false"
 )
 
 # Initialize variables
 eval_mode = False
-random_question = "Who is the father of Arya Starck?"
+random_question = DEFAULT_QUESTION_AT_STARTUP
 eval_labels = os.getenv("EVAL_FILE", "eval_labels_example.csv")
 
 # UI search bar and sidebar
@@ -76,7 +92,7 @@ if eval_mode:
         state_question.random_question = random_question
         state_question.random_answer = random_answer
 
-# Generate new random question
+# Get next random question from the CSV
 if eval_mode:
     next_question = st.button("Load new question")
     if next_question:
@@ -113,23 +129,26 @@ if run_query:
         st.write("## Correct answers:")
         random_answer
 
-    st.write("## Retrieved answers:")
+    st.write("## Results:")
 
     # Make every button key unique
    count = 0

     for result in results:
-        annotate_answer(result["answer"], result["context"])
-        "**Relevance:** ", result["relevance"], "**Source:** ", result["source"]
+        if result["answer"]:
+            annotate_answer(result["answer"], result["context"])
+        else:
+            show_plain_documents(result["context"])
+        st.write("**Relevance:** ", result["relevance"], "**Source:** ", result["source"])
         if eval_mode:
             # Define columns for buttons
             button_col1, button_col2, button_col3, button_col4 = st.beta_columns([1, 1, 1, 6])
-            if button_col1.button("👍", key=(result["answer"] + str(count)), help="Correct answer"):
+            if button_col1.button("👍", key=(result["context"] + str(count)), help="Correct answer"):
                 raw_json_feedback = feedback_doc(
                     question, "true", result["document_id"], 1, "true", result["answer"], result["offset_start_in_doc"]
                 )
                 st.success("Thanks for your feedback")
-            if button_col2.button("👎", key=(result["answer"] + str(count)), help="Wrong answer and wrong passage"):
+            if button_col2.button("👎", key=(result["context"] + str(count)), help="Wrong answer and wrong passage"):
                 raw_json_feedback = feedback_doc(
                     question,
                     "false",
@@ -140,7 +159,7 @@ if run_query:
                     result["offset_start_in_doc"],
                 )
                 st.success("Thanks for your feedback!")
-            if button_col3.button("👎👍", key=(result["answer"] + str(count)), help="Wrong answer, but correct passage"):
+            if button_col3.button("👎👍", key=(result["context"] + str(count)), help="Wrong answer, but correct passage"):
                 raw_json_feedback = feedback_doc(
                     question, "true", result["document_id"], 1, "true", result["answer"], result["offset_start_in_doc"]
                 )
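
Note (not part of the patch): the two new optional fields on the REST Request model, top_k_retriever and top_k_reader, let callers control how many documents the retriever returns and how many answers the reader extracts per query. Below is a minimal client sketch; the host, port, and the "/query" route are illustrative assumptions and are not defined by this patch.

import requests

# Hypothetical endpoint; adjust host/port/route to your own deployment.
API_ENDPOINT = "http://localhost:8000/query"

payload = {
    "query": "Who is the father of Arya Stark?",
    "filters": None,            # optional metadata filters, e.g. {"name": ["some_doc.txt"]}
    "top_k_retriever": 10,      # new field: number of documents the retriever should return
    "top_k_reader": 3,          # new field: number of answers the reader should return
}

response = requests.post(API_ENDPOINT, json=payload)
response.raise_for_status()
print(response.json())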