haystack/ui/webapp.py

import os
import sys
import streamlit as st
from utils import retrieve_doc
from utils import feedback_doc
from annotated_text import annotated_text
import pandas as pd
# Streamlit does not support any state out of the box. On every button click, Streamlit reloads the whole page
# and every value gets lost. To keep track of our feedback state we use the official Streamlit gist mentioned
# here: https://gist.github.com/tvst/036da038ab3e999a64497f42de966a92
import SessionState

def annotate_answer(answer, context):
    """Render ``context`` with the first occurrence of ``answer`` highlighted.

    Args:
        answer: The answer text to highlight. May be empty or ``None``, in
            which case only the context is rendered.
        context: The passage the answer is expected to appear in.

    The output is drawn through ``annotated_text``; nothing is returned.
    """
    # Only search when there is something to search for: an empty answer
    # "matches" at index 0 and would render an empty badge, and None would
    # make str.find raise.
    start_idx = context.find(answer) if answer else -1

    if start_idx < 0:
        # str.find returns -1 when the answer is not part of the context.
        # Slicing with that index would drop the last context character and
        # append an arbitrary tail, so render the context untouched and, if
        # there is an answer at all, show it as a separate badge after it.
        if answer:
            annotated_text(context, (answer, "ANSWER", "#8ef"))
        else:
            annotated_text(context)
        return

    end_idx = start_idx + len(answer)
    annotated_text(context[:start_idx], (answer, "ANSWER", "#8ef"), context[end_idx:])

def random_questions(df):
    """Pick one random row of ``df`` and return its question/answer pair.

    Args:
        df: DataFrame that has a "Question Text" and an "Answer" column.

    Returns:
        A ``(question, answer)`` tuple taken from the same sampled row.
    """
    sampled = df.sample(1)
    # Both values are read from the single sampled row, one column at a time.
    question, answer = (
        sampled[column].values[0] for column in ("Question Text", "Answer")
    )
    return question, answer

# Define state
# The flags are real booleans. The former string defaults 'false'/'true' are
# always truthy in Python, so every rerun executed the query and neither the
# "Run" button nor the reset done by "Load new question" had any effect.
state_question = SessionState.get(
    random_question='Who is the father of Arya Starck?',
    random_answer='',
    next_question=False,
    run_query=False,
)

# Initialize variables
eval_mode = False
random_question = "Who is the father of Arya Starck?"
eval_labels = os.getenv("EVAL_FILE", "eval_labels_example.csv")

# UI search bar and sidebar
st.write("# Haystack Demo")
st.sidebar.header("Options")
top_k_reader = st.sidebar.slider("Max. number of answers", min_value=1, max_value=10, value=3, step=1)
top_k_retriever = st.sidebar.slider("Max. number of documents from retriever", min_value=1, max_value=10, value=3, step=1)
eval_mode = st.sidebar.checkbox("Evalution mode")
debug = st.sidebar.checkbox("Show debug info")

if eval_mode:
    # Load csv into pandas dataframe
    try:
        df = pd.read_csv(eval_labels, sep=";")
    except Exception:
        # Show the problem in the page and halt this script run instead of
        # calling sys.exit() from inside the Streamlit script.
        st.error('The eval file was not found. Please check the README for more information.')
        st.stop()

    # Reuse the question kept in the session so it survives the rerun that
    # every widget interaction triggers. A new one is only drawn on request.
    random_question = state_question.random_question
    random_answer = state_question.random_answer

    # Generate new random question
    next_question = st.button("Load new question")
    if next_question:
        random_question, random_answer = random_questions(df)
        state_question.random_question = random_question
        state_question.random_answer = random_answer
        # Hide the results of the previous question until "Run" is pressed.
        state_question.run_query = False
    state_question.next_question = next_question

# Search bar
question = st.text_input("Please provide your query:", value=random_question)
# The button is always rendered. Once a query has been started the flag stays
# set in the session, so the results are still shown after the reruns caused
# by the feedback buttons.
run_pressed = st.button("Run")
run_query = state_question.run_query or run_pressed
state_question.run_query = run_query

raw_json_feedback = ""

# Get results for query
if run_query:
    with st.spinner("Performing neural search on documents... 🧠 \n "
                    "Do you want to optimize speed or accuracy? \n"
                    "Check out the docs: https://haystack.deepset.ai/docs/latest/optimizationmd "):
        results, raw_json = retrieve_doc(question, top_k_reader=top_k_reader, top_k_retriever=top_k_retriever)

    # Show the expected answer only while the query is still the unmodified
    # question taken from the eval set
    if question == random_question and eval_mode:
        st.write("## Correct answers:")
        # Explicit st.write instead of a bare expression, so the output does
        # not depend on Streamlit's "magic" rendering being enabled.
        st.write(random_answer)

    st.write("## Retrieved answers:")

    # The running index keeps button keys unique across results, even when
    # two results carry the same answer text.
    for count, result in enumerate(results):
        annotate_answer(result['answer'], result['context'])
        st.write('**Relevance:** ', result['relevance'], '**Source:** ', result['source'])
        if eval_mode:
            # Define columns for buttons (the wide last column is only a spacer)
            button_col1, button_col2, button_col3, _ = st.beta_columns([1, 1, 1, 6])
            # Every button gets its own key; the three buttons of one result
            # previously shared a single key. The f-string also tolerates a
            # non-string answer, which `answer + str(count)` did not.
            key_prefix = f"{result['answer']}{count}"
            if button_col1.button("👍", key=f"{key_prefix}-correct", help="Correct answer"):
                raw_json_feedback = feedback_doc(question, "true", result['document_id'], 1, "true", result['answer'], result['offset_start_in_doc'])
                st.success('Thanks for your feedback')
            if button_col2.button("👎", key=f"{key_prefix}-wrong", help="Wrong answer and wrong passage"):
                raw_json_feedback = feedback_doc(question, "false", result['document_id'], 1, "false", result['answer'], result['offset_start_in_doc'])
                st.success('Thanks for your feedback!')
            if button_col3.button("👎👍", key=f"{key_prefix}-wrong-answer", help="Wrong answer, but correct passage"):
                raw_json_feedback = feedback_doc(question, "false", result['document_id'], 1, "true", result['answer'], result['offset_start_in_doc'])
                st.success('Thanks for your feedback!')
        st.write("___")
    if debug:
        st.subheader("REST API JSON response")
        st.write(raw_json)
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`import os`
			`import sys`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`import streamlit as st`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`from utils import retrieve_doc`
			`from utils import feedback_doc`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`from annotated_text import annotated_text`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`import pandas as pd`
			`# streamlit does not support any states out of the box. On every button click, streamlit reload the whole page`
			`# and every value gets lost. To keep track of our feedback state we use the official streamlit gist mentioned`
			`# here https://gist.github.com/tvst/036da038ab3e999a64497f42de966a92`
			`import SessionState`
Refactor REST APIs to use Pipelines (#922) 2021-04-07 17:53:32 +02:00
			`def annotate_answer(answer, context):`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`start_idx = context.find(answer)`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`end_idx = start_idx+len(answer)`
			`annotated_text(context[:start_idx],(answer,"ANSWER","#8ef"),context[end_idx:])`

			`def random_questions(df):`
			`random_row = df.sample(1)`
			`random_question = random_row["Question Text"].values[0]`
			`random_answer = random_row["Answer"].values[0]`
			`return random_question, random_answer`
Refactor REST APIs to use Pipelines (#922) 2021-04-07 17:53:32 +02:00
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`# Define state`
			`state_question = SessionState.get(random_question='Who is the father of Arya Starck?', random_answer='', next_question='false', run_query='false')`
Refactor REST APIs to use Pipelines (#922) 2021-04-07 17:53:32 +02:00
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`# Initalize variables`
			`eval_mode = False`
			`random_question = "Who is the father of Arya Starck?"`
			`eval_labels = os.getenv("EVAL_FILE", "eval_labels_example.csv")`

			`# UI search bar and sidebar`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`st.write("# Haystack Demo")`
			`st.sidebar.header("Options")`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`top_k_reader = st.sidebar.slider("Max. number of answers",min_value=1,max_value=10,value=3,step=1)`
			`top_k_retriever = st.sidebar.slider("Max. number of documents from retriever",min_value=1,max_value=10,value=3,step=1)`
			`eval_mode = st.sidebar.checkbox("Evalution mode")`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`debug = st.sidebar.checkbox("Show debug info")`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00
			`# load csv into pandas dataframe`
			`if eval_mode:`
			`try:`
			`df = pd.read_csv(eval_labels, sep=";")`
			`except Exception:`
			`sys.exit('The eval file was not found. Please check the README for more information.')`
			`if state_question and hasattr(state_question, 'next_question') and hasattr(state_question, 'random_question') and state_question.next_question:`
			`random_question = state_question.random_question`
			`random_answer = state_question.random_answer`
			`else:`
			`random_question, random_answer = random_questions(df)`
			`state_question.random_question = random_question`
			`state_question.random_answer = random_answer`

			`# Generate new random question`
			`if eval_mode:`
			`next_question = st.button("Load new question")`
			`if next_question:`
			`random_question, random_answer = random_questions(df)`
			`state_question.random_question = random_question`
			`state_question.random_answer = random_answer`
			`state_question.next_question = "true"`
			`state_question.run_query = "false"`
			`else:`
			`state_question.next_question = "false"`

			`# Search bar`
			`question = st.text_input("Please provide your query:",value=random_question)`
			`if state_question and state_question.run_query:`
			`run_query = state_question.run_query`
			`st.button("Run")`
			`else:`
			`run_query = st.button("Run")`
			`state_question.run_query = run_query`

			`raw_json_feedback = ""`

			`# Get results for query`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`if run_query:`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`with st.spinner("Performing neural search on documents... 🧠 \n "`
			`"Do you want to optimize speed or accuracy? \n"`
			`"Check out the docs: https://haystack.deepset.ai/docs/latest/optimizationmd "):`
			`results,raw_json = retrieve_doc(question,top_k_reader=top_k_reader,top_k_retriever=top_k_retriever)`

			`# Show if we use a question of the given set`
			`if question == random_question and eval_mode:`
			`st.write("## Correct answers:")`
			`random_answer`

Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`st.write("## Retrieved answers:")`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00
			`# Make every button key unique`
			`count = 0`

Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`for result in results:`
Streamlit UI Evaluation mode (#920) * first running version of eval mode * restructuring, new naming of elements and testing * add new files to Docker, how to start with Haystack reference, remove not needed dependencies * Add latest docstring and tutorial changes * merged changes * fixing bugs after breaking changes from last release * newser version of states in streamlit, more docs for eval mode, eval file as env virable * eval file as env variable Co-authored-by: github-actions[bot] <41898282+github-actions[bot]@users.noreply.github.com> 2021-04-22 17:30:17 +02:00			`annotate_answer(result['answer'],result['context'])`
			`'Relevance: ', result['relevance'] , 'Source: ' , result['source']`
			`if eval_mode:`
			`# Define columns for buttons`
			`button_col1, button_col2, button_col3, button_col4 = st.beta_columns([1,1,1,6])`
			`if button_col1.button("👍", key=(result['answer'] + str(count)), help="Correct answer"):`
			`raw_json_feedback = feedback_doc(question,"true",result['document_id'],1,"true",result['answer'],result['offset_start_in_doc'])`
			`st.success('Thanks for your feedback')`
			`if button_col2.button("👎", key=(result['answer'] + str(count)), help="Wrong answer and wrong passage"):`
			`raw_json_feedback = feedback_doc(question,"false",result['document_id'],1,"false",result['answer'],result['offset_start_in_doc'])`
			`st.success('Thanks for your feedback!')`
			`if button_col3.button("👎👍", key=(result['answer'] + str(count)), help="Wrong answer, but correct passage"):`
			`raw_json_feedback = feedback_doc(question,"false",result['document_id'],1,"true",result['answer'],result['offset_start_in_doc'])`
			`st.success('Thanks for your feedback!')`
			`count+=1`
			`st.write("___")`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`if debug:`
Refactor REST APIs to use Pipelines (#922) 2021-04-07 17:53:32 +02:00			`st.subheader("REST API JSON response")`
Add basic demo UI via streamlit (#671) * Added starter code for frontend demo * worked on comments * Added Docker config for frontend * update docker file. restructure folder structure. minimal renamings and defaults * add screenshot to readme Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> 2020-12-27 18:06:09 +05:30			`st.write(raw_json)`