mirror of
https://github.com/deepset-ai/haystack.git
synced 2026-01-28 02:23:48 +00:00
* add time and perf benchmark for es * Add retriever benchmarking * Add Reader benchmarking * add nq to squad conversion * add conversion stats * clean benchmarks * Add link to dataset * Update imports * add first support for neg psgs * Refactor test * set max_seq_len * cleanup benchmark * begin retriever speed benchmarking * Add support for retriever query index benchmarking * improve reader eval, retriever speed benchmarking * improve retriever speed benchmarking * Add retriever accuracy benchmark * Add neg doc shuffling * Add top_n * 3x speedup of SQL. add postgres docker run. make shuffle neg a param. add more logging * Add models to sweep * add option for faiss index type * remove unneeded line * change faiss to faiss_flat * begin automatic benchmark script * remove existing postgres docker for benchmarking * Add data processing scripts * Remove shuffle in script bc data already shuffled * switch hnsw setup from 256 to 128 * change es similarity to dot product by default * Error includes stack trace * Change ES default timeout * remove delete_docs() from timing for indexing * Add support for website export * update website on push to benchmarks * add complete benchmarks results * new json format * removed NaN as is not a valid json token * fix benchmarking for faiss hnsw queries. do sql calls in update_embeddings() as batches * update benchmarks for hnsw 128,20,80 * don't delete full index in delete_all_documents() * update texts for charts * update recall column for retriever * change scale and add units to desc * add units to legend * add axis titles. update desc * add html tags Co-authored-by: deepset <deepset@Crenolape.localdomain> Co-authored-by: Malte Pietsch <malte.pietsch@deepset.ai> Co-authored-by: PiffPaffM <markuspaff.mp@gmail.com>
105 lines
1.9 KiB
JSON
105 lines
1.9 KiB
JSON
{
|
|
"chart_type": "LineChart",
|
|
"title": "Retriever Speed",
|
|
"subtitle": "Query Speed at different number of docs",
|
|
"description": "Here you can see how the query speed of different Retriever / DocumentStore combinations scales as the number of documents increases. The setup is the same as the above querying benchmark except that a varying number of negative documents are used to fill the document store.",
|
|
"columns": [
|
|
"n_docs",
|
|
"BM25 / ElasticSearch",
|
|
"DPR / ElasticSearch",
|
|
"DPR / FAISS (flat)",
|
|
"DPR / FAISS (HSNW)"
|
|
],
|
|
"axis": [
|
|
{ "x": "Number of docs", "y": "Queries/sec" }
|
|
],
|
|
"data":
|
|
[
|
|
[
|
|
"model",
|
|
"n_docs",
|
|
"query_speed"
|
|
],
|
|
[
|
|
"DPR / ElasticSearch",
|
|
1000,
|
|
40.802
|
|
],
|
|
[
|
|
"BM25 / ElasticSearch",
|
|
1000,
|
|
232.97799999999998
|
|
],
|
|
[
|
|
"BM25 / ElasticSearch",
|
|
10000,
|
|
167.81
|
|
],
|
|
[
|
|
"DPR / ElasticSearch",
|
|
10000,
|
|
27.006999999999998
|
|
],
|
|
[
|
|
"DPR / ElasticSearch",
|
|
100000,
|
|
6.5360000000000005
|
|
],
|
|
[
|
|
"BM25 / ElasticSearch",
|
|
100000,
|
|
162.996
|
|
],
|
|
[
|
|
"DPR / FAISS (flat)",
|
|
1000,
|
|
40.048
|
|
],
|
|
[
|
|
"DPR / FAISS (flat)",
|
|
10000,
|
|
23.976999999999997
|
|
],
|
|
[
|
|
"DPR / FAISS (flat)",
|
|
100000,
|
|
5.044
|
|
],
|
|
[
|
|
"DPR / FAISS (HSNW)",
|
|
1000,
|
|
37.884
|
|
],
|
|
[
|
|
"DPR / FAISS (HSNW)",
|
|
10000,
|
|
33.421
|
|
],
|
|
[
|
|
"DPR / FAISS (HSNW)",
|
|
100000,
|
|
12.815
|
|
],
|
|
[
|
|
"DPR / ElasticSearch",
|
|
500000,
|
|
1.514
|
|
],
|
|
[
|
|
"DPR / FAISS (flat)",
|
|
500000,
|
|
1.091
|
|
],
|
|
[
|
|
"BM25 / ElasticSearch",
|
|
500000,
|
|
95.491
|
|
],
|
|
[
|
|
"DPR / FAISS (HSNW)",
|
|
500000,
|
|
3.259
|
|
]
|
|
]
|
|
|
|
} |