Deploying to gh-pages from @ microsoft/graphrag@e0d233fe10 🚀

This commit is contained in:
AlonsoGuevara 2025-02-25 00:37:36 +00:00
parent b26fbf993b
commit e9c6433127
5 changed files with 266 additions and 192 deletions

View File

@ -2052,80 +2052,27 @@ text_unit_df.head()</div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">FileNotFoundError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[2], line 37</span>
<span class="ansi-green-intense-fg ansi-bold"> 33</span> COMMUNITY_LEVEL <span style="color: rgb(98,98,98)">=</span> <span style="color: rgb(98,98,98)">2</span>
<span class="ansi-green-intense-fg ansi-bold"> 36</span> <span style="color: rgb(95,135,135)"># read nodes table to get community and degree data</span>
<span class="ansi-green-fg">---&gt; 37</span> entity_df <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">pd</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">.</span><span class="ansi-yellow-bg">read_parquet</span><span class="ansi-yellow-bg">(</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">f</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">"</span><span class="ansi-yellow-bg ansi-bold" style="color: rgb(175,95,135)">{</span><span class="ansi-yellow-bg">INPUT_DIR</span><span class="ansi-yellow-bg ansi-bold" style="color: rgb(175,95,135)">}</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">/</span><span class="ansi-yellow-bg ansi-bold" style="color: rgb(175,95,135)">{</span><span class="ansi-yellow-bg">ENTITY_TABLE</span><span class="ansi-yellow-bg ansi-bold" style="color: rgb(175,95,135)">}</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">.parquet</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">"</span><span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 38</span> community_df <span style="color: rgb(98,98,98)">=</span> pd<span style="color: rgb(98,98,98)">.</span>read_parquet(<span style="color: rgb(175,0,0)">f</span><span style="color: rgb(175,0,0)">"</span><span class="ansi-bold" style="color: rgb(175,95,135)">{</span>INPUT_DIR<span class="ansi-bold" style="color: rgb(175,95,135)">}</span><span style="color: rgb(175,0,0)">/</span><span class="ansi-bold" style="color: rgb(175,95,135)">{</span>COMMUNITY_TABLE<span class="ansi-bold" style="color: rgb(175,95,135)">}</span><span style="color: rgb(175,0,0)">.parquet</span><span style="color: rgb(175,0,0)">"</span>)
<span class="ansi-green-intense-fg ansi-bold"> 40</span> <span style="color: rgb(0,135,0)">print</span>(<span style="color: rgb(175,0,0)">f</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">Entity df columns: </span><span class="ansi-bold" style="color: rgb(175,95,135)">{</span>entity_df<span style="color: rgb(98,98,98)">.</span>columns<span class="ansi-bold" style="color: rgb(175,95,135)">}</span><span style="color: rgb(175,0,0)">"</span>)
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/parquet.py:667</span>, in <span class="ansi-cyan-fg">read_parquet</span><span class="ansi-blue-fg">(path, engine, columns, storage_options, use_nullable_dtypes, dtype_backend, filesystem, filters, **kwargs)</span>
<span class="ansi-green-intense-fg ansi-bold"> 664</span> use_nullable_dtypes <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">False</span>
<span class="ansi-green-intense-fg ansi-bold"> 665</span> check_dtype_backend(dtype_backend)
<span class="ansi-green-fg">--&gt; 667</span> <span class="ansi-bold" style="color: rgb(0,135,0)">return</span> <span class="ansi-yellow-bg">impl</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">.</span><span class="ansi-yellow-bg">read</span><span class="ansi-yellow-bg">(</span>
<span class="ansi-green-intense-fg ansi-bold"> 668</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">path</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 669</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">columns</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">columns</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 670</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">filters</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">filters</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 671</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 672</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">use_nullable_dtypes</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">use_nullable_dtypes</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 673</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">dtype_backend</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">dtype_backend</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 674</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">filesystem</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">filesystem</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 675</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">*</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">*</span><span class="ansi-yellow-bg">kwargs</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 676</span> <span class="ansi-yellow-bg">)</span>
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/parquet.py:267</span>, in <span class="ansi-cyan-fg">PyArrowImpl.read</span><span class="ansi-blue-fg">(self, path, columns, filters, use_nullable_dtypes, dtype_backend, storage_options, filesystem, **kwargs)</span>
<span class="ansi-green-intense-fg ansi-bold"> 264</span> <span class="ansi-bold" style="color: rgb(0,135,0)">if</span> manager <span style="color: rgb(98,98,98)">==</span> <span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">array</span><span style="color: rgb(175,0,0)">"</span>:
<span class="ansi-green-intense-fg ansi-bold"> 265</span> to_pandas_kwargs[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">split_blocks</span><span style="color: rgb(175,0,0)">"</span>] <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">True</span> <span style="color: rgb(95,135,135)"># type: ignore[assignment]</span>
<span class="ansi-green-fg">--&gt; 267</span> path_or_handle, handles, filesystem <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">_get_path_or_handle</span><span class="ansi-yellow-bg">(</span>
<span class="ansi-green-intense-fg ansi-bold"> 268</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">path</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 269</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">filesystem</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 270</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 271</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">mode</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">"</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">rb</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">"</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 272</span> <span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 273</span> <span class="ansi-bold" style="color: rgb(0,135,0)">try</span>:
<span class="ansi-green-intense-fg ansi-bold"> 274</span> pa_table <span style="color: rgb(98,98,98)">=</span> <span style="color: rgb(0,135,0)">self</span><span style="color: rgb(98,98,98)">.</span>api<span style="color: rgb(98,98,98)">.</span>parquet<span style="color: rgb(98,98,98)">.</span>read_table(
<span class="ansi-green-intense-fg ansi-bold"> 275</span> path_or_handle,
<span class="ansi-green-intense-fg ansi-bold"> 276</span> columns<span style="color: rgb(98,98,98)">=</span>columns,
<span class="ansi-red-fg">ModuleNotFoundError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[2], line 15</span>
<span class="ansi-green-intense-fg ansi-bold"> 7</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">config</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">models</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">drift_search_config</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> DRIFTSearchConfig
<span class="ansi-green-intense-fg ansi-bold"> 8</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">indexer_adapters</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> (
<span class="ansi-green-intense-fg ansi-bold"> 9</span> read_indexer_entities,
<span class="ansi-green-intense-fg ansi-bold"> 10</span> read_indexer_relationships,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 279</span> <span style="color: rgb(98,98,98)">*</span><span style="color: rgb(98,98,98)">*</span>kwargs,
<span class="ansi-green-intense-fg ansi-bold"> 280</span> )
<span class="ansi-green-intense-fg ansi-bold"> 13</span> read_indexer_text_units,
<span class="ansi-green-intense-fg ansi-bold"> 14</span> )
<span class="ansi-green-fg">---&gt; 15</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">chat_openai</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> ChatOpenAI
<span class="ansi-green-intense-fg ansi-bold"> 16</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">embedding</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> OpenAIEmbedding
<span class="ansi-green-intense-fg ansi-bold"> 17</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">typing</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> OpenaiApiType
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/parquet.py:140</span>, in <span class="ansi-cyan-fg">_get_path_or_handle</span><span class="ansi-blue-fg">(path, fs, storage_options, mode, is_dir)</span>
<span class="ansi-green-intense-fg ansi-bold"> 130</span> handles <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">None</span>
<span class="ansi-green-intense-fg ansi-bold"> 131</span> <span class="ansi-bold" style="color: rgb(0,135,0)">if</span> (
<span class="ansi-green-intense-fg ansi-bold"> 132</span> <span class="ansi-bold" style="color: rgb(175,0,255)">not</span> fs
<span class="ansi-green-intense-fg ansi-bold"> 133</span> <span class="ansi-bold" style="color: rgb(175,0,255)">and</span> <span class="ansi-bold" style="color: rgb(175,0,255)">not</span> is_dir
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 138</span> <span style="color: rgb(95,135,135)"># fsspec resources can also point to directories</span>
<span class="ansi-green-intense-fg ansi-bold"> 139</span> <span style="color: rgb(95,135,135)"># this branch is used for example when reading from non-fsspec URLs</span>
<span class="ansi-green-fg">--&gt; 140</span> handles <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">get_handle</span><span class="ansi-yellow-bg">(</span>
<span class="ansi-green-intense-fg ansi-bold"> 141</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">path_or_handle</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">mode</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">is_text</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg ansi-bold" style="color: rgb(0,135,0)">False</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">storage_options</span>
<span class="ansi-green-intense-fg ansi-bold"> 142</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 143</span> fs <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">None</span>
<span class="ansi-green-intense-fg ansi-bold"> 144</span> path_or_handle <span style="color: rgb(98,98,98)">=</span> handles<span style="color: rgb(98,98,98)">.</span>handle
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/common.py:882</span>, in <span class="ansi-cyan-fg">get_handle</span><span class="ansi-blue-fg">(path_or_buf, mode, encoding, compression, memory_map, is_text, errors, storage_options)</span>
<span class="ansi-green-intense-fg ansi-bold"> 873</span> handle <span style="color: rgb(98,98,98)">=</span> <span style="color: rgb(0,135,0)">open</span>(
<span class="ansi-green-intense-fg ansi-bold"> 874</span> handle,
<span class="ansi-green-intense-fg ansi-bold"> 875</span> ioargs<span style="color: rgb(98,98,98)">.</span>mode,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 878</span> newline<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">"</span>,
<span class="ansi-green-intense-fg ansi-bold"> 879</span> )
<span class="ansi-green-intense-fg ansi-bold"> 880</span> <span class="ansi-bold" style="color: rgb(0,135,0)">else</span>:
<span class="ansi-green-intense-fg ansi-bold"> 881</span> <span style="color: rgb(95,135,135)"># Binary mode</span>
<span class="ansi-green-fg">--&gt; 882</span> handle <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg" style="color: rgb(0,135,0)">open</span><span class="ansi-yellow-bg">(</span><span class="ansi-yellow-bg">handle</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">ioargs</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">.</span><span class="ansi-yellow-bg">mode</span><span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 883</span> handles<span style="color: rgb(98,98,98)">.</span>append(handle)
<span class="ansi-green-intense-fg ansi-bold"> 885</span> <span style="color: rgb(95,135,135)"># Convert BytesIO or file objects passed with an encoding</span>
<span class="ansi-red-fg">FileNotFoundError</span>: [Errno 2] No such file or directory: './inputs/operation dulce/entities.parquet'</pre>
<span class="ansi-red-fg">ModuleNotFoundError</span>: No module named 'graphrag.query.llm.oai'</pre>
</div>
</div>
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell-inputWrapper" tabindex="0">
<div class="jp-Collapser jp-InputCollapser jp-Cell-inputCollapser">
</div>
@ -2190,6 +2137,38 @@ text_embedder = OpenAIEmbedding(
</div>
</div>
</div>
<div class="jp-Cell-outputWrapper">
<div class="jp-Collapser jp-OutputCollapser jp-Cell-outputCollapser">
</div>
<div class="jp-OutputArea jp-Cell-outputArea">
<div class="jp-OutputArea-child">
<div class="jp-OutputPrompt jp-OutputArea-prompt"></div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[3], line 5</span>
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm_model <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_LLM_MODEL</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-intense-fg ansi-bold"> 3</span> embedding_model <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_EMBEDDING_MODEL</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-fg">----&gt; 5</span> chat_llm <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">ChatOpenAI</span>(
<span class="ansi-green-intense-fg ansi-bold"> 6</span> api_key<span style="color: rgb(98,98,98)">=</span>api_key,
<span class="ansi-green-intense-fg ansi-bold"> 7</span> model<span style="color: rgb(98,98,98)">=</span>llm_model,
<span class="ansi-green-intense-fg ansi-bold"> 8</span> api_type<span style="color: rgb(98,98,98)">=</span>OpenaiApiType<span style="color: rgb(98,98,98)">.</span>OpenAI, <span style="color: rgb(95,135,135)"># OpenaiApiType.OpenAI or OpenaiApiType.AzureOpenAI</span>
<span class="ansi-green-intense-fg ansi-bold"> 9</span> max_retries<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">20</span>,
<span class="ansi-green-intense-fg ansi-bold"> 10</span> )
<span class="ansi-green-intense-fg ansi-bold"> 12</span> token_encoder <span style="color: rgb(98,98,98)">=</span> tiktoken<span style="color: rgb(98,98,98)">.</span>encoding_for_model(llm_model)
<span class="ansi-green-intense-fg ansi-bold"> 14</span> text_embedder <span style="color: rgb(98,98,98)">=</span> OpenAIEmbedding(
<span class="ansi-green-intense-fg ansi-bold"> 15</span> api_key<span style="color: rgb(98,98,98)">=</span>api_key,
<span class="ansi-green-intense-fg ansi-bold"> 16</span> api_base<span style="color: rgb(98,98,98)">=</span><span class="ansi-bold" style="color: rgb(0,135,0)">None</span>,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 20</span> max_retries<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">20</span>,
<span class="ansi-green-intense-fg ansi-bold"> 21</span> )
<span class="ansi-red-fg">NameError</span>: name 'ChatOpenAI' is not defined</pre>
</div>
</div>
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
@ -2258,83 +2237,16 @@ read_indexer_report_embeddings(reports, full_content_embedding_store)</div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">FileNotFoundError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[4], line 10</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[4], line 3</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> <span class="ansi-bold" style="color: rgb(0,135,0)">def</span><span style="color: rgb(188,188,188)"> </span><span style="color: rgb(0,0,255)">read_community_reports</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> input_dir: <span style="color: rgb(0,135,0)">str</span>,
<span class="ansi-green-fg">----&gt; 3</span> community_report_table: <span style="color: rgb(0,135,0)">str</span> <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">COMMUNITY_REPORT_TABLE</span>,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> ):
<span class="ansi-green-intense-fg ansi-bold"> 5</span> <span style="color: rgb(188,188,188)"> </span><span style="color: rgb(175,0,0)">"""Embeds the full content of the community reports and saves the DataFrame with embeddings to the output path."""</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> input_path <span style="color: rgb(98,98,98)">=</span> Path(input_dir) <span style="color: rgb(98,98,98)">/</span> <span style="color: rgb(175,0,0)">f</span><span style="color: rgb(175,0,0)">"</span><span class="ansi-bold" style="color: rgb(175,95,135)">{</span>community_report_table<span class="ansi-bold" style="color: rgb(175,95,135)">}</span><span style="color: rgb(175,0,0)">.parquet</span><span style="color: rgb(175,0,0)">"</span>
<span class="ansi-green-intense-fg ansi-bold"> 7</span> <span class="ansi-bold" style="color: rgb(0,135,0)">return</span> pd<span style="color: rgb(98,98,98)">.</span>read_parquet(input_path)
<span class="ansi-green-fg">---&gt; 10</span> report_df <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">read_community_reports</span><span class="ansi-yellow-bg">(</span><span class="ansi-yellow-bg">INPUT_DIR</span><span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 11</span> reports <span style="color: rgb(98,98,98)">=</span> read_indexer_reports(
<span class="ansi-green-intense-fg ansi-bold"> 12</span> report_df,
<span class="ansi-green-intense-fg ansi-bold"> 13</span> community_df,
<span class="ansi-green-intense-fg ansi-bold"> 14</span> COMMUNITY_LEVEL,
<span class="ansi-green-intense-fg ansi-bold"> 15</span> content_embedding_col<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">full_content_embeddings</span><span style="color: rgb(175,0,0)">"</span>,
<span class="ansi-green-intense-fg ansi-bold"> 16</span> )
<span class="ansi-green-intense-fg ansi-bold"> 17</span> read_indexer_report_embeddings(reports, full_content_embedding_store)
Cell <span class="ansi-green-fg">In[4], line 7</span>, in <span class="ansi-cyan-fg">read_community_reports</span><span class="ansi-blue-fg">(input_dir, community_report_table)</span>
<span class="ansi-green-intense-fg ansi-bold"> 5</span> <span style="color: rgb(175,0,0)">"""Embeds the full content of the community reports and saves the DataFrame with embeddings to the output path."""</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> input_path <span style="color: rgb(98,98,98)">=</span> Path(input_dir) <span style="color: rgb(98,98,98)">/</span> <span style="color: rgb(175,0,0)">f</span><span style="color: rgb(175,0,0)">"</span><span class="ansi-bold" style="color: rgb(175,95,135)">{</span>community_report_table<span class="ansi-bold" style="color: rgb(175,95,135)">}</span><span style="color: rgb(175,0,0)">.parquet</span><span style="color: rgb(175,0,0)">"</span>
<span class="ansi-green-fg">----&gt; 7</span> <span class="ansi-bold" style="color: rgb(0,135,0)">return</span> <span class="ansi-yellow-bg">pd</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">.</span><span class="ansi-yellow-bg">read_parquet</span><span class="ansi-yellow-bg">(</span><span class="ansi-yellow-bg">input_path</span><span class="ansi-yellow-bg">)</span>
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/parquet.py:667</span>, in <span class="ansi-cyan-fg">read_parquet</span><span class="ansi-blue-fg">(path, engine, columns, storage_options, use_nullable_dtypes, dtype_backend, filesystem, filters, **kwargs)</span>
<span class="ansi-green-intense-fg ansi-bold"> 664</span> use_nullable_dtypes <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">False</span>
<span class="ansi-green-intense-fg ansi-bold"> 665</span> check_dtype_backend(dtype_backend)
<span class="ansi-green-fg">--&gt; 667</span> <span class="ansi-bold" style="color: rgb(0,135,0)">return</span> <span class="ansi-yellow-bg">impl</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">.</span><span class="ansi-yellow-bg">read</span><span class="ansi-yellow-bg">(</span>
<span class="ansi-green-intense-fg ansi-bold"> 668</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">path</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 669</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">columns</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">columns</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 670</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">filters</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">filters</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 671</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 672</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">use_nullable_dtypes</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">use_nullable_dtypes</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 673</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">dtype_backend</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">dtype_backend</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 674</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">filesystem</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">filesystem</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 675</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">*</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">*</span><span class="ansi-yellow-bg">kwargs</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 676</span> <span class="ansi-yellow-bg">)</span>
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/parquet.py:267</span>, in <span class="ansi-cyan-fg">PyArrowImpl.read</span><span class="ansi-blue-fg">(self, path, columns, filters, use_nullable_dtypes, dtype_backend, storage_options, filesystem, **kwargs)</span>
<span class="ansi-green-intense-fg ansi-bold"> 264</span> <span class="ansi-bold" style="color: rgb(0,135,0)">if</span> manager <span style="color: rgb(98,98,98)">==</span> <span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">array</span><span style="color: rgb(175,0,0)">"</span>:
<span class="ansi-green-intense-fg ansi-bold"> 265</span> to_pandas_kwargs[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">split_blocks</span><span style="color: rgb(175,0,0)">"</span>] <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">True</span> <span style="color: rgb(95,135,135)"># type: ignore[assignment]</span>
<span class="ansi-green-fg">--&gt; 267</span> path_or_handle, handles, filesystem <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">_get_path_or_handle</span><span class="ansi-yellow-bg">(</span>
<span class="ansi-green-intense-fg ansi-bold"> 268</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">path</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 269</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">filesystem</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 270</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 271</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">mode</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">"</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">rb</span><span class="ansi-yellow-bg" style="color: rgb(175,0,0)">"</span><span class="ansi-yellow-bg">,</span>
<span class="ansi-green-intense-fg ansi-bold"> 272</span> <span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 273</span> <span class="ansi-bold" style="color: rgb(0,135,0)">try</span>:
<span class="ansi-green-intense-fg ansi-bold"> 274</span> pa_table <span style="color: rgb(98,98,98)">=</span> <span style="color: rgb(0,135,0)">self</span><span style="color: rgb(98,98,98)">.</span>api<span style="color: rgb(98,98,98)">.</span>parquet<span style="color: rgb(98,98,98)">.</span>read_table(
<span class="ansi-green-intense-fg ansi-bold"> 275</span> path_or_handle,
<span class="ansi-green-intense-fg ansi-bold"> 276</span> columns<span style="color: rgb(98,98,98)">=</span>columns,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 279</span> <span style="color: rgb(98,98,98)">*</span><span style="color: rgb(98,98,98)">*</span>kwargs,
<span class="ansi-green-intense-fg ansi-bold"> 280</span> )
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/parquet.py:140</span>, in <span class="ansi-cyan-fg">_get_path_or_handle</span><span class="ansi-blue-fg">(path, fs, storage_options, mode, is_dir)</span>
<span class="ansi-green-intense-fg ansi-bold"> 130</span> handles <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">None</span>
<span class="ansi-green-intense-fg ansi-bold"> 131</span> <span class="ansi-bold" style="color: rgb(0,135,0)">if</span> (
<span class="ansi-green-intense-fg ansi-bold"> 132</span> <span class="ansi-bold" style="color: rgb(175,0,255)">not</span> fs
<span class="ansi-green-intense-fg ansi-bold"> 133</span> <span class="ansi-bold" style="color: rgb(175,0,255)">and</span> <span class="ansi-bold" style="color: rgb(175,0,255)">not</span> is_dir
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 138</span> <span style="color: rgb(95,135,135)"># fsspec resources can also point to directories</span>
<span class="ansi-green-intense-fg ansi-bold"> 139</span> <span style="color: rgb(95,135,135)"># this branch is used for example when reading from non-fsspec URLs</span>
<span class="ansi-green-fg">--&gt; 140</span> handles <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">get_handle</span><span class="ansi-yellow-bg">(</span>
<span class="ansi-green-intense-fg ansi-bold"> 141</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">path_or_handle</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">mode</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">is_text</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg ansi-bold" style="color: rgb(0,135,0)">False</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">storage_options</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">storage_options</span>
<span class="ansi-green-intense-fg ansi-bold"> 142</span> <span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 143</span> fs <span style="color: rgb(98,98,98)">=</span> <span class="ansi-bold" style="color: rgb(0,135,0)">None</span>
<span class="ansi-green-intense-fg ansi-bold"> 144</span> path_or_handle <span style="color: rgb(98,98,98)">=</span> handles<span style="color: rgb(98,98,98)">.</span>handle
File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/io/common.py:882</span>, in <span class="ansi-cyan-fg">get_handle</span><span class="ansi-blue-fg">(path_or_buf, mode, encoding, compression, memory_map, is_text, errors, storage_options)</span>
<span class="ansi-green-intense-fg ansi-bold"> 873</span> handle <span style="color: rgb(98,98,98)">=</span> <span style="color: rgb(0,135,0)">open</span>(
<span class="ansi-green-intense-fg ansi-bold"> 874</span> handle,
<span class="ansi-green-intense-fg ansi-bold"> 875</span> ioargs<span style="color: rgb(98,98,98)">.</span>mode,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 878</span> newline<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">"</span>,
<span class="ansi-green-intense-fg ansi-bold"> 879</span> )
<span class="ansi-green-intense-fg ansi-bold"> 880</span> <span class="ansi-bold" style="color: rgb(0,135,0)">else</span>:
<span class="ansi-green-intense-fg ansi-bold"> 881</span> <span style="color: rgb(95,135,135)"># Binary mode</span>
<span class="ansi-green-fg">--&gt; 882</span> handle <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg" style="color: rgb(0,135,0)">open</span><span class="ansi-yellow-bg">(</span><span class="ansi-yellow-bg">handle</span><span class="ansi-yellow-bg">,</span><span class="ansi-yellow-bg"> </span><span class="ansi-yellow-bg">ioargs</span><span class="ansi-yellow-bg" style="color: rgb(98,98,98)">.</span><span class="ansi-yellow-bg">mode</span><span class="ansi-yellow-bg">)</span>
<span class="ansi-green-intense-fg ansi-bold"> 883</span> handles<span style="color: rgb(98,98,98)">.</span>append(handle)
<span class="ansi-green-intense-fg ansi-bold"> 885</span> <span style="color: rgb(95,135,135)"># Convert BytesIO or file objects passed with an encoding</span>
<span class="ansi-red-fg">FileNotFoundError</span>: [Errno 2] No such file or directory: 'inputs/operation dulce/community_reports.parquet'</pre>
<span class="ansi-red-fg">NameError</span>: name 'COMMUNITY_REPORT_TABLE' is not defined</pre>
</div>
</div>
</div>
@ -2422,17 +2334,17 @@ search = DRIFTSearch(
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[5], line 13</span>
Cell <span class="ansi-green-fg">In[5], line 10</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> drift_params <span style="color: rgb(98,98,98)">=</span> DRIFTSearchConfig(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> temperature<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">0</span>,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> max_tokens<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">12_000</span>,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 7</span> n<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">1</span>,
<span class="ansi-green-intense-fg ansi-bold"> 8</span> )
<span class="ansi-green-intense-fg ansi-bold"> 10</span> context_builder <span style="color: rgb(98,98,98)">=</span> DRIFTSearchContextBuilder(
<span class="ansi-green-fg">---&gt; 10</span> context_builder <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">DRIFTSearchContextBuilder</span>(
<span class="ansi-green-intense-fg ansi-bold"> 11</span> chat_llm<span style="color: rgb(98,98,98)">=</span>chat_llm,
<span class="ansi-green-intense-fg ansi-bold"> 12</span> text_embedder<span style="color: rgb(98,98,98)">=</span>text_embedder,
<span class="ansi-green-fg">---&gt; 13</span> entities<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">entities</span>,
<span class="ansi-green-intense-fg ansi-bold"> 13</span> entities<span style="color: rgb(98,98,98)">=</span>entities,
<span class="ansi-green-intense-fg ansi-bold"> 14</span> relationships<span style="color: rgb(98,98,98)">=</span>relationships,
<span class="ansi-green-intense-fg ansi-bold"> 15</span> reports<span style="color: rgb(98,98,98)">=</span>reports,
<span class="ansi-green-intense-fg ansi-bold"> 16</span> entity_text_embeddings<span style="color: rgb(98,98,98)">=</span>description_embedding_store,
@ -2444,7 +2356,7 @@ Cell <span class="ansi-green-fg">In[5], line 13</span>
<span class="ansi-green-intense-fg ansi-bold"> 23</span> llm<span style="color: rgb(98,98,98)">=</span>chat_llm, context_builder<span style="color: rgb(98,98,98)">=</span>context_builder, token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder
<span class="ansi-green-intense-fg ansi-bold"> 24</span> )
<span class="ansi-red-fg">NameError</span>: name 'entities' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'DRIFTSearchContextBuilder' is not defined</pre>
</div>
</div>
</div>

View File

@ -2037,8 +2037,8 @@ span.linenos.special { color: #000000; background-color: #ffffc0; padding-left:
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell-inputWrapper" tabindex="0">
<div class="jp-Collapser jp-InputCollapser jp-Cell-inputCollapser">
</div>
@ -2093,6 +2093,34 @@ from graphrag.query.structured_search.global_search.search import GlobalSearch</
</div>
</div>
</div>
<div class="jp-Cell-outputWrapper">
<div class="jp-Collapser jp-OutputCollapser jp-Cell-outputCollapser">
</div>
<div class="jp-OutputArea jp-Cell-outputArea">
<div class="jp-OutputArea-child">
<div class="jp-OutputPrompt jp-OutputArea-prompt"></div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">ModuleNotFoundError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[2], line 11</span>
<span class="ansi-green-intense-fg ansi-bold"> 4</span> <span class="ansi-bold" style="color: rgb(0,135,0)">import</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">tiktoken</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">indexer_adapters</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> (
<span class="ansi-green-intense-fg ansi-bold"> 7</span> read_indexer_communities,
<span class="ansi-green-intense-fg ansi-bold"> 8</span> read_indexer_entities,
<span class="ansi-green-intense-fg ansi-bold"> 9</span> read_indexer_reports,
<span class="ansi-green-intense-fg ansi-bold"> 10</span> )
<span class="ansi-green-fg">---&gt; 11</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">chat_openai</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> ChatOpenAI
<span class="ansi-green-intense-fg ansi-bold"> 12</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">typing</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> OpenaiApiType
<span class="ansi-green-intense-fg ansi-bold"> 13</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">structured_search</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">global_search</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">community_context</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> (
<span class="ansi-green-intense-fg ansi-bold"> 14</span> GlobalCommunityContext,
<span class="ansi-green-intense-fg ansi-bold"> 15</span> )
<span class="ansi-red-fg">ModuleNotFoundError</span>: No module named 'graphrag.query.llm.oai'</pre>
</div>
</div>
</div>
</div>
</div>
</div>
<div class="jp-Cell jp-MarkdownCell jp-Notebook-cell">
@ -2116,8 +2144,8 @@ from graphrag.query.structured_search.global_search.search import GlobalSearch</
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell-inputWrapper" tabindex="0">
<div class="jp-Collapser jp-InputCollapser jp-Cell-inputCollapser">
</div>
@ -2162,6 +2190,32 @@ token_encoder = tiktoken.encoding_for_model(llm_model)</div>
</div>
</div>
</div>
<div class="jp-Cell-outputWrapper">
<div class="jp-Collapser jp-OutputCollapser jp-Cell-outputCollapser">
</div>
<div class="jp-OutputArea jp-Cell-outputArea">
<div class="jp-OutputArea-child">
<div class="jp-OutputPrompt jp-OutputArea-prompt"></div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[3], line 4</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> api_key <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_API_KEY</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm_model <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_LLM_MODEL</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-fg">----&gt; 4</span> llm <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">ChatOpenAI</span>(
<span class="ansi-green-intense-fg ansi-bold"> 5</span> api_key<span style="color: rgb(98,98,98)">=</span>api_key,
<span class="ansi-green-intense-fg ansi-bold"> 6</span> model<span style="color: rgb(98,98,98)">=</span>llm_model,
<span class="ansi-green-intense-fg ansi-bold"> 7</span> api_type<span style="color: rgb(98,98,98)">=</span>OpenaiApiType<span style="color: rgb(98,98,98)">.</span>OpenAI, <span style="color: rgb(95,135,135)"># OpenaiApiType.OpenAI or OpenaiApiType.AzureOpenAI</span>
<span class="ansi-green-intense-fg ansi-bold"> 8</span> max_retries<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">20</span>,
<span class="ansi-green-intense-fg ansi-bold"> 9</span> )
<span class="ansi-green-intense-fg ansi-bold"> 11</span> token_encoder <span style="color: rgb(98,98,98)">=</span> tiktoken<span style="color: rgb(98,98,98)">.</span>encoding_for_model(llm_model)
<span class="ansi-red-fg">NameError</span>: name 'ChatOpenAI' is not defined</pre>
</div>
</div>
</div>
</div>
</div>
</div>
<div class="jp-Cell jp-MarkdownCell jp-Notebook-cell">
@ -2409,15 +2463,15 @@ File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[6], line 2</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> context_builder <span style="color: rgb(98,98,98)">=</span> GlobalCommunityContext(
<span class="ansi-green-fg">----&gt; 2</span> community_reports<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">reports</span>,
Cell <span class="ansi-green-fg">In[6], line 1</span>
<span class="ansi-green-fg">----&gt; 1</span> context_builder <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">GlobalCommunityContext</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> community_reports<span style="color: rgb(98,98,98)">=</span>reports,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> communities<span style="color: rgb(98,98,98)">=</span>communities,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> entities<span style="color: rgb(98,98,98)">=</span>entities, <span style="color: rgb(95,135,135)"># default to None if you don't want to use community weights for ranking</span>
<span class="ansi-green-intense-fg ansi-bold"> 5</span> token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder,
<span class="ansi-green-intense-fg ansi-bold"> 6</span> )
<span class="ansi-red-fg">NameError</span>: name 'reports' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'GlobalCommunityContext' is not defined</pre>
</div>
</div>
</div>
@ -2565,10 +2619,10 @@ reduce_llm_params = {
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[8], line 3</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> search_engine <span style="color: rgb(98,98,98)">=</span> GlobalSearch(
Cell <span class="ansi-green-fg">In[8], line 1</span>
<span class="ansi-green-fg">----&gt; 1</span> search_engine <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">GlobalSearch</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm<span style="color: rgb(98,98,98)">=</span>llm,
<span class="ansi-green-fg">----&gt; 3</span> context_builder<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">context_builder</span>,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> context_builder<span style="color: rgb(98,98,98)">=</span>context_builder,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder,
<span class="ansi-green-intense-fg ansi-bold"> 5</span> max_data_tokens<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">12_000</span>, <span style="color: rgb(95,135,135)"># change this based on the token limit you have on your model (if you are using a model with 8k limit, a good setting could be 5000)</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> map_llm_params<span style="color: rgb(98,98,98)">=</span>map_llm_params,
@ -2580,7 +2634,7 @@ Cell <span class="ansi-green-fg">In[8], line 3</span>
<span class="ansi-green-intense-fg ansi-bold"> 12</span> response_type<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">multiple paragraphs</span><span style="color: rgb(175,0,0)">"</span>, <span style="color: rgb(95,135,135)"># free form text describing the response type and format, can be anything, e.g. prioritized list, single paragraph, multiple paragraphs, multiple-page report</span>
<span class="ansi-green-intense-fg ansi-bold"> 13</span> )
<span class="ansi-red-fg">NameError</span>: name 'context_builder' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'GlobalSearch' is not defined</pre>
</div>
</div>
</div>

View File

@ -1930,8 +1930,8 @@ span.linenos.special { color: #000000; background-color: #ffffc0; padding-left:
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell-inputWrapper" tabindex="0">
<div class="jp-Collapser jp-InputCollapser jp-Cell-inputCollapser">
</div>
@ -1986,6 +1986,34 @@ from graphrag.query.structured_search.global_search.search import GlobalSearch</
</div>
</div>
</div>
<div class="jp-Cell-outputWrapper">
<div class="jp-Collapser jp-OutputCollapser jp-Cell-outputCollapser">
</div>
<div class="jp-OutputArea jp-Cell-outputArea">
<div class="jp-OutputArea-child">
<div class="jp-OutputPrompt jp-OutputArea-prompt"></div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">ModuleNotFoundError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[2], line 11</span>
<span class="ansi-green-intense-fg ansi-bold"> 4</span> <span class="ansi-bold" style="color: rgb(0,135,0)">import</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">tiktoken</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">indexer_adapters</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> (
<span class="ansi-green-intense-fg ansi-bold"> 7</span> read_indexer_communities,
<span class="ansi-green-intense-fg ansi-bold"> 8</span> read_indexer_entities,
<span class="ansi-green-intense-fg ansi-bold"> 9</span> read_indexer_reports,
<span class="ansi-green-intense-fg ansi-bold"> 10</span> )
<span class="ansi-green-fg">---&gt; 11</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">chat_openai</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> ChatOpenAI
<span class="ansi-green-intense-fg ansi-bold"> 12</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">typing</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> OpenaiApiType
<span class="ansi-green-intense-fg ansi-bold"> 13</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">structured_search</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">global_search</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">community_context</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> (
<span class="ansi-green-intense-fg ansi-bold"> 14</span> GlobalCommunityContext,
<span class="ansi-green-intense-fg ansi-bold"> 15</span> )
<span class="ansi-red-fg">ModuleNotFoundError</span>: No module named 'graphrag.query.llm.oai'</pre>
</div>
</div>
</div>
</div>
</div>
</div>
<div class="jp-Cell jp-MarkdownCell jp-Notebook-cell">
@ -2009,8 +2037,8 @@ from graphrag.query.structured_search.global_search.search import GlobalSearch</
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell-inputWrapper" tabindex="0">
<div class="jp-Collapser jp-InputCollapser jp-Cell-inputCollapser">
</div>
@ -2055,6 +2083,32 @@ token_encoder = tiktoken.encoding_for_model(llm_model)</div>
</div>
</div>
</div>
<div class="jp-Cell-outputWrapper">
<div class="jp-Collapser jp-OutputCollapser jp-Cell-outputCollapser">
</div>
<div class="jp-OutputArea jp-Cell-outputArea">
<div class="jp-OutputArea-child">
<div class="jp-OutputPrompt jp-OutputArea-prompt"></div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[3], line 4</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> api_key <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_API_KEY</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm_model <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_LLM_MODEL</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-fg">----&gt; 4</span> llm <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">ChatOpenAI</span>(
<span class="ansi-green-intense-fg ansi-bold"> 5</span> api_key<span style="color: rgb(98,98,98)">=</span>api_key,
<span class="ansi-green-intense-fg ansi-bold"> 6</span> model<span style="color: rgb(98,98,98)">=</span>llm_model,
<span class="ansi-green-intense-fg ansi-bold"> 7</span> api_type<span style="color: rgb(98,98,98)">=</span>OpenaiApiType<span style="color: rgb(98,98,98)">.</span>OpenAI, <span style="color: rgb(95,135,135)"># OpenaiApiType.OpenAI or OpenaiApiType.AzureOpenAI</span>
<span class="ansi-green-intense-fg ansi-bold"> 8</span> max_retries<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">20</span>,
<span class="ansi-green-intense-fg ansi-bold"> 9</span> )
<span class="ansi-green-intense-fg ansi-bold"> 11</span> token_encoder <span style="color: rgb(98,98,98)">=</span> tiktoken<span style="color: rgb(98,98,98)">.</span>encoding_for_model(llm_model)
<span class="ansi-red-fg">NameError</span>: name 'ChatOpenAI' is not defined</pre>
</div>
</div>
</div>
</div>
</div>
</div>
<div class="jp-Cell jp-MarkdownCell jp-Notebook-cell">
@ -2344,8 +2398,8 @@ context_builder = GlobalCommunityContext(
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[6], line 10</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> mini_llm <span style="color: rgb(98,98,98)">=</span> ChatOpenAI(
Cell <span class="ansi-green-fg">In[6], line 1</span>
<span class="ansi-green-fg">----&gt; 1</span> mini_llm <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">ChatOpenAI</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> api_key<span style="color: rgb(98,98,98)">=</span>api_key,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> model<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">gpt-4o-mini</span><span style="color: rgb(175,0,0)">"</span>,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> api_type<span style="color: rgb(98,98,98)">=</span>OpenaiApiType<span style="color: rgb(98,98,98)">.</span>OpenAI, <span style="color: rgb(95,135,135)"># OpenaiApiType.OpenAI or OpenaiApiType.AzureOpenAI</span>
@ -2353,18 +2407,13 @@ Cell <span class="ansi-green-fg">In[6], line 10</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> )
<span class="ansi-green-intense-fg ansi-bold"> 7</span> mini_token_encoder <span style="color: rgb(98,98,98)">=</span> tiktoken<span style="color: rgb(98,98,98)">.</span>encoding_for_model(mini_llm<span style="color: rgb(98,98,98)">.</span>model)
<span class="ansi-green-intense-fg ansi-bold"> 9</span> context_builder <span style="color: rgb(98,98,98)">=</span> GlobalCommunityContext(
<span class="ansi-green-fg">---&gt; 10</span> community_reports<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">reports</span>,
<span class="ansi-green-intense-fg ansi-bold"> 10</span> community_reports<span style="color: rgb(98,98,98)">=</span>reports,
<span class="ansi-green-intense-fg ansi-bold"> 11</span> communities<span style="color: rgb(98,98,98)">=</span>communities,
<span class="ansi-green-intense-fg ansi-bold"> 12</span> entities<span style="color: rgb(98,98,98)">=</span>entities, <span style="color: rgb(95,135,135)"># default to None if you don't want to use community weights for ranking</span>
<span class="ansi-green-intense-fg ansi-bold"> 13</span> token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder,
<span class="ansi-green-intense-fg ansi-bold"> 14</span> dynamic_community_selection<span style="color: rgb(98,98,98)">=</span><span class="ansi-bold" style="color: rgb(0,135,0)">True</span>,
<span class="ansi-green-intense-fg ansi-bold"> 15</span> dynamic_community_selection_kwargs<span style="color: rgb(98,98,98)">=</span>{
<span class="ansi-green-intense-fg ansi-bold"> 16</span> <span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">llm</span><span style="color: rgb(175,0,0)">"</span>: mini_llm,
<span class="ansi-green-intense-fg ansi-bold"> 17</span> <span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">token_encoder</span><span style="color: rgb(175,0,0)">"</span>: mini_token_encoder,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 18</span> },
<span class="ansi-green-intense-fg ansi-bold"> 19</span> )
<span class="ansi-red-fg">NameError</span>: name 'reports' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'ChatOpenAI' is not defined</pre>
</div>
</div>
</div>
@ -2512,10 +2561,10 @@ reduce_llm_params = {
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[8], line 3</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> search_engine <span style="color: rgb(98,98,98)">=</span> GlobalSearch(
Cell <span class="ansi-green-fg">In[8], line 1</span>
<span class="ansi-green-fg">----&gt; 1</span> search_engine <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">GlobalSearch</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm<span style="color: rgb(98,98,98)">=</span>llm,
<span class="ansi-green-fg">----&gt; 3</span> context_builder<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">context_builder</span>,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> context_builder<span style="color: rgb(98,98,98)">=</span>context_builder,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder,
<span class="ansi-green-intense-fg ansi-bold"> 5</span> max_data_tokens<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">12_000</span>, <span style="color: rgb(95,135,135)"># change this based on the token limit you have on your model (if you are using a model with 8k limit, a good setting could be 5000)</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> map_llm_params<span style="color: rgb(98,98,98)">=</span>map_llm_params,
@ -2527,7 +2576,7 @@ Cell <span class="ansi-green-fg">In[8], line 3</span>
<span class="ansi-green-intense-fg ansi-bold"> 12</span> response_type<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">multiple paragraphs</span><span style="color: rgb(175,0,0)">"</span>, <span style="color: rgb(95,135,135)"># free form text describing the response type and format, can be anything, e.g. prioritized list, single paragraph, multiple paragraphs, multiple-page report</span>
<span class="ansi-green-intense-fg ansi-bold"> 13</span> )
<span class="ansi-red-fg">NameError</span>: name 'context_builder' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'GlobalSearch' is not defined</pre>
</div>
</div>
</div>

View File

@ -2175,8 +2175,8 @@ span.linenos.special { color: #000000; background-color: #ffffc0; padding-left:
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell-inputWrapper" tabindex="0">
<div class="jp-Collapser jp-InputCollapser jp-Cell-inputCollapser">
</div>
@ -2243,6 +2243,33 @@ from graphrag.vector_stores.lancedb import LanceDBVectorStore</div>
</div>
</div>
</div>
<div class="jp-Cell-outputWrapper">
<div class="jp-Collapser jp-OutputCollapser jp-Cell-outputCollapser">
</div>
<div class="jp-OutputArea jp-Cell-outputArea">
<div class="jp-OutputArea-child">
<div class="jp-OutputPrompt jp-OutputArea-prompt"></div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">ModuleNotFoundError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[2], line 14</span>
<span class="ansi-green-intense-fg ansi-bold"> 6</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">context_builder</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">entity_extraction</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> EntityVectorStoreKey
<span class="ansi-green-intense-fg ansi-bold"> 7</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">indexer_adapters</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> (
<span class="ansi-green-intense-fg ansi-bold"> 8</span> read_indexer_covariates,
<span class="ansi-green-intense-fg ansi-bold"> 9</span> read_indexer_entities,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 12</span> read_indexer_text_units,
<span class="ansi-green-intense-fg ansi-bold"> 13</span> )
<span class="ansi-green-fg">---&gt; 14</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">chat_openai</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> ChatOpenAI
<span class="ansi-green-intense-fg ansi-bold"> 15</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">embedding</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> OpenAIEmbedding
<span class="ansi-green-intense-fg ansi-bold"> 16</span> <span class="ansi-bold" style="color: rgb(0,135,0)">from</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,0,255)">graphrag</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">query</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">llm</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">oai</span><span class="ansi-bold" style="color: rgb(0,0,255)">.</span><span class="ansi-bold" style="color: rgb(0,0,255)">typing</span><span style="color: rgb(188,188,188)"> </span><span class="ansi-bold" style="color: rgb(0,135,0)">import</span> OpenaiApiType
<span class="ansi-red-fg">ModuleNotFoundError</span>: No module named 'graphrag.query.llm.oai'</pre>
</div>
</div>
</div>
</div>
</div>
</div>
<div class="jp-Cell jp-MarkdownCell jp-Notebook-cell">
@ -2962,8 +2989,8 @@ File <span class="ansi-green-fg">~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7
</div>
</div>
</div>
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell jp-mod-noOutputs">
</div><div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell jp-CodeCell jp-Notebook-cell">
<div class="jp-Cell-inputWrapper" tabindex="0">
<div class="jp-Collapser jp-InputCollapser jp-Cell-inputCollapser">
</div>
@ -3028,6 +3055,38 @@ text_embedder = OpenAIEmbedding(
</div>
</div>
</div>
<div class="jp-Cell-outputWrapper">
<div class="jp-Collapser jp-OutputCollapser jp-Cell-outputCollapser">
</div>
<div class="jp-OutputArea jp-Cell-outputArea">
<div class="jp-OutputArea-child">
<div class="jp-OutputPrompt jp-OutputArea-prompt"></div>
<div class="jp-RenderedText jp-OutputArea-output" data-mime-type="application/vnd.jupyter.stderr" tabindex="0">
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[9], line 5</span>
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm_model <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_LLM_MODEL</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-intense-fg ansi-bold"> 3</span> embedding_model <span style="color: rgb(98,98,98)">=</span> os<span style="color: rgb(98,98,98)">.</span>environ[<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">GRAPHRAG_EMBEDDING_MODEL</span><span style="color: rgb(175,0,0)">"</span>]
<span class="ansi-green-fg">----&gt; 5</span> llm <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">ChatOpenAI</span>(
<span class="ansi-green-intense-fg ansi-bold"> 6</span> api_key<span style="color: rgb(98,98,98)">=</span>api_key,
<span class="ansi-green-intense-fg ansi-bold"> 7</span> model<span style="color: rgb(98,98,98)">=</span>llm_model,
<span class="ansi-green-intense-fg ansi-bold"> 8</span> api_type<span style="color: rgb(98,98,98)">=</span>OpenaiApiType<span style="color: rgb(98,98,98)">.</span>OpenAI, <span style="color: rgb(95,135,135)"># OpenaiApiType.OpenAI or OpenaiApiType.AzureOpenAI</span>
<span class="ansi-green-intense-fg ansi-bold"> 9</span> max_retries<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">20</span>,
<span class="ansi-green-intense-fg ansi-bold"> 10</span> )
<span class="ansi-green-intense-fg ansi-bold"> 12</span> token_encoder <span style="color: rgb(98,98,98)">=</span> tiktoken<span style="color: rgb(98,98,98)">.</span>get_encoding(<span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">cl100k_base</span><span style="color: rgb(175,0,0)">"</span>)
<span class="ansi-green-intense-fg ansi-bold"> 14</span> text_embedder <span style="color: rgb(98,98,98)">=</span> OpenAIEmbedding(
<span class="ansi-green-intense-fg ansi-bold"> 15</span> api_key<span style="color: rgb(98,98,98)">=</span>api_key,
<span class="ansi-green-intense-fg ansi-bold"> 16</span> api_base<span style="color: rgb(98,98,98)">=</span><span class="ansi-bold" style="color: rgb(0,135,0)">None</span>,
<span class="ansi-green-fg"> (...)</span>
<span class="ansi-green-intense-fg ansi-bold"> 20</span> max_retries<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(98,98,98)">20</span>,
<span class="ansi-green-intense-fg ansi-bold"> 21</span> )
<span class="ansi-red-fg">NameError</span>: name 'ChatOpenAI' is not defined</pre>
</div>
</div>
</div>
</div>
</div>
</div>
<div class="jp-Cell jp-MarkdownCell jp-Notebook-cell">
@ -3098,9 +3157,9 @@ text_embedder = OpenAIEmbedding(
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[10], line 2</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> context_builder <span style="color: rgb(98,98,98)">=</span> LocalSearchMixedContext(
<span class="ansi-green-fg">----&gt; 2</span> community_reports<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">reports</span>,
Cell <span class="ansi-green-fg">In[10], line 1</span>
<span class="ansi-green-fg">----&gt; 1</span> context_builder <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">LocalSearchMixedContext</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> community_reports<span style="color: rgb(98,98,98)">=</span>reports,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> text_units<span style="color: rgb(98,98,98)">=</span>text_units,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> entities<span style="color: rgb(98,98,98)">=</span>entities,
<span class="ansi-green-intense-fg ansi-bold"> 5</span> relationships<span style="color: rgb(98,98,98)">=</span>relationships,
@ -3112,7 +3171,7 @@ Cell <span class="ansi-green-fg">In[10], line 2</span>
<span class="ansi-green-intense-fg ansi-bold"> 11</span> token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder,
<span class="ansi-green-intense-fg ansi-bold"> 12</span> )
<span class="ansi-red-fg">NameError</span>: name 'reports' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'LocalSearchMixedContext' is not defined</pre>
</div>
</div>
</div>
@ -3274,17 +3333,17 @@ llm_params = {
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[12], line 3</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> search_engine <span style="color: rgb(98,98,98)">=</span> LocalSearch(
Cell <span class="ansi-green-fg">In[12], line 1</span>
<span class="ansi-green-fg">----&gt; 1</span> search_engine <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">LocalSearch</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm<span style="color: rgb(98,98,98)">=</span>llm,
<span class="ansi-green-fg">----&gt; 3</span> context_builder<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">context_builder</span>,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> context_builder<span style="color: rgb(98,98,98)">=</span>context_builder,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder,
<span class="ansi-green-intense-fg ansi-bold"> 5</span> llm_params<span style="color: rgb(98,98,98)">=</span>llm_params,
<span class="ansi-green-intense-fg ansi-bold"> 6</span> context_builder_params<span style="color: rgb(98,98,98)">=</span>local_context_params,
<span class="ansi-green-intense-fg ansi-bold"> 7</span> response_type<span style="color: rgb(98,98,98)">=</span><span style="color: rgb(175,0,0)">"</span><span style="color: rgb(175,0,0)">multiple paragraphs</span><span style="color: rgb(175,0,0)">"</span>, <span style="color: rgb(95,135,135)"># free form text describing the response type and format, can be anything, e.g. prioritized list, single paragraph, multiple paragraphs, multiple-page report</span>
<span class="ansi-green-intense-fg ansi-bold"> 8</span> )
<span class="ansi-red-fg">NameError</span>: name 'context_builder' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'LocalSearch' is not defined</pre>
</div>
</div>
</div>
@ -3712,16 +3771,16 @@ Cell <span class="ansi-green-fg">In[19], line 1</span>
<pre>
<span class="ansi-red-fg">---------------------------------------------------------------------------</span>
<span class="ansi-red-fg">NameError</span> Traceback (most recent call last)
Cell <span class="ansi-green-fg">In[20], line 3</span>
<span class="ansi-green-intense-fg ansi-bold"> 1</span> question_generator <span style="color: rgb(98,98,98)">=</span> LocalQuestionGen(
Cell <span class="ansi-green-fg">In[20], line 1</span>
<span class="ansi-green-fg">----&gt; 1</span> question_generator <span style="color: rgb(98,98,98)">=</span> <span class="ansi-yellow-bg">LocalQuestionGen</span>(
<span class="ansi-green-intense-fg ansi-bold"> 2</span> llm<span style="color: rgb(98,98,98)">=</span>llm,
<span class="ansi-green-fg">----&gt; 3</span> context_builder<span style="color: rgb(98,98,98)">=</span><span class="ansi-yellow-bg">context_builder</span>,
<span class="ansi-green-intense-fg ansi-bold"> 3</span> context_builder<span style="color: rgb(98,98,98)">=</span>context_builder,
<span class="ansi-green-intense-fg ansi-bold"> 4</span> token_encoder<span style="color: rgb(98,98,98)">=</span>token_encoder,
<span class="ansi-green-intense-fg ansi-bold"> 5</span> llm_params<span style="color: rgb(98,98,98)">=</span>llm_params,
<span class="ansi-green-intense-fg ansi-bold"> 6</span> context_builder_params<span style="color: rgb(98,98,98)">=</span>local_context_params,
<span class="ansi-green-intense-fg ansi-bold"> 7</span> )
<span class="ansi-red-fg">NameError</span>: name 'context_builder' is not defined</pre>
<span class="ansi-red-fg">NameError</span>: name 'LocalQuestionGen' is not defined</pre>
</div>
</div>
</div>

Binary file not shown.