diff --git a/config/yaml/index.html b/config/yaml/index.html
index c11bd831..19e1e00c 100644
--- a/config/yaml/index.html
+++ b/config/yaml/index.html
@@ -1590,8 +1590,6 @@

encoding_model

diff --git a/examples_notebooks/drift_search/index.html b/examples_notebooks/drift_search/index.html
index 70d1ad36..0bb2efcd 100644
--- a/examples_notebooks/drift_search/index.html
+++ b/examples_notebooks/drift_search/index.html
@@ -2015,7 +2015,7 @@ Text unit records: 50
-[2024-12-04T22:53:08Z WARN  lance::dataset] No existing dataset at /home/runner/work/graphrag/graphrag/docs/examples_notebooks/inputs/operation dulce/lancedb/default-entity-description.lance, it will be created
+[2024-12-05T17:58:22Z WARN  lance::dataset] No existing dataset at /home/runner/work/graphrag/graphrag/docs/examples_notebooks/inputs/operation dulce/lancedb/default-entity-description.lance, it will be created
 
@@ -2287,15 +2287,130 @@ reports = read_indexer_reports(
-Embeddings saved to inputs/operation dulce/create_final_community_reports_with_embeddings.parquet
+Error embedding chunk {'OpenAIEmbedding': "Error code: 429 - {'error': {'message': 'You exceeded your current quota, please check your plan and billing details. For more information on this error, read the docs: https://platform.openai.com/docs/guides/error-codes/api-errors.', 'type': 'insufficient_quota', 'param': None, 'code': 'insufficient_quota'}}"}
 
+
+
+
+
+---------------------------------------------------------------------------
+ZeroDivisionError                         Traceback (most recent call last)
+Cell In[4], line 31
+     27     print(f"Embeddings file already exists at {output_path}")
+     28     return pd.read_parquet(output_path)
+---> 31 report_df = embed_community_reports(INPUT_DIR, text_embedder)
+     32 reports = read_indexer_reports(
+     33     report_df,
+     34     entity_df,
+     35     COMMUNITY_LEVEL,
+     36     content_embedding_col="full_content_embeddings",
+     37 )
+
+Cell In[4], line 19, in embed_community_reports(input_dir, embedder, community_report_table)
+     16     error_msg = f"'full_content' column not found in {input_path}"
+     17     raise ValueError(error_msg)
+---> 19 report_df["full_content_embeddings"] = report_df.loc[:, "full_content"].apply(
+     20     lambda x: embedder.embed(x)
+     21 )
+     23 # Save the DataFrame with embeddings to the output path
+     24 report_df.to_parquet(output_path)
+
+File ~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/core/series.py:4924, in Series.apply(self, func, convert_dtype, args, by_row, **kwargs)
+   4789 def apply(
+   4790     self,
+   4791     func: AggFuncType,
+   (...)
+   4796     **kwargs,
+   4797 ) -> DataFrame | Series:
+   4798     """
+   4799     Invoke function on values of Series.
+   4800 
+   (...)
+   4915     dtype: float64
+   4916     """
+   4917     return SeriesApply(
+   4918         self,
+   4919         func,
+   4920         convert_dtype=convert_dtype,
+   4921         by_row=by_row,
+   4922         args=args,
+   4923         kwargs=kwargs,
+-> 4924     ).apply()
+
+File ~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/core/apply.py:1427, in SeriesApply.apply(self)
+   1424     return self.apply_compat()
+   1426 # self.func is Callable
+-> 1427 return self.apply_standard()
+
+File ~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/core/apply.py:1507, in SeriesApply.apply_standard(self)
+   1501 # row-wise access
+   1502 # apply doesn't have a `na_action` keyword and for backward compat reasons
+   1503 # we need to give `na_action="ignore"` for categorical data.
+   1504 # TODO: remove the `na_action="ignore"` when that default has been changed in
+   1505 #  Categorical (GH51645).
+   1506 action = "ignore" if isinstance(obj.dtype, CategoricalDtype) else None
+-> 1507 mapped = obj._map_values(
+   1508     mapper=curried, na_action=action, convert=self.convert_dtype
+   1509 )
+   1511 if len(mapped) and isinstance(mapped[0], ABCSeries):
+   1512     # GH#43986 Need to do list(mapped) in order to get treated as nested
+   1513     #  See also GH#25959 regarding EA support
+   1514     return obj._constructor_expanddim(list(mapped), index=obj.index)
+
+File ~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/core/base.py:921, in IndexOpsMixin._map_values(self, mapper, na_action, convert)
+    918 if isinstance(arr, ExtensionArray):
+    919     return arr.map(mapper, na_action=na_action)
+--> 921 return algorithms.map_array(arr, mapper, na_action=na_action, convert=convert)
+
+File ~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/pandas/core/algorithms.py:1743, in map_array(arr, mapper, na_action, convert)
+   1741 values = arr.astype(object, copy=False)
+   1742 if na_action is None:
+-> 1743     return lib.map_infer(values, mapper, convert=convert)
+   1744 else:
+   1745     return lib.map_infer_mask(
+   1746         values, mapper, mask=isna(values).view(np.uint8), convert=convert
+   1747     )
+
+File lib.pyx:2972, in pandas._libs.lib.map_infer()
+
+Cell In[4], line 20, in embed_community_reports.<locals>.<lambda>(x)
+     16     error_msg = f"'full_content' column not found in {input_path}"
+     17     raise ValueError(error_msg)
+     19 report_df["full_content_embeddings"] = report_df.loc[:, "full_content"].apply(
+---> 20     lambda x: embedder.embed(x)
+     21 )
+     23 # Save the DataFrame with embeddings to the output path
+     24 report_df.to_parquet(output_path)
+
+File ~/work/graphrag/graphrag/graphrag/query/llm/oai/embedding.py:96, in OpenAIEmbedding.embed(self, text, **kwargs)
+     90         self._reporter.error(
+     91             message="Error embedding chunk",
+     92             details={self.__class__.__name__: str(e)},
+     93         )
+     95         continue
+---> 96 chunk_embeddings = np.average(chunk_embeddings, axis=0, weights=chunk_lens)
+     97 chunk_embeddings = chunk_embeddings / np.linalg.norm(chunk_embeddings)
+     98 return chunk_embeddings.tolist()
+
+File ~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/numpy/lib/function_base.py:550, in average(a, axis, weights, returned, keepdims)
+    548     scl = wgt.sum(axis=axis, dtype=result_dtype, **keepdims_kw)
+    549     if np.any(scl == 0.0):
+--> 550         raise ZeroDivisionError(
+    551             "Weights sum to zero, can't be normalized")
+    553     avg = avg_as_array = np.multiply(a, wgt,
+    554                       dtype=result_dtype).sum(axis, **keepdims_kw) / scl
+    556 if returned:
+
+ZeroDivisionError: Weights sum to zero, can't be normalized
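The `ZeroDivisionError` above is a downstream symptom of the 429 `insufficient_quota` error, not an independent bug: `OpenAIEmbedding.embed` logs each failed chunk and continues, so when every chunk fails both `chunk_embeddings` and `chunk_lens` end up empty, and `np.average` raises because its weights sum to zero. A minimal sketch of a defensive guard, written as a standalone helper for illustration rather than the library's actual code:

```python
import numpy as np

def average_chunk_embeddings(chunk_embeddings: list[list[float]],
                             chunk_lens: list[int]) -> list[float] | None:
    """Length-weighted average of per-chunk embeddings, guarding the case
    where every chunk failed to embed (e.g. the quota error above)."""
    if not chunk_embeddings or sum(chunk_lens) == 0:
        # np.average(..., weights=chunk_lens) would raise
        # "Weights sum to zero, can't be normalized" here.
        return None
    avg = np.average(chunk_embeddings, axis=0, weights=chunk_lens)
    return (avg / np.linalg.norm(avg)).tolist()
```

Callers would then need to handle a `None` embedding instead of crashing deep inside `np.average`.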
-
-
+
+
+
+
+
+
+
+
+
+
+
@@ -2378,345 +2522,13 @@ search = DRIFTSearch(
@@ -2752,3316 +2564,16 @@ search = DRIFTSearch(
-
@@ -3409,26 +3495,113 @@ print(result.response)
-### Overview of Dr. Jordan Hayes
-
-Dr. Jordan Hayes is a prominent scientist at Dulce Base, playing a crucial role in the Paranormal Military Squad's efforts to understand and communicate with extraterrestrial entities. Dr. Hayes's work is primarily focused on decoding and analyzing alien signals and codes, which are essential for interstellar communication and potentially interspecies interaction. This involves decrypting algorithms, interpreting cosmic signals, and analyzing the implications of alien society [Data: Entities (2, 17, 47); Relationships (201, 322, 283)].
-
-### Key Contributions and Expertise
-
-Dr. Hayes is noted for their adaptability and skepticism, qualities that are essential given the uncertainties and unknown challenges of their mission. They are deeply involved in the scientific exploration aspects of Operation: Dulce, where their efforts are on the verge of a significant scientific breakthrough. Dr. Hayes leads efforts in isolating and understanding complex alien signals that resemble human cognition, suggesting that these signals are artificial and patterned, indicating a tandem evolution with humanity [Data: Entities (2, 17); Claims (60, 83, 91, 134)].
-
-### Collaborative Efforts and Leadership
-
-In addition to their scientific endeavors, Dr. Hayes is involved in setting up lab stations, operating the mainframe, and playing a crucial role in the command center at Dulce Base. They work closely with colleagues like Alex Mercer, engaging in thoughtful dialogue and showing analytical thinking about the mission's uncertainties. Dr. Hayes's attention to detail is also evident in their discovery of significant panels among secured doorways and their contemplation of the mission's broader ramifications [Data: Entities (2); Relationships (26, 270, 254)].
-
-### Challenges and Philosophical Reflections
-
-Dr. Hayes's work is not without its challenges. They have reflected on their own skepticism and its potential as a blind spot, indicating a moment of self-awareness and growth. This introspection is crucial as they navigate the complexities of alien communication and the profound implications of their findings on physics and the possibilities of their mission [Data: Claims (13, 2); Sources (4, 42)].
-
-In summary, Dr. Jordan Hayes is a vital asset to the Paranormal Military Squad, contributing significantly to the understanding of extraterrestrial communications and the potential for interstellar diplomacy. Their work at Dulce Base is characterized by a blend of scientific rigor, adaptability, and philosophical inquiry, making them a key figure in the ongoing exploration of the unknown.
+Error embedding chunk {'OpenAIEmbedding': "Error code: 429 - {'error': {'message': 'You exceeded your current quota, please check your plan and billing details. For more information on this error, read the docs: https://platform.openai.com/docs/guides/error-codes/api-errors.', 'type': 'insufficient_quota', 'param': None, 'code': 'insufficient_quota'}}"}
 
+
+
+
+
+---------------------------------------------------------------------------
+ZeroDivisionError                         Traceback (most recent call last)
+Cell In[14], line 2
+      1 question = "Tell me about Dr. Jordan Hayes"
+----> 2 result = await search_engine.asearch(question)
+      3 print(result.response)
+
+File ~/work/graphrag/graphrag/graphrag/query/structured_search/local_search/search.py:67, in LocalSearch.asearch(self, query, conversation_history, **kwargs)
+     65 search_prompt = ""
+     66 llm_calls, prompt_tokens, output_tokens = {}, {}, {}
+---> 67 context_result = self.context_builder.build_context(
+     68     query=query,
+     69     conversation_history=conversation_history,
+     70     **kwargs,
+     71     **self.context_builder_params,
+     72 )
+     73 llm_calls["build_context"] = context_result.llm_calls
+     74 prompt_tokens["build_context"] = context_result.prompt_tokens
+
+File ~/work/graphrag/graphrag/graphrag/query/structured_search/local_search/mixed_context.py:139, in LocalSearchMixedContext.build_context(self, query, conversation_history, include_entity_names, exclude_entity_names, conversation_history_max_turns, conversation_history_user_turns_only, max_tokens, text_unit_prop, community_prop, top_k_mapped_entities, top_k_relationships, include_community_rank, include_entity_rank, rank_description, include_relationship_weight, relationship_ranking_attribute, return_candidate_context, use_community_summary, min_community_rank, community_context_name, column_delimiter, **kwargs)
+    134     pre_user_questions = "\n".join(
+    135         conversation_history.get_user_turns(conversation_history_max_turns)
+    136     )
+    137     query = f"{query}\n{pre_user_questions}"
+--> 139 selected_entities = map_query_to_entities(
+    140     query=query,
+    141     text_embedding_vectorstore=self.entity_text_embeddings,
+    142     text_embedder=self.text_embedder,
+    143     all_entities_dict=self.entities,
+    144     embedding_vectorstore_key=self.embedding_vectorstore_key,
+    145     include_entity_names=include_entity_names,
+    146     exclude_entity_names=exclude_entity_names,
+    147     k=top_k_mapped_entities,
+    148     oversample_scaler=2,
+    149 )
+    151 # build context
+    152 final_context = list[str]()
+
+File ~/work/graphrag/graphrag/graphrag/query/context_builder/entity_extraction.py:58, in map_query_to_entities(query, text_embedding_vectorstore, text_embedder, all_entities_dict, embedding_vectorstore_key, include_entity_names, exclude_entity_names, k, oversample_scaler)
+     54 matched_entities = []
+     55 if query != "":
+     56     # get entities with highest semantic similarity to query
+     57     # oversample to account for excluded entities
+---> 58     search_results = text_embedding_vectorstore.similarity_search_by_text(
+     59         text=query,
+     60         text_embedder=lambda t: text_embedder.embed(t),
+     61         k=k * oversample_scaler,
+     62     )
+     63     for result in search_results:
+     64         if embedding_vectorstore_key == EntityVectorStoreKey.ID and isinstance(
+     65             result.document.id, str
+     66         ):
+
+File ~/work/graphrag/graphrag/graphrag/vector_stores/lancedb.py:134, in LanceDBVectorStore.similarity_search_by_text(self, text, text_embedder, k, **kwargs)
+    130 def similarity_search_by_text(
+    131     self, text: str, text_embedder: TextEmbedder, k: int = 10, **kwargs: Any
+    132 ) -> list[VectorStoreSearchResult]:
+    133     """Perform a similarity search using a given input text."""
+--> 134     query_embedding = text_embedder(text)
+    135     if query_embedding:
+    136         return self.similarity_search_by_vector(query_embedding, k)
+
+File ~/work/graphrag/graphrag/graphrag/query/context_builder/entity_extraction.py:60, in map_query_to_entities.<locals>.<lambda>(t)
+     54 matched_entities = []
+     55 if query != "":
+     56     # get entities with highest semantic similarity to query
+     57     # oversample to account for excluded entities
+     58     search_results = text_embedding_vectorstore.similarity_search_by_text(
+     59         text=query,
+---> 60         text_embedder=lambda t: text_embedder.embed(t),
+     61         k=k * oversample_scaler,
+     62     )
+     63     for result in search_results:
+     64         if embedding_vectorstore_key == EntityVectorStoreKey.ID and isinstance(
+     65             result.document.id, str
+     66         ):
+
+File ~/work/graphrag/graphrag/graphrag/query/llm/oai/embedding.py:96, in OpenAIEmbedding.embed(self, text, **kwargs)
+     90         self._reporter.error(
+     91             message="Error embedding chunk",
+     92             details={self.__class__.__name__: str(e)},
+     93         )
+     95         continue
+---> 96 chunk_embeddings = np.average(chunk_embeddings, axis=0, weights=chunk_lens)
+     97 chunk_embeddings = chunk_embeddings / np.linalg.norm(chunk_embeddings)
+     98 return chunk_embeddings.tolist()
+
+File ~/.cache/pypoetry/virtualenvs/graphrag-F2jvqev7-py3.11/lib/python3.11/site-packages/numpy/lib/function_base.py:550, in average(a, axis, weights, returned, keepdims)
+    548     scl = wgt.sum(axis=axis, dtype=result_dtype, **keepdims_kw)
+    549     if np.any(scl == 0.0):
+--> 550         raise ZeroDivisionError(
+    551             "Weights sum to zero, can't be normalized")
+    553     avg = avg_as_array = np.multiply(a, wgt,
+    554                       dtype=result_dtype).sum(axis, **keepdims_kw) / scl
+    556 if returned:
+
+ZeroDivisionError: Weights sum to zero, can't be normalized
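Both tracebacks share one root cause: every embedding request returned HTTP 429 with code `insufficient_quota`. Unlike transient rate limiting, an exhausted quota is a billing problem, so retrying cannot succeed; the fix is adding credit or switching keys or endpoints. A hedged sketch of how a caller might separate the two 429 cases — the wrapper, its retry policy, and the model name are illustrative assumptions, not part of graphrag:

```python
import time

import openai

def embed_with_backoff(client: openai.OpenAI, text: str,
                       model: str = "text-embedding-3-small",
                       max_retries: int = 5) -> list[float]:
    """Retry transient 429 rate limits with exponential backoff,
    but fail fast when the account quota is exhausted."""
    for attempt in range(max_retries):
        try:
            return client.embeddings.create(input=text, model=model).data[0].embedding
        except openai.RateLimitError as e:
            if "insufficient_quota" in str(e):
                raise  # out of credit: retrying cannot help
            time.sleep(2 ** attempt)  # transient rate limit: back off and retry
    raise RuntimeError(f"embedding failed after {max_retries} retries")
```

Failing fast on `insufficient_quota` keeps the error visible at the call site instead of surfacing later as the misleading `ZeroDivisionError` seen above.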
+
+
@@ -3473,78 +3646,16 @@ In summary, Dr. Jordan Hayes is a vital asset to the Paranormal Military Squad,
-
-
-
@@ -3580,97 +3691,23 @@ In summary, Dr. Jordan Hayes is a vital asset to the Paranormal Military Squad,
-
-
-
-
-
-
+
+
+
+
+
+
@@ -3728,60 +3784,16 @@ In summary, Dr. Jordan Hayes is a vital asset to the Paranormal Military Squad,
@@ -3821,21 +3833,15 @@ In summary, Dr. Jordan Hayes is a vital asset to the Paranormal Military Squad,
@@ -3949,10 +3955,122 @@ print(candidate_questions.response)
+
+
+
+
diff --git a/search/search_index.json b/search/search_index.json
index ca6ec13e..e9b33690 100644
--- a/search/search_index.json
+++ b/search/search_index.json
@@ -1 +1 @@
-{"config": {"lang": ["en"], "separator": "[\\s\\-]+", "pipeline": ["stopWordFilter"]}, "docs": [{"location": "", "title": "Welcome to GraphRAG", "text": "

👉 Microsoft Research Blog Post 👉 GraphRAG Accelerator 👉 GraphRAG Arxiv

Figure 1: An LLM-generated knowledge graph built using GPT-4 Turbo.

GraphRAG is a structured, hierarchical approach to Retrieval Augmented Generation (RAG), as opposed to naive semantic-search approaches using plain text snippets. The GraphRAG process involves extracting a knowledge graph out of raw text, building a community hierarchy, generating summaries for these communities, and then leveraging these structures when performing RAG-based tasks.

To learn more about GraphRAG and how it can be used to enhance your LLM's ability to reason about your private data, please visit the Microsoft Research Blog Post.

"}, {"location": "#solution-accelerator", "title": "Solution Accelerator \ud83d\ude80", "text": "

For a quick start with the GraphRAG system, we recommend trying the Solution Accelerator package. It provides a user-friendly end-to-end experience with Azure resources.

"}, {"location": "#get-started-with-graphrag", "title": "Get Started with GraphRAG \ud83d\ude80", "text": "

To start using GraphRAG, check out the Get Started guide. For a deeper dive into the main sub-systems, please visit the doc pages for the Indexer and Query packages.

"}, {"location": "#graphrag-vs-baseline-rag", "title": "GraphRAG vs Baseline RAG \ud83d\udd0d", "text": "

Retrieval-Augmented Generation (RAG) is a technique for improving LLM outputs using real-world information. This technique is an important part of most LLM-based tools, and the majority of RAG approaches use vector similarity as the search technique, which we call Baseline RAG. GraphRAG uses knowledge graphs to provide substantial improvements in question-and-answer performance when reasoning about complex information. RAG techniques have shown promise in helping LLMs reason about private datasets - data that the LLM is not trained on and has never seen before, such as an enterprise's proprietary research, business documents, or communications. Baseline RAG was created to help solve this problem, but we observe situations where it performs very poorly. For example, Baseline RAG struggles to connect the dots when answering a question requires traversing disparate pieces of information through their shared attributes, and it performs poorly when asked to holistically understand summarized semantic concepts over large data collections or even singular large documents.

To address this, the tech community is working to develop methods that extend and enhance RAG. Microsoft Research's new approach, GraphRAG, uses LLMs to create a knowledge graph based on an input corpus. This graph, along with community summaries and graph machine learning outputs, is used to augment prompts at query time. GraphRAG shows substantial improvement in answering the two classes of questions described above, demonstrating intelligence or mastery that outperforms other approaches previously applied to private datasets.

"}, {"location": "#the-graphrag-process", "title": "The GraphRAG Process \ud83e\udd16", "text": "

GraphRAG builds upon our prior research and tooling using graph machine learning. The basic steps of the GraphRAG process are as follows:

"}, {"location": "#index", "title": "Index", "text": ""}, {"location": "#query", "title": "Query", "text": "

At query time, these structures are used to provide materials for the LLM context window when answering a question. The primary query modes are:

"}, {"location": "#prompt-tuning", "title": "Prompt Tuning", "text": "

Using GraphRAG with your data out of the box may not yield the best possible results. We strongly recommend fine-tuning your prompts following the Prompt Tuning Guide in our documentation.

"}, {"location": "blog_posts/", "title": "Microsoft Research Blog", "text": "