graphrag/tests/integration/_pipeline/megapipeline.yml
Nathan Evans f5b4d2fea5
CI streamline (#988)
* Remove excess vars from gh-pages build

* Delete redundant javascript ci

* Pull apart testing CI

* Clean up integration tests build

* Move storage tests to integration CI

* Take py 3.10 out of smoke tests matrix

* Use minimum supported python version for most tests

* Re-run main CI on any test change

* Add Josh and Kenny to author list

* Update auto-resolve perms
2024-08-21 15:16:15 -06:00

65 lines
1.1 KiB
YAML

# Input selection: text files under base_dir whose names match file_pattern.
input:
  file_type: text
  # NOTE(review): relative path; the directory is named "min-csv" but only
  # .txt files are matched below — confirm this fixture is the intended one.
  base_dir: ../../fixtures/min-csv
  # Regex, single-quoted so the backslash is kept literally.
  file_pattern: '.*\.txt$'
# Storage backend selection; "memory" is nested here so it does not collide
# with the `type` keys of other sections.
storage:
  type: memory
# Cache backend selection; "memory" is nested here so it does not collide
# with the `type` keys of other sections.
cache:
  type: memory
# Ordered list of workflows to run. Each entry names a workflow and may carry
# a `config` mapping with per-workflow overrides.
workflows:
  - name: create_base_text_units
    config:
      text_chunk:
        strategy:
          type: sentence

      # Empty chunk_by list: just lump everything together.
      # NOTE(review): assumed to be a config-level key (sibling of text_chunk)
      # — confirm against the workflow definition.
      chunk_by: []

  - name: create_base_extracted_entities
    config:
      graphml_snapshot: true
      entity_extract:
        strategy:
          type: nltk

  - name: create_base_entity_graph
    config:
      graphml_snapshot: true
      embed_graph_enabled: true
      cluster_graph:
        strategy:
          type: leiden
          # NOTE(review): assumed to be an option of the leiden strategy
          # rather than of cluster_graph itself — confirm.
          verbose: true

  # The next three workflows run with no config overrides.
  - name: create_final_nodes

  - name: create_base_documents

  - name: create_final_communities

  # The remaining workflows all select the "mock" text_embed strategy
  # (presumably so no real embedding model is needed — confirm).
  - name: create_final_text_units
    config:
      text_embed:
        strategy:
          type: mock

  - name: create_final_entities
    config:
      text_embed:
        strategy:
          type: mock

  - name: create_final_documents
    config:
      text_embed:
        strategy:
          type: mock

  - name: create_final_relationships
    config:
      text_embed:
        strategy:
          type: mock