mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-07-03 07:05:20 +00:00

Adds OpenSearch as a source and destination. Since OpenSearch is a fork of Elasticsearch, these connectors rely heavily on inheriting the Elasticsearch connectors whenever possible. - Adds OpenSearch source connector to be able to ingest documents from OpenSearch. - Adds OpenSearch destination connector to be able to ingest documents from any supported source, embed them and write the embeddings / documents into OpenSearch. - Defines an example unstructured elements schema for users to be able to setup their unstructured OpenSearch indexes easily. --------- Co-authored-by: potter-potter <david.potter@gmail.com>
25 lines
695 B
Python
25 lines
695 B
Python
#!/usr/bin/env python3
|
|
|
|
from opensearch_cluster_config import (
|
|
INDEX_NAME,
|
|
mappings,
|
|
)
|
|
from opensearchpy import OpenSearch
|
|
|
|
print("Connecting to the OpenSearch cluster.")
|
|
client = OpenSearch(
|
|
hosts=[{"host": "localhost", "port": 9200}],
|
|
http_auth=("admin", "admin"),
|
|
use_ssl=True,
|
|
verify_certs=False,
|
|
ssl_show_warn=False,
|
|
)
|
|
print(client.info())
|
|
|
|
print("Creating an OpenSearch index for testing ingest opensearch destination connector.")
|
|
response = client.indices.create(index=INDEX_NAME, body=mappings)
|
|
if not response["acknowledged"]:
|
|
raise RuntimeError("failed to create index")
|
|
|
|
print("Succesfully created an OpenSearch index for testing opensearch ingest.")
|