mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-06-27 02:30:08 +00:00

**Summary**
Step 2 in prep for pluggable auto-partitioners: remove the `regex_metadata` field from `ElementMetadata`.

**Additional Context**
- `regex_metadata` was an experimental feature that didn't pan out.
- It's implemented by one of the post-partitioning metadata decorators, so get rid of it as part of the cleanup before consolidating those decorators.
41 lines
868 B
SQL
41 lines
868 B
SQL
-- Schema for the `elements` table.
--
-- `id` is the primary key. No other column declares a NOT NULL, DEFAULT,
-- UNIQUE, CHECK, or foreign-key constraint, so every non-key column is
-- nullable and unvalidated at the database level.
--
-- NOTE(review): the target SQL dialect is not stated in this file; confirm
-- how the engine in use treats the TEXT / REAL / DECIMAL declarations.
CREATE TABLE elements (
    id TEXT PRIMARY KEY,
    element_id TEXT,
    text TEXT,
    embeddings TEXT,
    type TEXT,
    system TEXT,
    layout_width REAL,
    layout_height REAL,
    points TEXT,
    url TEXT,
    version TEXT,
    -- NOTE(review): the date_* columns and last_modified are declared TEXT,
    -- not a date/timestamp type; presumably serialized timestamps; confirm
    -- the expected format with the code that writes these rows.
    date_created TEXT,
    date_modified TEXT,
    date_processed TEXT,
    permissions_data TEXT,
    record_locator TEXT,
    category_depth INTEGER,
    -- NOTE(review): no FOREIGN KEY is declared for parent_id; whether it
    -- refers to another row of this table is not established here.
    parent_id TEXT,
    attached_filename TEXT,
    filetype TEXT,
    last_modified TEXT,
    file_directory TEXT,
    filename TEXT,
    languages TEXT,
    -- NOTE(review): page_number is declared TEXT rather than INTEGER; kept
    -- as-is so existing writers and readers are unaffected.
    page_number TEXT,
    links TEXT,
    page_name TEXT,
    link_urls TEXT,
    link_texts TEXT,
    sent_from TEXT,
    sent_to TEXT,
    subject TEXT,
    section TEXT,
    header_footer_type TEXT,
    emphasized_text_contents TEXT,
    emphasized_text_tags TEXT,
    text_as_html TEXT,
    -- DECIMAL is declared without precision/scale.
    detection_class_prob DECIMAL
);