mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-06-27 02:30:08 +00:00

* first pass on partition_xml * add option to keep xml tags * added tests for xml * fix filename * update filenames * remove outdated readme * add xml to auto * version and changelog * update readme and docs * pass through include_metadata * update include_metadata description * add README back in * linting, linting, linting * more linting * spooled to bytes doesnt need to be a tuple * Add tests for newly supported filetypes * Correct metadata filetype * doc typo Co-authored-by: qued <64741807+qued@users.noreply.github.com> * typo fix Co-authored-by: qued <64741807+qued@users.noreply.github.com> * typo fix Co-authored-by: qued <64741807+qued@users.noreply.github.com> * keep_xml_tags -> xml_keep_tags --------- Co-authored-by: Alan Bertl <alan@unstructured.io> Co-authored-by: qued <64741807+qued@users.noreply.github.com>
28 lines
669 B
XML
28 lines
669 B
XML
<?xml version="1.0" encoding="UTF-8"?>
|
|
<factbook>
|
|
<country>
|
|
<name>United States</name>
|
|
<capital>Washington, DC</capital>
|
|
<leader>Joe Biden</leader>
|
|
<sport>Baseball</sport>
|
|
</country>
|
|
<country>
|
|
<name>Canada</name>
|
|
<capital>Ottawa</capital>
|
|
<leader>Justin Trudeau</leader>
|
|
<sport>Hockey</sport>
|
|
</country>
|
|
<country>
|
|
<name>France</name>
|
|
<capital>Paris</capital>
|
|
<leader>Emmanuel Macron</leader>
|
|
<sport>Soccer</sport>
|
|
</country>
|
|
<country>
|
|
<name>Trinidad &amp; Tobago</name>
|
|
<capital>Port of Spain</capital>
|
|
<leader>Keith Rowley</leader>
|
|
<sport>Track &amp; Field</sport>
|
|
</country>
|
|
</factbook>
|