mirror of
https://github.com/Unstructured-IO/unstructured.git
synced 2025-06-27 02:30:08 +00:00

Add functionality to try other common encodings for HTML and XML files if an encoding-related error is raised and the user has not specified an encoding. Change auto.py to have a None default for encoding. Remove the unused encoding parameter from partition_pdf. Add functionality to the read_txt_file utility function to handle a file-like object from a URL.
28 lines
1.3 KiB
XML
28 lines
1.3 KiB
XML
<?xml version="1.0" encoding="UTF-8"?>
|
||
<factbook>
|
||
<country>
|
||
<name>United States</name>
|
||
<capital>Washington, DC</capital>
|
||
<leader>Joe Biden</leader>
|
||
<sport>Baseball</sport>
|
||
</country>
|
||
<country>
|
||
<name>Canada</name>
|
||
<capital>Ottawa</capital>
|
||
<leader>Justin Trudeau</leader>
|
||
<sport>Hockey</sport>
|
||
</country>
|
||
<country>
|
||
<name>France</name>
|
||
<capital>Paris</capital>
|
||
<leader>Emmanuel Macron</leader>
|
||
<sport>Soccer</sport>
|
||
</country>
|
||
<country>
|
||
<name>Trinidad &amp; Tobago</name>
|
||
<capital>Port of Spain</capital>
|
||
<leader>Keith Rowley</leader>
|
||
<sport>Track &amp; Field</sport>
|
||
</country>
|
||
</factbook>
|