mirror of
				https://github.com/Unstructured-IO/unstructured.git
				synced 2025-10-31 10:03:07 +00:00 
			
		
		
		
	 547bb38d86
			
		
	
	
		547bb38d86
		
			
		
	
	
	
	
		
			
			Add functionality to try other common encodings for html, xml files if an error related to the encoding is raised and the user has not specified an encoding. Change auto.py to have a None default for encoding. Remove the unused parameter encoding from partition_pdf. Add functionality to the read_txt_file utility function to handle file-like object from URL.
		
			
				
	
	
		
			28 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			XML
		
	
	
	
	
	
			
		
		
	
	
			28 lines
		
	
	
		
			1.3 KiB
		
	
	
	
		
			XML
		
	
	
	
	
	
| <?xml version="1.0" encoding="UTF-8"?>
 | ||
| <factbook>
 | ||
|   <country>
 | ||
|     <name>United States</name>
 | ||
|     <capital>Washington, DC</capital>
 | ||
|     <leader>Joe Biden</leader>
 | ||
|     <sport>Baseball</sport>
 | ||
|   </country>
 | ||
|   <country>
 | ||
|     <name>Canada</name>
 | ||
|     <capital>Ottawa</capital>
 | ||
|     <leader>Justin Trudeau</leader>
 | ||
|     <sport>Hockey</sport>
 | ||
|   </country>
 | ||
|   <country>
 | ||
|     <name>France</name>
 | ||
|     <capital>Paris</capital>
 | ||
|     <leader>Emmanuel Macron</leader>
 | ||
|     <sport>Soccer</sport>
 | ||
|   </country>
 | ||
|   <country>
 | ||
|     <name>Trinidad &amp; Tobago</name>
 | ||
|     <capital>Port of Spain</capital>
 | ||
|     <leader>Keith Rowley</leader>
 | ||
|     <sport>Track &amp; Field</sport>
 | ||
|   </country>
 | ||
| </factbook>
 |