From f402e651c67328af25bd90debde0f907ae9f210a Mon Sep 17 00:00:00 2001 From: Chris Mattmann Date: Tue, 17 Jul 2018 00:43:58 -0500 Subject: [PATCH] Fix unit tests with working URLs. --- tika/tests/arguments/test_remote_content.csv | 2 +- tika/tests/arguments/test_remote_metadata.csv | 2 +- tika/tests/test_tika.py | 4 ++-- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/tika/tests/arguments/test_remote_content.csv b/tika/tests/arguments/test_remote_content.csv index 6e6835e..dc8753d 100644 --- a/tika/tests/arguments/test_remote_content.csv +++ b/tika/tests/arguments/test_remote_content.csv @@ -4,5 +4,5 @@ ,"https://studentaid.ed.gov/sites/default/files/fsawg/datacenter/library/FAFSAReportDefinitions.doc",,"FAFSAReportDefinitions.doc" ,"http://open.defense.gov/Portals/23/Documents/FOIA_WebsiteCompliance.ppt",,"FOIA_WebsiteCompliance.ppt" ,"https://catalog.data.gov/dataset/geologic-map-of-the-state-of-hawaii",,"geologic-map-of-the-state-of-hawaii" -,"http://data.octo.dc.gov/Attachment.aspx?where=Citywide&area=&what=CSV&date=Issueddate&from=4/12/2015%2012:00:00%20AM&to=4/19/2015%2010:00:00%20PM&dataset=DCRA_PERMIT&datasetid=5&whereInd=0&areaInd=0&whatInd=0&dateInd=0&whenInd=0",,"DCRA_PERMIT__from04_12_2015__to04_19_2015.csv" +,"https://data.oregon.gov/api/views/i8h7-mn6v/rows.csv?accessType=DOWNLOAD",,"NewBusinessList.csv" ,"http://www.dmdc.osd.mil/Rank_Gender_Race.xls",,"Rank_Gender_Race.xls" diff --git a/tika/tests/arguments/test_remote_metadata.csv b/tika/tests/arguments/test_remote_metadata.csv index deaca54..19e78d4 100644 --- a/tika/tests/arguments/test_remote_metadata.csv +++ b/tika/tests/arguments/test_remote_metadata.csv @@ -14,5 +14,5 @@ ,"http://media.ars.usda.gov/is/mp4/freezeplants.mp4",,"freezeplants.mp4" ,"https://catalog.data.gov/dataset/geologic-map-of-the-state-of-hawaii",,"geologic-map-of-the-state-of-hawaii" ,"http://pubs.usgs.gov/of/2007/1089/Haw_St_tabfiles.zip",,"Haw_St_tabfiles.zip" -,"http://data.octo.dc.gov/Attachment.aspx?where=Citywide&area=&what=CSV&date=Issueddate&from=4/12/2015%2012:00:00%20AM&to=4/19/2015%2010:00:00%20PM&dataset=DCRA_PERMIT&datasetid=5&whereInd=0&areaInd=0&whatInd=0&dateInd=0&whenInd=0",,"DCRA_PERMIT__from04_12_2015__to04_19_2015.csv" +,"https://data.oregon.gov/api/views/i8h7-mn6v/rows.csv?accessType=DOWNLOAD",,"NewBusinessList.csv" ,"http://www.dmdc.osd.mil/Rank_Gender_Race.xls",,"Rank_Gender_Race.xls" diff --git a/tika/tests/test_tika.py b/tika/tests/test_tika.py index fb4853a..7f6773e 100644 --- a/tika/tests/test_tika.py +++ b/tika/tests/test_tika.py @@ -31,11 +31,11 @@ def test_remote_pdf(self): def test_remote_html(self): 'parse remote HTML' self.assertTrue(tika.parser.from_file( - 'https://www.nasa.gov/index.html')) + 'https://www.jpl.nasa.gov/index.html')) def test_remote_mp3(self): 'parese remote mp3' self.assertTrue(tika.parser.from_file( - 'http://tindeck.com/download/pro/viqis/theCalling-Lemming-Version.mp3')) + 'https://archive.org/download/Ainst-Spaceshipdemo.mp3/Ainst-Spaceshipdemo.mp3')) def test_remote_jpg(self): 'parse remote jpg' self.assertTrue(tika.parser.from_file(