Tests for bz2, xz & zip URLs · pandas-dev/pandas@25114c3 (original) (raw)
`@@ -14,23 +14,63 @@
`
14
14
`from pandas.io.parsers import read_csv, read_table
`
15
15
``
16
16
``
17
``
`-
class TestUrlGz(tm.TestCase):
`
``
17
`+
class TestCompressedUrl(tm.TestCase):
`
18
18
``
19
19
`def setUp(self):
`
20
20
`dirpath = tm.get_data_path()
`
21
``
`-
localtable = os.path.join(dirpath, 'salaries.csv')
`
22
``
`-
self.local_table = read_table(localtable)
`
``
21
`+
path = os.path.join(dirpath, 'salary.table.csv')
`
``
22
`+
self.local_table = read_table(path)
`
``
23
`+
NOTE: change URL once https://github.com/pandas-dev/pandas/pull/14587
`
``
24
`+
is merged.
`
``
25
`+
self.base_url = ('https://github.com/dhimmel/pandas/raw/'
`
``
26
`+
'24341b53341455433abcb6d01a2c7b4071e35316/'
`
``
27
`+
'pandas/io/tests/parser/data/salaries.csv')
`
23
28
``
24
29
`@tm.network
`
25
30
`def test_url_gz(self):
`
26
``
`-
url = ('https://raw.github.com/pandas-dev/pandas/'
`
27
``
`-
'master/pandas/io/tests/parser/data/salaries.csv.gz')
`
``
31
`+
url = self.base_url + '.gz'
`
28
32
`url_table = read_table(url, compression="gzip", engine="python")
`
29
33
`tm.assert_frame_equal(url_table, self.local_table)
`
30
34
``
``
35
`+
@tm.network
`
``
36
`+
def test_url_bz2(self):
`
``
37
`+
url = self.base_url + '.bz2'
`
``
38
`+
url_table = read_table(url, compression="bz2", engine="python")
`
``
39
`+
tm.assert_frame_equal(url_table, self.local_table)
`
``
40
+
``
41
`+
@tm.network
`
``
42
`+
def test_url_xz(self):
`
``
43
`+
url = self.base_url + '.xz'
`
``
44
`+
url_table = read_table(url, compression="zip", engine="python")
`
``
45
`+
tm.assert_frame_equal(url_table, self.local_table)
`
``
46
+
``
47
`+
@tm.network
`
``
48
`+
def test_url_zip(self):
`
``
49
`+
url = self.base_url + '.zip'
`
``
50
`+
url_table = read_table(url, compression="zip", engine="python")
`
``
51
`+
tm.assert_frame_equal(url_table, self.local_table)
`
``
52
+
31
53
`@tm.network
`
32
54
`def test_url_gz_infer(self):
`
33
``
`-
url = 'https://s3.amazonaws.com/pandas-test/salary.table.gz'
`
``
55
`+
url = self.base_url + '.gz'
`
``
56
`+
url_table = read_table(url, compression="infer", engine="python")
`
``
57
`+
tm.assert_frame_equal(url_table, self.local_table)
`
``
58
+
``
59
`+
@tm.network
`
``
60
`+
def test_url_bz2_infer(self):
`
``
61
`+
url = self.base_url + '.bz2'
`
``
62
`+
url_table = read_table(url, compression="infer", engine="python")
`
``
63
`+
tm.assert_frame_equal(url_table, self.local_table)
`
``
64
+
``
65
`+
@tm.network
`
``
66
`+
def test_url_xz_infer(self):
`
``
67
`+
url = self.base_url + '.xz'
`
``
68
`+
url_table = read_table(url, compression="infer", engine="python")
`
``
69
`+
tm.assert_frame_equal(url_table, self.local_table)
`
``
70
+
``
71
`+
@tm.network
`
``
72
`+
def test_url_zip_infer(self):
`
``
73
`+
url = self.base_url + '.zip'
`
34
74
`url_table = read_table(url, compression="infer", engine="python")
`
35
75
`tm.assert_frame_equal(url_table, self.local_table)
`
36
76
``