Tests for bz2, xz & zip URLs · pandas-dev/pandas@25114c3 (original) (raw)

`@@ -14,23 +14,63 @@

`

14

14

`from pandas.io.parsers import read_csv, read_table

`

15

15

``

16

16

``

17

``

`-

class TestUrlGz(tm.TestCase):

`

``

17

`+

class TestCompressedUrl(tm.TestCase):

`

18

18

``

19

19

`def setUp(self):

`

20

20

`dirpath = tm.get_data_path()

`

21

``

`-

localtable = os.path.join(dirpath, 'salaries.csv')

`

22

``

`-

self.local_table = read_table(localtable)

`

``

21

`+

path = os.path.join(dirpath, 'salary.table.csv')

`

``

22

`+

self.local_table = read_table(path)

`

``

23

`+

NOTE: change URL once https://github.com/pandas-dev/pandas/pull/14587

`

``

24

`+

is merged.

`

``

25

`+

self.base_url = ('https://github.com/dhimmel/pandas/raw/'

`

``

26

`+

'24341b53341455433abcb6d01a2c7b4071e35316/'

`

``

27

`+

'pandas/io/tests/parser/data/salaries.csv')

`

23

28

``

24

29

`@tm.network

`

25

30

`def test_url_gz(self):

`

26

``

`-

url = ('https://raw.github.com/pandas-dev/pandas/'

`

27

``

`-

'master/pandas/io/tests/parser/data/salaries.csv.gz')

`

``

31

`+

url = self.base_url + '.gz'

`

28

32

`url_table = read_table(url, compression="gzip", engine="python")

`

29

33

`tm.assert_frame_equal(url_table, self.local_table)

`

30

34

``

``

35

`+

@tm.network

`

``

36

`+

def test_url_bz2(self):

`

``

37

`+

url = self.base_url + '.bz2'

`

``

38

`+

url_table = read_table(url, compression="bz2", engine="python")

`

``

39

`+

tm.assert_frame_equal(url_table, self.local_table)

`

``

40

+

``

41

`+

@tm.network

`

``

42

`+

def test_url_xz(self):

`

``

43

`+

url = self.base_url + '.xz'

`

``

44

`+

url_table = read_table(url, compression="zip", engine="python")

`

``

45

`+

tm.assert_frame_equal(url_table, self.local_table)

`

``

46

+

``

47

`+

@tm.network

`

``

48

`+

def test_url_zip(self):

`

``

49

`+

url = self.base_url + '.zip'

`

``

50

`+

url_table = read_table(url, compression="zip", engine="python")

`

``

51

`+

tm.assert_frame_equal(url_table, self.local_table)

`

``

52

+

31

53

`@tm.network

`

32

54

`def test_url_gz_infer(self):

`

33

``

`-

url = 'https://s3.amazonaws.com/pandas-test/salary.table.gz'

`

``

55

`+

url = self.base_url + '.gz'

`

``

56

`+

url_table = read_table(url, compression="infer", engine="python")

`

``

57

`+

tm.assert_frame_equal(url_table, self.local_table)

`

``

58

+

``

59

`+

@tm.network

`

``

60

`+

def test_url_bz2_infer(self):

`

``

61

`+

url = self.base_url + '.bz2'

`

``

62

`+

url_table = read_table(url, compression="infer", engine="python")

`

``

63

`+

tm.assert_frame_equal(url_table, self.local_table)

`

``

64

+

``

65

`+

@tm.network

`

``

66

`+

def test_url_xz_infer(self):

`

``

67

`+

url = self.base_url + '.xz'

`

``

68

`+

url_table = read_table(url, compression="infer", engine="python")

`

``

69

`+

tm.assert_frame_equal(url_table, self.local_table)

`

``

70

+

``

71

`+

@tm.network

`

``

72

`+

def test_url_zip_infer(self):

`

``

73

`+

url = self.base_url + '.zip'

`

34

74

`url_table = read_table(url, compression="infer", engine="python")

`

35

75

`tm.assert_frame_equal(url_table, self.local_table)

`

36

76

``