1
0
mirror of https://github.com/kellyjonbrazil/jc.git synced 2025-06-17 00:07:37 +02:00
Files
jc/tests/test_csv.py

155 lines
6.3 KiB
Python
Raw Normal View History

2020-03-02 15:05:56 -08:00
import os
import json
import unittest
import jc.parsers.csv
THIS_DIR = os.path.dirname(os.path.abspath(__file__))
class MyTests(unittest.TestCase):
2022-09-23 10:58:28 -07:00
# input
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-biostats.csv'), 'r', encoding='utf-8') as f:
generic_csv_biostats = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-cities.csv'), 'r', encoding='utf-8') as f:
generic_csv_cities = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-deniro.csv'), 'r', encoding='utf-8') as f:
generic_csv_deniro = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-example.csv'), 'r', encoding='utf-8') as f:
generic_csv_example = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-flyrna.tsv'), 'r', encoding='utf-8') as f:
generic_csv_flyrna = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-flyrna2.tsv'), 'r', encoding='utf-8') as f:
generic_csv_flyrna2 = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-homes-pipe.csv'), 'r', encoding='utf-8') as f:
generic_csv_homes_pipe = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-homes.csv'), 'r', encoding='utf-8') as f:
generic_csv_homes = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-insurance.csv'), 'r', encoding='utf-8') as f:
generic_csv_insurance = f.read()
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-doubleqouted.csv'), 'r', encoding='utf-8') as f:
generic_csv_doubleqouted = f.read()
2022-01-02 17:11:20 +02:00
2022-10-25 11:46:31 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-utf-8-bom.csv'), 'r', encoding='utf-8') as f:
generic_csv_utf8_bom = f.read()
2022-09-23 10:58:28 -07:00
# output
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-biostats.json'), 'r', encoding='utf-8') as f:
generic_csv_biostats_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-cities.json'), 'r', encoding='utf-8') as f:
generic_csv_cities_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-deniro.json'), 'r', encoding='utf-8') as f:
generic_csv_deniro_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-example.json'), 'r', encoding='utf-8') as f:
generic_csv_example_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-flyrna.json'), 'r', encoding='utf-8') as f:
generic_csv_flyrna_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-flyrna2.json'), 'r', encoding='utf-8') as f:
generic_csv_flyrna2_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-homes-pipe.json'), 'r', encoding='utf-8') as f:
generic_csv_homes_pipe_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-homes.json'), 'r', encoding='utf-8') as f:
generic_csv_homes_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-09-23 10:58:28 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-insurance.json'), 'r', encoding='utf-8') as f:
generic_csv_insurance_json = json.loads(f.read())
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-doubleqouted.json'), 'r', encoding='utf-8') as f:
generic_csv_doubleqouted_json = json.loads(f.read())
2020-03-02 15:05:56 -08:00
2022-10-25 11:46:31 -07:00
with open(os.path.join(THIS_DIR, os.pardir, 'tests/fixtures/generic/csv-utf-8-bom.json'), 'r', encoding='utf-8') as f:
generic_csv_utf8_bom_json = json.loads(f.read())
2022-01-02 17:11:20 +02:00
2020-06-10 17:22:59 -07:00
def test_csv_nodata(self):
"""
Test with no data
"""
self.assertEqual(jc.parsers.csv.parse('', quiet=True), [])
2020-03-02 15:05:56 -08:00
def test_csv_biostats(self):
"""
Test 'biostats.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_biostats, quiet=True), self.generic_csv_biostats_json)
def test_csv_cities(self):
"""
Test 'cities.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_cities, quiet=True), self.generic_csv_cities_json)
def test_csv_deniro(self):
"""
Test 'deniro.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_deniro, quiet=True), self.generic_csv_deniro_json)
def test_csv_example(self):
"""
Test 'example.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_example, quiet=True), self.generic_csv_example_json)
def test_csv_flyrna(self):
"""
Test 'flyrna.tsv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_flyrna, quiet=True), self.generic_csv_flyrna_json)
def test_csv_flyrna2(self):
"""
Test 'flyrna2.tsv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_flyrna2, quiet=True), self.generic_csv_flyrna2_json)
def test_csv_homes_pipe(self):
"""
Test 'homes-pipe.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_homes_pipe, quiet=True), self.generic_csv_homes_pipe_json)
def test_csv_homes(self):
"""
Test 'homes.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_homes, quiet=True), self.generic_csv_homes_json)
def test_csv_insurance(self):
"""
Test 'insurance.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_insurance, quiet=True), self.generic_csv_insurance_json)
2022-10-25 11:46:31 -07:00
def test_csv_doubleqouted(self):
2022-01-02 17:11:20 +02:00
"""
Test 'csv-doubleqouted.csv' file
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_doubleqouted, quiet=True), self.generic_csv_doubleqouted_json)
2022-10-25 11:46:31 -07:00
def test_csv_utf8_bom(self):
"""
Test 'csv-utf-8-bom.csv' file to ensure the first column is correct if UTF-8 BOM bytes are present
"""
self.assertEqual(jc.parsers.csv.parse(self.generic_csv_utf8_bom, quiet=True), self.generic_csv_utf8_bom_json)
2020-03-02 15:05:56 -08:00
if __name__ == '__main__':
unittest.main()