File: test_potential_dialects.py

package info (click to toggle)
python-clevercsv 0.7.5%2Bds-1
  • links: PTS, VCS
  • area: main
  • in suites: bookworm
  • size: 872 kB
  • sloc: python: 5,076; ansic: 763; makefile: 81
file content (44 lines) | stat: -rw-r--r-- 1,367 bytes parent folder | download
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
# -*- coding: utf-8 -*-

"""
Unit tests for the potential dialect selection.

Author: Gertjan van den Burg

"""

import unittest

from clevercsv.potential_dialects import filter_urls
from clevercsv.potential_dialects import get_delimiters
from clevercsv.potential_dialects import get_quotechars
from clevercsv.potential_dialects import masked_by_quotechar


class PotentialDialectTestCase(unittest.TestCase):
    def test_masked_by_quotechar(self):
        self.assertTrue(masked_by_quotechar('A"B&C"A', '"', "", "&"))
        self.assertFalse(masked_by_quotechar('A"B&C"A&A', '"', "", "&"))
        self.assertFalse(masked_by_quotechar('A|"B&C"A', '"', "|", "&"))
        self.assertFalse(masked_by_quotechar('A"B"C', '"', "", ""))

    def test_filter_urls(self):
        data = "A,B\nwww.google.com,10\nhttps://gertjanvandenburg.com,25\n"
        exp = "A,B\nU,10\nU,25\n"
        self.assertEqual(exp, filter_urls(data))

    def test_get_quotechars(self):
        data = "A,B,'A',B\"D\"E"
        exp = set(['"', "'", ""])
        out = get_quotechars(data)
        self.assertEqual(out, exp)

    def test_get_delimiters(self):
        data = "A,B|CD,E;F\tD123£123€10.,0"
        exp = set([",", "|", ";", "\t", "€", "£", ""])
        out = get_delimiters(data, "UTF-8")
        self.assertEqual(out, exp)


if __name__ == "__main__":
    unittest.main()