File: 17744.test

package info (click to toggle)
duckdb 1.5.1-2
  • links: PTS, VCS
  • area: main
  • in suites:
  • size: 299,196 kB
  • sloc: cpp: 865,414; ansic: 57,292; python: 18,871; sql: 12,663; lisp: 11,751; yacc: 7,412; lex: 1,682; sh: 747; makefile: 558
file content (70 lines) | stat: -rw-r--r-- 2,310 bytes parent folder | download | duplicates (3)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
# name: test/sql/copy/csv/17744.test
# description: Test for issue #17744
# group: [csv]

# Run the remainder of this test with the enable_verification pragma switched on
statement ok
PRAGMA enable_verification

# Write the 2048-row csv (plus header) that reproduces the issue
statement ok
COPY (
    -- First row: the value has to begin with a hash for the issue to reproduce
    SELECT '#hash start' AS first_column, 1 AS second_column
    UNION ALL
    -- The quoted value may sit on any row strictly between the first and the last
    -- of the 2048 rows, i.e. between the two rows that contain a hash
    SELECT '"my, quoted value"' AS first_column, 1 AS second_column
    UNION ALL
    -- Filler rows: they bring the csv up to the 2048 rows required to reproduce
    SELECT 'any value' AS first_column, 1 AS second_column
    FROM range(0, 2045)
    UNION ALL
    -- Last row: the hash has to appear in the value, just not as its first character
    SELECT 'hash not at start #' AS first_column, 1 AS second_column
) TO '__TEST_DIR__/test.csv' (FORMAT csv, HEADER 1);

# Sniff test.csv without a comment option: both columns are expected, with an empty comment value
query II
SELECT
    columns,
    comment
FROM sniff_csv('__TEST_DIR__/test.csv', null_padding = true)
----
[{'name': first_column, 'type': VARCHAR}, {'name': second_column, 'type': BIGINT}]	(empty)

# Sniff test.csv with comment = '#' passed explicitly: same columns, and '#' is reported as the comment value
query II
SELECT
    columns,
    comment
FROM sniff_csv('__TEST_DIR__/test.csv', null_padding = true, comment = '#')
----
[{'name': first_column, 'type': VARCHAR}, {'name': second_column, 'type': BIGINT}]	#


# Write the same 2048 rows (plus header) to test_2.csv, this time with QUOTE set to the empty string
statement ok
COPY (
    -- First row: the value has to begin with a hash for the issue to reproduce
    SELECT '#hash start' AS first_column, 1 AS second_column
    UNION ALL
    -- The quoted value may sit on any row strictly between the first and the last
    -- of the 2048 rows, i.e. between the two rows that contain a hash
    SELECT '"my, quoted value"' AS first_column, 1 AS second_column
    UNION ALL
    -- Filler rows: they bring the csv up to the 2048 rows required to reproduce
    SELECT 'any value' AS first_column, 1 AS second_column
    FROM range(0, 2045)
    UNION ALL
    -- Last row: the hash has to appear in the value, just not as its first character
    SELECT 'hash not at start #' AS first_column, 1 AS second_column
) TO '__TEST_DIR__/test_2.csv' (FORMAT csv, HEADER 1, QUOTE '');

# Sniff test_2.csv with default options: both columns are expected, with an empty comment value
query II
SELECT
    columns,
    comment
FROM sniff_csv('__TEST_DIR__/test_2.csv')
----
[{'name': first_column, 'type': VARCHAR}, {'name': second_column, 'type': BIGINT}]	(empty)