Skip to content

Commit

Permalink
Fixes #16559 - Do not trim leading spaces for tab delimited
Browse files Browse the repository at this point in the history
  • Loading branch information
richmahn committed Oct 26, 2021
1 parent b428b0f commit ec3137b
Show file tree
Hide file tree
Showing 2 changed files with 49 additions and 8 deletions.
6 changes: 5 additions & 1 deletion modules/csv/csv.go
Original file line number Diff line number Diff line change
Expand Up @@ -22,7 +22,11 @@ var quoteRegexp = regexp.MustCompile(`["'][\s\S]+?["']`)
func CreateReader(input io.Reader, delimiter rune) *stdcsv.Reader {
rd := stdcsv.NewReader(input)
rd.Comma = delimiter
rd.TrimLeadingSpace = true
if delimiter != '\t' && delimiter != ' ' {
// TrimLeadingSpace can't be true when delimiter is a tab or a space as the value for a column might be empty,
// thus would change `\t\t` to just `\t` or ` ` (two spaces) to just ` ` (single space)
rd.TrimLeadingSpace = true
}
return rd
}

Expand Down
51 changes: 44 additions & 7 deletions modules/csv/csv_test.go
Original file line number Diff line number Diff line change
Expand Up @@ -18,15 +18,52 @@ func TestCreateReader(t *testing.T) {
}

func TestCreateReaderAndGuessDelimiter(t *testing.T) {
input := "a;b;c\n1;2;3\n4;5;6"
var csvToRowsMap = map[string][][]string{
`col1 col2 col3
a b c
e f
g h i
j l
m n
p q r
u
v w x
y
`: {{"col1", "col2", "col3"},
{"a", "b", "c"},
{"", "e", "f"},
{"g", "h", "i"},
{"j", "", "l"},
{"m", "n", ""},
{"p", "q", "r"},
{"", "", "u"},
{"v", "w", "x"},
{"y", "", ""},
{"", "", ""}},
` col1,col2,col3
a, b, c
d,e,f
,h, i
j, ,
, , `: {{"col1", "col2", "col3"},
{"a", "b", "c"},
{"d", "e", "f"},
{"", "h", "i"},
{"j", "", ""},
{"", "", ""}},
}

rd, err := CreateReaderAndGuessDelimiter(strings.NewReader(input))
assert.NoError(t, err)
assert.Equal(t, ';', rd.Comma)
for csv, expectedRows := range csvToRowsMap {
rd, err := CreateReaderAndGuessDelimiter(strings.NewReader(csv))
assert.NoError(t, err)
rows, err := rd.ReadAll()
assert.NoError(t, err)
assert.EqualValues(t, rows, expectedRows)
}
}

func TestGuessDelimiter(t *testing.T) {
var kases = map[string]rune{
var csvToDelimiterMap = map[string]rune{
"a": ',',
"1,2": ',',
"1;2": ';',
Expand All @@ -37,7 +74,7 @@ func TestGuessDelimiter(t *testing.T) {
"<br/>": ',',
}

for k, v := range kases {
assert.EqualValues(t, guessDelimiter([]byte(k)), v)
for csv, expectedDelimiter := range csvToDelimiterMap {
assert.EqualValues(t, guessDelimiter([]byte(csv)), expectedDelimiter)
}
}

0 comments on commit ec3137b

Please sign in to comment.