csv: fix field multiple lines error

pull/4815/head
yuyi 2020-05-10 20:19:26 +08:00 committed by GitHub
parent eabc72d4fe
commit 0606d26ba7
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 53 additions and 23 deletions

View File

@ -98,27 +98,32 @@ fn (r mut Reader) read_record() ?[]string {
if !valid_delim(r.delimiter) {
return err_invalid_delim
}
mut need_read := true
mut keep_raw := false
mut line := ''
mut fields := []string{}
mut i := -1
for {
if need_read {
l := r.read_line() or {
return error(err)
}
if l.len <= 0 {
if keep_raw { line += '\n'}
continue
}
line = l
// skip commented lines
if line[0] == r.comment {
} else if l[0] == r.comment {
if keep_raw { line += '\n' + l }
continue
} else {
if keep_raw { line += '\n'}
line += l
}
break
need_read = false
keep_raw = false
}
mut fields := []string{}
mut i := -1
for {
// not quoted
if line[0] != `"` {
// QTODO i = ...
if line[0] != `"` { // not quoted
j := line.index(r.delimiter.str()) or {
// last
fields << line[..line.len]
@ -128,13 +133,13 @@ fn (r mut Reader) read_record() ?[]string {
fields << line[..i]
line = line[i+1..]
continue
} else { // quoted
j := line[1..].index('"') or {
need_read = true
keep_raw = true
continue
}
// quoted
else {
line = line[1..]
j := line.index('"') or {
break
}
if j+1 == line.len {
// last record
fields << line[..j]

View File

@ -174,3 +174,28 @@ fn test_empty_line() {
}
}
}
fn test_field_multiple_line() {
data := '"name","multiple
line","value"\n"one","first","1"'
mut csv_reader := csv.new_reader(data)
mut row_count := 0
for {
row := csv_reader.read() or {
break
}
row_count++
if row_count == 1 {
assert row[0] == 'name'
assert row[1] == 'multiple\n\n line'
assert row[2] == 'value'
}
if row_count == 2 {
assert row[0] == 'one'
assert row[1] == 'first'
assert row[2] == '1'
}
}
}