csv: fix field multiple lines error

pull/4815/head
yuyi 2020-05-10 20:19:26 +08:00 committed by GitHub
parent eabc72d4fe
commit 0606d26ba7
No known key found for this signature in database
GPG Key ID: 4AEE18F83AFDEB23
2 changed files with 53 additions and 23 deletions

View File

@ -98,27 +98,32 @@ fn (r mut Reader) read_record() ?[]string {
if !valid_delim(r.delimiter) { if !valid_delim(r.delimiter) {
return err_invalid_delim return err_invalid_delim
} }
mut need_read := true
mut keep_raw := false
mut line := '' mut line := ''
for {
l := r.read_line() or {
return error(err)
}
if l.len <= 0 {
continue
}
line = l
// skip commented lines
if line[0] == r.comment {
continue
}
break
}
mut fields := []string{} mut fields := []string{}
mut i := -1 mut i := -1
for { for {
// not quoted if need_read {
if line[0] != `"` { l := r.read_line() or {
// QTODO i = ... return error(err)
}
if l.len <= 0 {
if keep_raw { line += '\n'}
continue
} else if l[0] == r.comment {
if keep_raw { line += '\n' + l }
continue
} else {
if keep_raw { line += '\n'}
line += l
}
need_read = false
keep_raw = false
}
if line[0] != `"` { // not quoted
j := line.index(r.delimiter.str()) or { j := line.index(r.delimiter.str()) or {
// last // last
fields << line[..line.len] fields << line[..line.len]
@ -128,13 +133,13 @@ fn (r mut Reader) read_record() ?[]string {
fields << line[..i] fields << line[..i]
line = line[i+1..] line = line[i+1..]
continue continue
} } else { // quoted
// quoted j := line[1..].index('"') or {
else { need_read = true
line = line[1..] keep_raw = true
j := line.index('"') or { continue
break
} }
line = line[1..]
if j+1 == line.len { if j+1 == line.len {
// last record // last record
fields << line[..j] fields << line[..j]

View File

@ -174,3 +174,28 @@ fn test_empty_line() {
} }
} }
} }
fn test_field_multiple_line() {
data := '"name","multiple
line","value"\n"one","first","1"'
mut csv_reader := csv.new_reader(data)
mut row_count := 0
for {
row := csv_reader.read() or {
break
}
row_count++
if row_count == 1 {
assert row[0] == 'name'
assert row[1] == 'multiple\n\n line'
assert row[2] == 'value'
}
if row_count == 2 {
assert row[0] == 'one'
assert row[1] == 'first'
assert row[2] == '1'
}
}
}