58 lines
1 KiB
Go
58 lines
1 KiB
Go
|
package chart
|
||
|
|
||
|
import "strings"
|
||
|
|
||
|
// SplitCSV splits a corpus by the `,`, dropping leading or trailing whitespace unless quoted.
|
||
|
func SplitCSV(text string) (output []string) {
|
||
|
if len(text) == 0 {
|
||
|
return
|
||
|
}
|
||
|
|
||
|
var state int
|
||
|
var word []rune
|
||
|
var opened rune
|
||
|
for _, r := range text {
|
||
|
switch state {
|
||
|
case 0: // word
|
||
|
if isQuote(r) {
|
||
|
opened = r
|
||
|
state = 1
|
||
|
} else if isCSVDelim(r) {
|
||
|
output = append(output, strings.TrimSpace(string(word)))
|
||
|
word = nil
|
||
|
} else {
|
||
|
word = append(word, r)
|
||
|
}
|
||
|
case 1: // we're in a quoted section
|
||
|
if matchesQuote(opened, r) {
|
||
|
state = 0
|
||
|
continue
|
||
|
}
|
||
|
word = append(word, r)
|
||
|
}
|
||
|
}
|
||
|
|
||
|
if len(word) > 0 {
|
||
|
output = append(output, strings.TrimSpace(string(word)))
|
||
|
}
|
||
|
return
|
||
|
}
|
||
|
|
||
|
func isCSVDelim(r rune) bool {
|
||
|
return r == rune(',')
|
||
|
}
|
||
|
|
||
|
func isQuote(r rune) bool {
|
||
|
return r == '"' || r == '\'' || r == '“' || r == '”' || r == '`'
|
||
|
}
|
||
|
|
||
|
func matchesQuote(a, b rune) bool {
|
||
|
if a == '“' && b == '”' {
|
||
|
return true
|
||
|
}
|
||
|
if a == '”' && b == '“' {
|
||
|
return true
|
||
|
}
|
||
|
return a == b
|
||
|
}
|