Skip to content

Commit 92de288

Browse files
committed
frequency: fix BOM bug
1 parent 4b308ad commit 92de288

File tree

1 file changed

+26
-1
lines changed

1 file changed

+26
-1
lines changed

tests/test_frequency.rs

+26-1
Original file line numberDiff line numberDiff line change
@@ -136,6 +136,27 @@ fn prop_frequency() {
136136
qcheck_sized(p as fn(CsvData) -> bool, 2);
137137
}
138138

139+
140+
// This tests that running the frequency command on a CSV file with these two
141+
// rows does not burst in flames:
142+
//
143+
// \u{FEFF}
144+
// ""
145+
//
146+
// In this case, the `param_prop_frequency` just ignores this particular test.
147+
// Namely, \u{FEFF} is the UTF-8 BOM, which is ignored by the underlying CSV
148+
// reader.
149+
#[test]
150+
fn frequency_bom() {
151+
let rows = CsvData {
152+
data: vec![
153+
::CsvRecord(vec!["\u{FEFF}".to_string()]),
154+
::CsvRecord(vec!["".to_string()]),
155+
],
156+
};
157+
assert!(param_prop_frequency("prop_frequency", rows, false))
158+
}
159+
139160
// This tests that a frequency table computed by `xsv` (with an index) is
140161
// always the same as the frequency table computed in memory.
141162
#[test]
@@ -149,6 +170,9 @@ fn prop_frequency_indexed() {
149170
}
150171

151172
fn param_prop_frequency(name: &str, rows: CsvData, idx: bool) -> bool {
173+
if !rows.is_empty() && rows[0][0].len() == 3 && rows[0][0] == "\u{FEFF}" {
174+
return true;
175+
}
152176
let wrk = Workdir::new(name);
153177
if idx {
154178
wrk.create_indexed("in.csv", rows.clone());
@@ -159,7 +183,8 @@ fn param_prop_frequency(name: &str, rows: CsvData, idx: bool) -> bool {
159183
let mut cmd = wrk.command("frequency");
160184
cmd.arg("in.csv").args(&["-j", "4"]).args(&["--limit", "0"]);
161185

162-
let got_ftables = ftables_from_csv_string(wrk.stdout::<String>(&mut cmd));
186+
let stdout = wrk.stdout::<String>(&mut cmd);
187+
let got_ftables = ftables_from_csv_string(stdout);
163188
let expected_ftables = ftables_from_rows(rows);
164189
assert_eq_ftables(&got_ftables, &expected_ftables)
165190
}

0 commit comments

Comments
 (0)