@@ -136,6 +136,27 @@ fn prop_frequency() {
136
136
qcheck_sized ( p as fn ( CsvData ) -> bool , 2 ) ;
137
137
}
138
138
139
+
140
+ // This tests that running the frequency command on a CSV file with these two
141
+ // rows does not burst in flames:
142
+ //
143
+ // \u{FEFF}
144
+ // ""
145
+ //
146
+ // In this case, the `param_prop_frequency` just ignores this particular test.
147
+ // Namely, \u{FEFF} is the UTF-8 BOM, which is ignored by the underlying CSV
148
+ // reader.
149
+ #[ test]
150
+ fn frequency_bom ( ) {
151
+ let rows = CsvData {
152
+ data : vec ! [
153
+ :: CsvRecord ( vec![ "\u{FEFF} " . to_string( ) ] ) ,
154
+ :: CsvRecord ( vec![ "" . to_string( ) ] ) ,
155
+ ] ,
156
+ } ;
157
+ assert ! ( param_prop_frequency( "prop_frequency" , rows, false ) )
158
+ }
159
+
139
160
// This tests that a frequency table computed by `xsv` (with an index) is
140
161
// always the same as the frequency table computed in memory.
141
162
#[ test]
@@ -149,6 +170,9 @@ fn prop_frequency_indexed() {
149
170
}
150
171
151
172
fn param_prop_frequency ( name : & str , rows : CsvData , idx : bool ) -> bool {
173
+ if !rows. is_empty ( ) && rows[ 0 ] [ 0 ] . len ( ) == 3 && rows[ 0 ] [ 0 ] == "\u{FEFF} " {
174
+ return true ;
175
+ }
152
176
let wrk = Workdir :: new ( name) ;
153
177
if idx {
154
178
wrk. create_indexed ( "in.csv" , rows. clone ( ) ) ;
@@ -159,7 +183,8 @@ fn param_prop_frequency(name: &str, rows: CsvData, idx: bool) -> bool {
159
183
let mut cmd = wrk. command ( "frequency" ) ;
160
184
cmd. arg ( "in.csv" ) . args ( & [ "-j" , "4" ] ) . args ( & [ "--limit" , "0" ] ) ;
161
185
162
- let got_ftables = ftables_from_csv_string ( wrk. stdout :: < String > ( & mut cmd) ) ;
186
+ let stdout = wrk. stdout :: < String > ( & mut cmd) ;
187
+ let got_ftables = ftables_from_csv_string ( stdout) ;
163
188
let expected_ftables = ftables_from_rows ( rows) ;
164
189
assert_eq_ftables ( & got_ftables, & expected_ftables)
165
190
}
0 commit comments