Skip to content

Commit cc3e47e

Browse files
committed
let all filter names start with capital
1 parent 62dfe7d commit cc3e47e

File tree

2 files changed

+29
-29
lines changed

2 files changed

+29
-29
lines changed

doc/source/stringsext--man.md

Lines changed: 5 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -110,7 +110,7 @@ as *GNU strings* replacement.
110110

111111
The integer AF is notated in hexadecimal with prefix `0x...`.
112112
For the most common use-cases, predefined filters can be set:
113-
e.g. alias names like `all-ctrl` or `all-ctrl+wsp` are shorthand
113+
e.g. alias names like `All-Ctrl` or `All-Ctrl+Wsp` are shorthand
114114
terms for ASCII-filters "all codes, but no control-codes" or
115115
"all codes, including white-space, but no control-codes".
116116
See the output of `--list-encodings` for more details
@@ -240,7 +240,7 @@ as *GNU strings* replacement.
240240
shows all UTF-8-leading-bytes and their codes.
241241

242242
Alternatively, predefined alias names for the most common Unicode-blocks
243-
can be used: e.g.`latin`, `cyrillic`, `greek` and others. See the output of
243+
can be used: e.g. `Latin`, `Cyrillic`, `Greek` and others. See the output of
244244
`--list-encodings` for more predefined filter names.
245245

246246

@@ -329,15 +329,15 @@ Reduce the number of false positives, when scanning for
329329
UTF-16LE or UTF-16BE encoded strings. In the following example
330330
we search for Cyrillic only:
331331

332-
stringsext -t x -e UTF-16le,,none,cyrillic someimage.raw
332+
stringsext -t x -e UTF-16le,,None,Cyrillic someimage.raw
333333

334334
Search for UTF-16LE encoded Arabic and the digits 0 to 9:
335335

336-
stringsext -t x -e UTF-16le,,0x3f000000000000,arabic someimage.raw
336+
stringsext -t x -e UTF-16le,,0x3f000000000000,Arabic someimage.raw
337337

338338
Search for UTF-8 encoded Syriac and all ASCII, control-codes excluded:
339339

340-
stringsext -t x -e UTF-8,,all-ctrl,0x10000000 someimage.raw
340+
stringsext -t x -e UTF-8,,All-Ctrl,0x10000000 someimage.raw
341341

342342
Combine Little-Endian and Big-Endian scanning:
343343

src/mission.rs

Lines changed: 24 additions & 24 deletions
Original file line numberDiff line numberDiff line change
@@ -163,53 +163,53 @@ pub const UBF_UNCOMMON: u64 = 0x000f_0000_0000_0000;
163163
/// For value see chapter *Codepage layout* in
164164
/// [UTF-8 - Wikipedia](https://en.wikipedia.org/wiki/UTF-8)
165165
pub const UNICODE_BLOCK_FILTER_ALIASSE: [([u8; 12], u64, [u8; 25]); 18] = [
166-
(*b"african ", UBF_AFRICAN, *b"all in U+540..U+800 "),
166+
(*b"African ", UBF_AFRICAN, *b"all in U+540..U+800 "),
167167
(
168-
*b"all-asian ",
168+
*b"All-Asian ",
169169
UBF_ALL & !UBF_INVALID & !UBF_ASIAN,
170170
*b"all, except Asian ",
171171
),
172172
(
173-
*b"all ",
173+
*b"All ",
174174
UBF_ALL & !UBF_INVALID,
175175
*b"all valid multibyte UTF-8",
176176
),
177177
(
178-
*b"arabic ",
178+
*b"Arabic ",
179179
UBF_ARABIC | UBF_SYRIAC,
180180
*b"Arabic+Syriac ",
181181
),
182182
(
183-
*b"armenian ",
183+
*b"Armenian ",
184184
UBF_ARMENIAN,
185185
*b"Armenian ",
186186
),
187-
(*b"asian ", UBF_ASIAN, *b"all in U+3000..U+E000 "),
188-
(*b"cjk ", UBF_CJK, *b"CJK : U+4000..U+A000 "),
189-
(*b"common ", UBF_COMMON, *b"all 2-byte-UFT-8 "),
187+
(*b"Asian ", UBF_ASIAN, *b"all in U+3000..U+E000 "),
188+
(*b"CJK ", UBF_CJK, *b"CJK : U+4000..U+A000 "),
189+
(*b"Common ", UBF_COMMON, *b"all 2-byte-UFT-8 "),
190190
(
191-
*b"cyrillic ",
191+
*b"Cyrillic ",
192192
UBF_CYRILLIC,
193193
*b"Cyrillic ",
194194
),
195195
(
196-
*b"default ",
196+
*b"Default ",
197197
UBF_ALL & !UBF_INVALID,
198198
*b"all valid multibyte UTF-8",
199199
),
200-
(*b"greek ", UBF_GREEK, *b"Greek "),
201-
(*b"hangul ", UBF_HANGUL, *b"Hangul: U+B000..U+E000 "),
202-
(*b"hebrew ", UBF_HEBREW, *b"Hebrew "),
203-
(*b"kana ", UBF_KANA, *b"Kana: U+3000..U+4000 "),
200+
(*b"Greek ", UBF_GREEK, *b"Greek "),
201+
(*b"Hangul ", UBF_HANGUL, *b"Hangul: U+B000..U+E000 "),
202+
(*b"Hebrew ", UBF_HEBREW, *b"Hebrew "),
203+
(*b"Kana ", UBF_KANA, *b"Kana: U+3000..U+4000 "),
204204
(
205-
*b"latin ",
205+
*b"Latin ",
206206
UBF_LATIN | UBF_ACCENTS,
207207
*b"Latin + accents ",
208208
),
209-
(*b"none ", !UBF_ALL, *b"block all multibyte UTF-8"),
210-
(*b"private ", UBF_PUA, *b"private use areas "),
209+
(*b"None ", !UBF_ALL, *b"block all multibyte UTF-8"),
210+
(*b"Private ", UBF_PUA, *b"private use areas "),
211211
(
212-
*b"uncommon ",
212+
*b"Uncommon ",
213213
UBF_UNCOMMON | UBF_PUA,
214214
*b"private + all>=U+10_000 ",
215215
),
@@ -242,21 +242,21 @@ pub const AF_WHITESPACE: u128 = 0x0000_0000_0000_0000_0000_0001_0000_0200;
242242
pub const AF_DEFAULT: u128 = AF_ALL & !AF_CTRL | AF_WHITESPACE;
243243

244244
pub const ASCII_FILTER_ALIASSE: [([u8; 12], u128, [u8; 25]); 6] = [
245-
(*b"all ", AF_ALL, *b"all ASCII = pass all "),
245+
(*b"All ", AF_ALL, *b"all ASCII = pass all "),
246246
(
247-
*b"all-ctrl ",
247+
*b"All-Ctrl ",
248248
AF_ALL & !AF_CTRL,
249249
*b"all-control ",
250250
),
251251
(
252-
*b"all-ctrl+wsp",
252+
*b"All-Ctrl+Wsp",
253253
AF_ALL & !AF_CTRL | AF_WHITESPACE,
254254
*b"all-control+whitespace ",
255255
),
256-
(*b"default ", AF_DEFAULT, *b"all-control+whitespace "),
257-
(*b"none ", AF_NONE, *b"no ASCII = block all "),
256+
(*b"Default ", AF_DEFAULT, *b"all-control+whitespace "),
257+
(*b"None ", AF_NONE, *b"no ASCII = block all "),
258258
(
259-
*b"wsp ",
259+
*b"Wsp ",
260260
AF_WHITESPACE,
261261
*b"only white-space ",
262262
),

0 commit comments

Comments
 (0)