1 unstable release
0.1.0 | May 17, 2022 |
---|
#6 in #diacritics
4KB
lib.rs
:
Lightweight library for removing Hebrew diacritics ("Niqqud", Hebrew: נִקּוּד) from a string.
Reference (Unicode code chart for the Hebrew block, U+0590–U+05FF): https://www.unicode.org/charts/PDF/U0590.pdf
Examples
let diacrited_quoted = "״שָׁלוֹם עוֹלָם״";
// Remove only the diacritics (keep '״' chars)
let quoted = niqqud::remove(diacrited_quoted);
assert_eq!("״שלום עולם״", quoted);
// Remove diacritics and Hebrew quotes (double '״' and single '׳')
let unquoted = niqqud::remove_thorough(diacrited_quoted);
assert_eq!("שלום עולם", unquoted);