3 releases (breaking)
Uses old Rust 2015
0.3.0 | Feb 4, 2020 |
---|---|
0.2.0 | Nov 15, 2019 |
0.1.0 | Nov 2, 2019 |
#759 in Text processing
14,963 downloads per month
53KB
1.5K
SLoC
ttaw
talking to a wall, a piecemeal natural language processing library.
A couple caveats
- My implementation's aren't a sure thing 😄 If you encounter anything peculiar or unexpected, please raise an issue ❤️ ❤️
Functionality
-
Determine if two words rhyme using the Double Metaphone phonetic encoding
-
Determine if two words rhyme using CMUdict phonetic encoding
-
Determine if two words alliterate using the Double Metaphone phonetic encoding
-
Determine if two words alliterate using CMUdict phonetic encoding
-
Get the CMUdict phonetic encoding of a word
-
Get the Double Metaphone phonetic encoding of a word (port of words/double-metahone library)
Rhyme
extern crate ttaw;
use ttaw;
// Initialize the CmuDict with a path to the existing serialized CMU dictionary
// or a directoy containing it. If the dictionary doesn't exisit, it will be
// downloaded and serialized at the location specified by the path parameter.
let cmudict = ttaw::cmu::CmuDict::new("cmudict.json").unwrap();
assert_eq!(Ok(true), cmudict.rhyme("far", "tar"));
assert_eq!(Ok(true), ttaw::metaphone::rhyme("far", "tar"));
assert_eq!(Ok(false), cmudict.rhyme("shopping", "cart"));
assert_eq!(Ok(false), ttaw::metaphone::rhyme("shopping", "cart"));
// Deviations in cmu and metaphone
assert_eq!(true, ttaw::metaphone::rhyme("hear", "near"));
assert_eq!(Ok(false), cmudict.rhyme("hear", "near"));
Alliteration
extern crate ttaw;
use ttaw;
// Initialize the CmuDict with a path to the existing serialized CMU dictionary
// or a directoy containing it. If the dictionary doesn't exisit, it will be
// downloaded and serialized at the location specified by the path parameter.
let cmudict = ttaw::cmu::CmuDict::new("cmudict.json").unwrap();
assert_eq!(Ok(true), cmudict.alliteration("bounding","bears"));
assert_eq!(true, ttaw::metaphone::alliteration("bounding","bears"));
assert_eq!(Ok(false), cmudict.alliteration("lazy", "dog"));
assert_eq!(false, ttaw::metaphone::alliteration("lazy", "dog"));
CMUdict
extern crate ttaw;
use ttaw;
// Initialize the CmuDict with a path to the existing serialized CMU dictionary
// or a directoy containing it. If the dictionary doesn't exisit, it will be
// downloaded and serialized at the location specified by the path parameter.
let cmudict = ttaw::cmu::CmuDict::new("cmudict.json").unwrap();
assert_eq!(
cmudict.encoding(("unearthed"),
Ok(Some(vec![vec![
"AH0".to_string(),
"N".to_string(),
"ER1".to_string(),
"TH".to_string(),
"T".to_string()
]]))
);
Double Metaphone
extern crate ttaw;
use ttaw;
assert_eq!(ttaw::metaphone::encoding("Arnow").primary, "ARN");
assert_eq!(ttaw::metaphone::encoding("Arnow").secondary, "ARNF");
assert_eq!(
ttaw::metaphone::encoding("detestable").primary,
"TTSTPL"
);
assert_eq!(
ttaw::metaphone::encoding("detestable").secondary,
"TTSTPL"
);
Dependencies
~24MB
~488K SLoC