23 std::unordered_map<String, StringArray>
findEntity(String text,
24 const std::unordered_map<String, StringArray>& dictionary,
25 float similarityThreshold = 0.9f);
34 StringArray
ngrams(
const StringArray& tokens,
int n = 1);
56 const std::unordered_map<String, StringArray>& dictionary,
57 float similarityThreshold);
NER is a Named Entity Recognition class designed to identify and extract named entities from unstructured text.
Definition NER.h:14
float stringSimilarity(const String &str1, const String &str2)
Compute the similarity between two strings.
Definition NER.cpp:177
int levenshteinDistance(const String &str1, const String &str2)
Compute the Levenshtein distance between strings.
Definition NER.cpp:144
std::unordered_map< String, StringArray > findEntity(String text, const std::unordered_map< String, StringArray > &dictionary, float similarityThreshold=0.9f)
Search the text for named entities held in the dictionary.
Definition NER.cpp:61
std::tuple< float, String, String > getFuzzySimilarity(String text, const std::unordered_map< String, StringArray > &dictionary, float similarityThreshold)
Search for matching named entities using fuzzy string matching.
Definition NER.cpp:38
std::vector< Entity > removeOverlapping(std::vector< Entity > entities)
Remove overlapping entities, keeping the longest.
Definition NER.cpp:5
StringArray ngrams(const StringArray &tokens, int n=1)
Compute n-grams of size n from the given StringArray of tokens.
Definition NER.cpp:128
Definition AirAbsorptionFilter.cpp:2
String name
Definition NER.h:62
int endIndex
Definition NER.h:66
Entity(String name=String(), String category=String(), float score=0.0f, int startIndex=0, int endIndex=0)
Definition NER.h:67
float score
Definition NER.h:64
String category
Definition NER.h:63
int startIndex
Definition NER.h:65