diff options
author | 2023-10-22 20:54:58 +0500 | |
---|---|---|
committer | 2023-10-22 20:54:58 +0500 | |
commit | 69fcf984b733774336952bcc6f8ad42d796e5a5d (patch) | |
tree | 14529f2ee5db3725e08b8da2876d38601e6fc8c4 /model/probabilistic_intent_parser/intent_classifier/featurizer | |
parent | f97f5665a9263cca3609ac8f732e4590a4bf6178 (diff) |
Add pre-trained model for Snips
Add a Snips model trained on HVAC Temperature, Fan Speed,
and Volume Control intents.
SPEC-4856
Signed-off-by: Malik Talha <talhamalik727x@gmail.com>
Change-Id: I624fa48c059d4fa1a5f2ef07e3af88b3076509f2
Diffstat (limited to 'model/probabilistic_intent_parser/intent_classifier/featurizer')
4 files changed, 259 insertions, 0 deletions
diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json new file mode 100644 index 0000000..d75a5e2 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json @@ -0,0 +1,22 @@ +{ + "config": { + "added_cooccurrence_feature_ratio": 0.0, + "cooccurrence_vectorizer_config": { + "filter_stop_words": true, + "keep_order": true, + "unit_name": "cooccurrence_vectorizer", + "unknown_words_replacement_string": null, + "window_size": null + }, + "pvalue_threshold": 0.4, + "tfidf_vectorizer_config": { + "unit_name": "tfidf_vectorizer", + "use_stemming": false, + "word_clusters_name": null + }, + "unit_name": "featurizer" + }, + "cooccurrence_vectorizer": null, + "language_code": "en", + "tfidf_vectorizer": "tfidf_vectorizer" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json new file mode 100644 index 0000000..7cfe779 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "featurizer" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json new file mode 100644 index 0000000..ea6fa93 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "tfidf_vectorizer" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json new file mode 100644 index 0000000..ddd3858 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json @@ -0,0 +1,231 @@ +{ + "builtin_entity_scope": [], + "config": { + "unit_name": "tfidf_vectorizer", + "use_stemming": false, + "word_clusters_name": null + }, + "language_code": "en", + "vectorizer": { + "idf_diag": [ + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 5.539742380665636, + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 2.7671536584258547, + 4.441130091997526, + 5.539742380665636, + 5.2520603082138555, + 3.693915690167305, + 5.028916756899646, + 3.9992973397184874, + 5.539742380665636, + 4.846595200105691, + 4.692444520278432, + 5.539742380665636, + 3.1726187665340193, + 3.693915690167305, + 5.028916756899646, + 4.1534480195457455, + 4.3357695763397, + 5.539742380665636, + 5.945207488773801, + 5.945207488773801, + 5.539742380665636, + 4.240459396535375, + 5.2520603082138555, + 4.441130091997526, + 3.2371572876715904, + 5.539742380665636, + 4.3357695763397, + 5.945207488773801, + 5.028916756899646, + 2.0636436908303626, + 1.9843943191762223, + 2.4336620499427797, + 2.334289576129576, + 2.172446550679162, + 4.558913127653909, + 3.2043674648485996, + 5.2520603082138555, + 4.692444520278432, + 5.539742380665636, + 5.2520603082138555, + 5.945207488773801, + 5.945207488773801, + 4.558913127653909, + 5.945207488773801, + 3.502860453404596, + 4.441130091997526, + 5.2520603082138555, + 3.502860453404596, + 4.558913127653909, + 5.945207488773801, + 4.240459396535375, + 5.028916756899646, + 5.2520603082138555, + 4.558913127653909, + 4.558913127653909, + 5.945207488773801, + 5.945207488773801, + 5.2520603082138555, + 5.945207488773801, + 4.692444520278432, + 5.2520603082138555, + 3.2043674648485996, + 3.8657659470939647, + 5.539742380665636, + 5.945207488773801, + 3.502860453404596, + 4.692444520278432, + 5.539742380665636, + 5.539742380665636, + 4.3357695763397, + 4.558913127653909, + 5.945207488773801, + 4.441130091997526, + 4.692444520278432, + 4.846595200105691, + 4.558913127653909, + 5.945207488773801, + 5.539742380665636, + 4.240459396535375, + 3.4603008389858, + 5.539742380665636, + 3.502860453404596, + 1.6755100390738384, + 5.539742380665636, + 4.692444520278432, + 5.028916756899646, + 2.854165035415485, + 5.2520603082138555, + 5.945207488773801, + 4.558913127653909, + 5.945207488773801, + 4.3357695763397, + 4.240459396535375, + 5.945207488773801, + 3.693915690167305, + 4.692444520278432, + 5.2520603082138555, + 5.945207488773801, + 4.692444520278432, + 3.2710588393472717 + ], + "vocab": { + "19": 0, + "41": 1, + "51": 2, + "52": 3, + "58": 4, + "60": 5, + "76": 6, + "81": 7, + "94": 8, + "a": 9, + "adjust": 10, + "airflow": 11, + "amp": 12, + "and": 13, + "back": 14, + "bit": 15, + "blower": 16, + "boost": 17, + "boosting": 18, + "breezy": 19, + "by": 20, + "can": 21, + "cars": 22, + "celsius": 23, + "change": 24, + "circulation": 25, + "cold": 26, + "colder": 27, + "cool": 28, + "could": 29, + "crank": 30, + "decrease": 31, + "degrees": 32, + "dial": 33, + "down": 34, + "eight": 35, + "eighty": 36, + "entityfeaturehvac_fan_speed_action": 37, + "entityfeaturehvac_temperature_action": 38, + "entityfeaturenumeric_value": 39, + "entityfeatureto_or_by": 40, + "entityfeaturevolume_control_action": 41, + "fahrenheit": 42, + "fan": 43, + "fans": 44, + "fifty": 45, + "five": 46, + "four": 47, + "fully": 48, + "heat": 49, + "hey": 50, + "hot": 51, + "i": 52, + "increase": 53, + "intensity": 54, + "it": 55, + "its": 56, + "just": 57, + "lets": 58, + "little": 59, + "louder": 60, + "lower": 61, + "make": 62, + "max": 63, + "maybe": 64, + "need": 65, + "nineteen": 66, + "ninety": 67, + "notch": 68, + "of": 69, + "percent": 70, + "performance": 71, + "place": 72, + "please": 73, + "power": 74, + "quarters": 75, + "quieter": 76, + "raise": 77, + "reduce": 78, + "room": 79, + "set": 80, + "seven": 81, + "seventy": 82, + "six": 83, + "slightly": 84, + "slow": 85, + "sound": 86, + "speed": 87, + "tad": 88, + "temperature": 89, + "the": 90, + "thermostat": 91, + "thirty": 92, + "three": 93, + "to": 94, + "too": 95, + "touch": 96, + "turn": 97, + "twenty": 98, + "two": 99, + "up": 100, + "ventilation": 101, + "volume": 102, + "want": 103, + "warmer": 104, + "warmth": 105, + "would": 106, + "you": 107 + } + } +}
\ No newline at end of file |