aboutsummaryrefslogtreecommitdiffstats
path: root/model/probabilistic_intent_parser/intent_classifier/featurizer
diff options
context:
space:
mode:
author: Malik Talha <talhamalik727x@gmail.com> 2023-10-22 20:54:58 +0500
committer: Malik Talha <talhamalik727x@gmail.com> 2023-10-22 20:54:58 +0500
commit: 69fcf984b733774336952bcc6f8ad42d796e5a5d (patch)
tree: 14529f2ee5db3725e08b8da2876d38601e6fc8c4 /model/probabilistic_intent_parser/intent_classifier/featurizer
parent: f97f5665a9263cca3609ac8f732e4590a4bf6178 (diff)
Add pre-trained model for Snips
Add a Snips model trained on HVAC Temperature, Fan Speed, and Volume Control intents.

SPEC-4856

Signed-off-by: Malik Talha <talhamalik727x@gmail.com>
Change-Id: I624fa48c059d4fa1a5f2ef07e3af88b3076509f2
Diffstat (limited to 'model/probabilistic_intent_parser/intent_classifier/featurizer')
-rw-r--r-- model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json 22
-rw-r--r-- model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json 3
-rw-r--r-- model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json 3
-rw-r--r-- model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json 231
4 files changed, 259 insertions, 0 deletions
diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json
new file mode 100644
index 0000000..d75a5e2
--- /dev/null
+++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json
@@ -0,0 +1,22 @@
+{
+ "config": {
+ "added_cooccurrence_feature_ratio": 0.0,
+ "cooccurrence_vectorizer_config": {
+ "filter_stop_words": true,
+ "keep_order": true,
+ "unit_name": "cooccurrence_vectorizer",
+ "unknown_words_replacement_string": null,
+ "window_size": null
+ },
+ "pvalue_threshold": 0.4,
+ "tfidf_vectorizer_config": {
+ "unit_name": "tfidf_vectorizer",
+ "use_stemming": false,
+ "word_clusters_name": null
+ },
+ "unit_name": "featurizer"
+ },
+ "cooccurrence_vectorizer": null,
+ "language_code": "en",
+ "tfidf_vectorizer": "tfidf_vectorizer"
+} \ No newline at end of file
diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json
new file mode 100644
index 0000000..7cfe779
--- /dev/null
+++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json
@@ -0,0 +1,3 @@
+{
+ "unit_name": "featurizer"
+} \ No newline at end of file
diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json
new file mode 100644
index 0000000..ea6fa93
--- /dev/null
+++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json
@@ -0,0 +1,3 @@
+{
+ "unit_name": "tfidf_vectorizer"
+} \ No newline at end of file
diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json
new file mode 100644
index 0000000..ddd3858
--- /dev/null
+++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json
@@ -0,0 +1,231 @@
+{
+ "builtin_entity_scope": [],
+ "config": {
+ "unit_name": "tfidf_vectorizer",
+ "use_stemming": false,
+ "word_clusters_name": null
+ },
+ "language_code": "en",
+ "vectorizer": {
+ "idf_diag": [
+ 5.945207488773801,
+ 5.945207488773801,
+ 5.945207488773801,
+ 5.945207488773801,
+ 5.539742380665636,
+ 5.945207488773801,
+ 5.945207488773801,
+ 5.945207488773801,
+ 5.945207488773801,
+ 2.7671536584258547,
+ 4.441130091997526,
+ 5.539742380665636,
+ 5.2520603082138555,
+ 3.693915690167305,
+ 5.028916756899646,
+ 3.9992973397184874,
+ 5.539742380665636,
+ 4.846595200105691,
+ 4.692444520278432,
+ 5.539742380665636,
+ 3.1726187665340193,
+ 3.693915690167305,
+ 5.028916756899646,
+ 4.1534480195457455,
+ 4.3357695763397,
+ 5.539742380665636,
+ 5.945207488773801,
+ 5.945207488773801,
+ 5.539742380665636,
+ 4.240459396535375,
+ 5.2520603082138555,
+ 4.441130091997526,
+ 3.2371572876715904,
+ 5.539742380665636,
+ 4.3357695763397,
+ 5.945207488773801,
+ 5.028916756899646,
+ 2.0636436908303626,
+ 1.9843943191762223,
+ 2.4336620499427797,
+ 2.334289576129576,
+ 2.172446550679162,
+ 4.558913127653909,
+ 3.2043674648485996,
+ 5.2520603082138555,
+ 4.692444520278432,
+ 5.539742380665636,
+ 5.2520603082138555,
+ 5.945207488773801,
+ 5.945207488773801,
+ 4.558913127653909,
+ 5.945207488773801,
+ 3.502860453404596,
+ 4.441130091997526,
+ 5.2520603082138555,
+ 3.502860453404596,
+ 4.558913127653909,
+ 5.945207488773801,
+ 4.240459396535375,
+ 5.028916756899646,
+ 5.2520603082138555,
+ 4.558913127653909,
+ 4.558913127653909,
+ 5.945207488773801,
+ 5.945207488773801,
+ 5.2520603082138555,
+ 5.945207488773801,
+ 4.692444520278432,
+ 5.2520603082138555,
+ 3.2043674648485996,
+ 3.8657659470939647,
+ 5.539742380665636,
+ 5.945207488773801,
+ 3.502860453404596,
+ 4.692444520278432,
+ 5.539742380665636,
+ 5.539742380665636,
+ 4.3357695763397,
+ 4.558913127653909,
+ 5.945207488773801,
+ 4.441130091997526,
+ 4.692444520278432,
+ 4.846595200105691,
+ 4.558913127653909,
+ 5.945207488773801,
+ 5.539742380665636,
+ 4.240459396535375,
+ 3.4603008389858,
+ 5.539742380665636,
+ 3.502860453404596,
+ 1.6755100390738384,
+ 5.539742380665636,
+ 4.692444520278432,
+ 5.028916756899646,
+ 2.854165035415485,
+ 5.2520603082138555,
+ 5.945207488773801,
+ 4.558913127653909,
+ 5.945207488773801,
+ 4.3357695763397,
+ 4.240459396535375,
+ 5.945207488773801,
+ 3.693915690167305,
+ 4.692444520278432,
+ 5.2520603082138555,
+ 5.945207488773801,
+ 4.692444520278432,
+ 3.2710588393472717
+ ],
+ "vocab": {
+ "19": 0,
+ "41": 1,
+ "51": 2,
+ "52": 3,
+ "58": 4,
+ "60": 5,
+ "76": 6,
+ "81": 7,
+ "94": 8,
+ "a": 9,
+ "adjust": 10,
+ "airflow": 11,
+ "amp": 12,
+ "and": 13,
+ "back": 14,
+ "bit": 15,
+ "blower": 16,
+ "boost": 17,
+ "boosting": 18,
+ "breezy": 19,
+ "by": 20,
+ "can": 21,
+ "cars": 22,
+ "celsius": 23,
+ "change": 24,
+ "circulation": 25,
+ "cold": 26,
+ "colder": 27,
+ "cool": 28,
+ "could": 29,
+ "crank": 30,
+ "decrease": 31,
+ "degrees": 32,
+ "dial": 33,
+ "down": 34,
+ "eight": 35,
+ "eighty": 36,
+ "entityfeaturehvac_fan_speed_action": 37,
+ "entityfeaturehvac_temperature_action": 38,
+ "entityfeaturenumeric_value": 39,
+ "entityfeatureto_or_by": 40,
+ "entityfeaturevolume_control_action": 41,
+ "fahrenheit": 42,
+ "fan": 43,
+ "fans": 44,
+ "fifty": 45,
+ "five": 46,
+ "four": 47,
+ "fully": 48,
+ "heat": 49,
+ "hey": 50,
+ "hot": 51,
+ "i": 52,
+ "increase": 53,
+ "intensity": 54,
+ "it": 55,
+ "its": 56,
+ "just": 57,
+ "lets": 58,
+ "little": 59,
+ "louder": 60,
+ "lower": 61,
+ "make": 62,
+ "max": 63,
+ "maybe": 64,
+ "need": 65,
+ "nineteen": 66,
+ "ninety": 67,
+ "notch": 68,
+ "of": 69,
+ "percent": 70,
+ "performance": 71,
+ "place": 72,
+ "please": 73,
+ "power": 74,
+ "quarters": 75,
+ "quieter": 76,
+ "raise": 77,
+ "reduce": 78,
+ "room": 79,
+ "set": 80,
+ "seven": 81,
+ "seventy": 82,
+ "six": 83,
+ "slightly": 84,
+ "slow": 85,
+ "sound": 86,
+ "speed": 87,
+ "tad": 88,
+ "temperature": 89,
+ "the": 90,
+ "thermostat": 91,
+ "thirty": 92,
+ "three": 93,
+ "to": 94,
+ "too": 95,
+ "touch": 96,
+ "turn": 97,
+ "twenty": 98,
+ "two": 99,
+ "up": 100,
+ "ventilation": 101,
+ "volume": 102,
+ "want": 103,
+ "warmer": 104,
+ "warmth": 105,
+ "would": 106,
+ "you": 107
+ }
+ }
+} \ No newline at end of file