diff options
author | Malik Talha <talhamalik727x@gmail.com> | 2023-10-22 20:54:58 +0500 |
---|---|---|
committer | Malik Talha <talhamalik727x@gmail.com> | 2023-10-22 20:54:58 +0500 |
commit | 69fcf984b733774336952bcc6f8ad42d796e5a5d (patch) | |
tree | 14529f2ee5db3725e08b8da2876d38601e6fc8c4 /model/probabilistic_intent_parser | |
parent | f97f5665a9263cca3609ac8f732e4590a4bf6178 (diff) |
Add pre-trained model for Snips
Add a Snips model trained on HVAC Temperature, Fan Speed,
and Volume Control intents.
SPEC-4856
Signed-off-by: Malik Talha <talhamalik727x@gmail.com>
Change-Id: I624fa48c059d4fa1a5f2ef07e3af88b3076509f2
Diffstat (limited to 'model/probabilistic_intent_parser')
17 files changed, 1526 insertions, 0 deletions
diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json new file mode 100644 index 0000000..d75a5e2 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/featurizer.json @@ -0,0 +1,22 @@ +{ + "config": { + "added_cooccurrence_feature_ratio": 0.0, + "cooccurrence_vectorizer_config": { + "filter_stop_words": true, + "keep_order": true, + "unit_name": "cooccurrence_vectorizer", + "unknown_words_replacement_string": null, + "window_size": null + }, + "pvalue_threshold": 0.4, + "tfidf_vectorizer_config": { + "unit_name": "tfidf_vectorizer", + "use_stemming": false, + "word_clusters_name": null + }, + "unit_name": "featurizer" + }, + "cooccurrence_vectorizer": null, + "language_code": "en", + "tfidf_vectorizer": "tfidf_vectorizer" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json new file mode 100644 index 0000000..7cfe779 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "featurizer" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json new file mode 100644 index 0000000..ea6fa93 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "tfidf_vectorizer" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json new file mode 100644 index 0000000..ddd3858 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/featurizer/tfidf_vectorizer/vectorizer.json @@ -0,0 +1,231 @@ +{ + "builtin_entity_scope": [], + "config": { + "unit_name": "tfidf_vectorizer", + "use_stemming": false, + "word_clusters_name": null + }, + "language_code": "en", + "vectorizer": { + "idf_diag": [ + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 5.539742380665636, + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 5.945207488773801, + 2.7671536584258547, + 4.441130091997526, + 5.539742380665636, + 5.2520603082138555, + 3.693915690167305, + 5.028916756899646, + 3.9992973397184874, + 5.539742380665636, + 4.846595200105691, + 4.692444520278432, + 5.539742380665636, + 3.1726187665340193, + 3.693915690167305, + 5.028916756899646, + 4.1534480195457455, + 4.3357695763397, + 5.539742380665636, + 5.945207488773801, + 5.945207488773801, + 5.539742380665636, + 4.240459396535375, + 5.2520603082138555, + 4.441130091997526, + 3.2371572876715904, + 5.539742380665636, + 4.3357695763397, + 5.945207488773801, + 5.028916756899646, + 2.0636436908303626, + 1.9843943191762223, + 2.4336620499427797, + 2.334289576129576, + 2.172446550679162, + 4.558913127653909, + 3.2043674648485996, + 5.2520603082138555, + 4.692444520278432, + 5.539742380665636, + 5.2520603082138555, + 5.945207488773801, + 5.945207488773801, + 4.558913127653909, + 5.945207488773801, + 3.502860453404596, + 4.441130091997526, + 5.2520603082138555, + 3.502860453404596, + 4.558913127653909, + 5.945207488773801, + 4.240459396535375, + 5.028916756899646, + 5.2520603082138555, + 4.558913127653909, + 4.558913127653909, + 5.945207488773801, + 5.945207488773801, + 5.2520603082138555, + 5.945207488773801, + 4.692444520278432, + 5.2520603082138555, + 3.2043674648485996, + 3.8657659470939647, + 5.539742380665636, + 5.945207488773801, + 3.502860453404596, + 4.692444520278432, + 5.539742380665636, + 5.539742380665636, + 4.3357695763397, + 4.558913127653909, + 5.945207488773801, + 4.441130091997526, + 4.692444520278432, + 4.846595200105691, + 4.558913127653909, + 5.945207488773801, + 5.539742380665636, + 4.240459396535375, + 3.4603008389858, + 5.539742380665636, + 3.502860453404596, + 1.6755100390738384, + 5.539742380665636, + 4.692444520278432, + 5.028916756899646, + 2.854165035415485, + 5.2520603082138555, + 5.945207488773801, + 4.558913127653909, + 5.945207488773801, + 4.3357695763397, + 4.240459396535375, + 5.945207488773801, + 3.693915690167305, + 4.692444520278432, + 5.2520603082138555, + 5.945207488773801, + 4.692444520278432, + 3.2710588393472717 + ], + "vocab": { + "19": 0, + "41": 1, + "51": 2, + "52": 3, + "58": 4, + "60": 5, + "76": 6, + "81": 7, + "94": 8, + "a": 9, + "adjust": 10, + "airflow": 11, + "amp": 12, + "and": 13, + "back": 14, + "bit": 15, + "blower": 16, + "boost": 17, + "boosting": 18, + "breezy": 19, + "by": 20, + "can": 21, + "cars": 22, + "celsius": 23, + "change": 24, + "circulation": 25, + "cold": 26, + "colder": 27, + "cool": 28, + "could": 29, + "crank": 30, + "decrease": 31, + "degrees": 32, + "dial": 33, + "down": 34, + "eight": 35, + "eighty": 36, + "entityfeaturehvac_fan_speed_action": 37, + "entityfeaturehvac_temperature_action": 38, + "entityfeaturenumeric_value": 39, + "entityfeatureto_or_by": 40, + "entityfeaturevolume_control_action": 41, + "fahrenheit": 42, + "fan": 43, + "fans": 44, + "fifty": 45, + "five": 46, + "four": 47, + "fully": 48, + "heat": 49, + "hey": 50, + "hot": 51, + "i": 52, + "increase": 53, + "intensity": 54, + "it": 55, + "its": 56, + "just": 57, + "lets": 58, + "little": 59, + "louder": 60, + "lower": 61, + "make": 62, + "max": 63, + "maybe": 64, + "need": 65, + "nineteen": 66, + "ninety": 67, + "notch": 68, + "of": 69, + "percent": 70, + "performance": 71, + "place": 72, + "please": 73, + "power": 74, + "quarters": 75, + "quieter": 76, + "raise": 77, + "reduce": 78, + "room": 79, + "set": 80, + "seven": 81, + "seventy": 82, + "six": 83, + "slightly": 84, + "slow": 85, + "sound": 86, + "speed": 87, + "tad": 88, + "temperature": 89, + "the": 90, + "thermostat": 91, + "thirty": 92, + "three": 93, + "to": 94, + "too": 95, + "touch": 96, + "turn": 97, + "twenty": 98, + "two": 99, + "up": 100, + "ventilation": 101, + "volume": 102, + "want": 103, + "warmer": 104, + "warmth": 105, + "would": 106, + "you": 107 + } + } +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/intent_classifier.json b/model/probabilistic_intent_parser/intent_classifier/intent_classifier.json new file mode 100644 index 0000000..99b9b43 --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/intent_classifier.json @@ -0,0 +1,487 @@ +{ + "coeffs": [ + [ + -0.1944949449301576, + -0.1709338192954452, + -0.14643812047639607, + -0.19155332343920425, + -0.26203322806132484, + -0.06998595404922413, + -0.04616537127036657, + -0.09593063108159781, + 0.2670801970940651, + -0.7298972094796787, + 1.1659021913188135, + 1.7720959799070886, + 1.9152793569447697, + -1.4696163121979995, + 0.844395355117868, + 0.5986654133092939, + 1.3286721862827426, + 0.4202051337048011, + 1.8605029993612292, + 0.4864392153709908, + -0.1850026065080545, + 0.8315065579668949, + -0.4071500143626975, + -0.6911096635942332, + 0.33280464670368676, + 0.6895857907703777, + -0.33975347056860383, + -0.03409610336971599, + -0.1830205262812737, + -0.18959221713492214, + 0.8863962066067318, + 0.06351256100095176, + -1.9265904348973653, + 0.4031686676411473, + 0.20750138598813397, + -0.11880557452018371, + -0.551474327699674, + 2.8802191640954495, + 1.3603631129630487, + -0.7488685456543981, + -0.887369753407331, + 1.2416104378407142, + -0.6426741128019834, + 6.090534677887493, + 2.051176967856325, + 0.04897224563640065, + -0.5042980260523056, + -0.29850146748587314, + -0.2065434866677535, + -0.04002489365435418, + 0.5406886147155344, + -0.15356240192823065, + 0.25376821068531363, + -0.30572033754692146, + 1.7562240056899052, + 0.15126443772552664, + 1.6638008729301035, + -0.07372959362232727, + 2.932710325008, + 1.4239481274944663, + -0.46789548560291827, + 0.31995310111072084, + -1.3492128438591617, + -0.12568501546613994, + -0.06998595404922413, + 1.7679849531700071, + -0.21155141956582602, + -0.3088181546815536, + 0.956077467622598, + -1.9114985317889572, + 1.229239065917747, + 0.9249469840479404, + -0.3498944896366811, + 0.6503093350916289, + 0.85981654702734, + 0.5197910668573862, + -0.46524667806075454, + 0.375233322684959, + 0.7205348268191379, + -0.09593063108159781, + -0.7997164507929231, + -0.026335878116654075, + -0.5427886279639856, + 0.2551556850123977, + -0.40450344187720044, + 0.708709387300732, + -2.1052525890518363, + 4.7731182137937385, + 0.3827988890934132, + -1.6931132062614114, + -1.8036556963730381, + -0.2804552388335083, + -0.1652470817695098, + 0.44514380577026275, + -0.9185652404792951, + 0.3255194621979477, + -0.07372959362232727, + 0.020183885272701797, + -0.05895361676374134, + -1.000175188982346, + 1.1758401718339109, + 0.9496473146457145, + -2.8253317944196823, + 0.9097819033258351, + -0.13074043514374561, + -0.1416950074360412, + 1.6868101184990176, + -0.3008520671626627 + ], + [ + 0.39070411072369365, + -0.2103151585229938, + 0.7988194021633298, + -0.1752420388174099, + 0.5359507584882811, + 0.7428763997929889, + 0.158855764775961, + 0.2233411968906852, + -0.07370269321628466, + -1.8353538915479386, + -0.24029799505652064, + -0.28662267645598494, + -0.3595115590220648, + -1.4249662264232048, + 0.11414120061471919, + 0.6253185197288007, + -0.2993603475100838, + 0.6557637418838415, + 0.3557014021981265, + -0.15358862121789965, + 0.3548887422294314, + -0.15059374956989222, + 1.5206949602597781, + 2.6928307913975673, + 0.08170193267068891, + -0.14869989550318333, + 0.4508426407687237, + 0.1707324925480857, + 0.8886483462270193, + -0.340606576471467, + -0.38710229891410747, + 0.44320048583521526, + 7.196444715206654, + -0.2916192200060449, + 0.21640722331701634, + 0.45040301271625116, + 0.9377763049112277, + 0.8755178498002804, + 0.8196061708389681, + 1.5703298809444148, + 0.042469682467589566, + 0.2521622290502533, + 2.2729408186528097, + -1.700989160194387, + -0.4170959874909554, + 0.2167315857669742, + 0.7867573286977338, + 0.21162593666759807, + -0.17343424391911377, + 0.14752130265412475, + -0.8154556074367001, + 0.35069944086042243, + -1.324150568310463, + -0.6866034300206799, + -0.2935693407558982, + -1.0602676540273166, + -0.008528396235158536, + -0.07722958177613383, + 0.017356583477958265, + -0.321385951211114, + -0.23155135203451066, + 0.5110182231127964, + 0.06205537096880271, + 0.3442555505181098, + 0.7428763997929889, + -0.22909500623352944, + -0.16504042772830033, + 0.3303233868986131, + -0.3757524399605448, + -2.014770165348239, + -1.1481428689082491, + -0.31018813997890854, + 0.9788137882293648, + -0.35081262993291046, + -0.6948026076004692, + -0.14819138439352864, + -0.16781881301697193, + 0.6394955144239772, + -0.13242339035433284, + 0.2233411968906852, + -0.18916092326450623, + 0.30974673539675396, + 1.2905678974554733, + 0.8320047276962229, + -0.11020113224991683, + -0.18016743766145368, + -1.448445553920027, + -1.4810766380709515, + -0.25049837150446247, + 5.344480236722493, + -1.7977164071838685, + 1.2292488846986476, + 0.8556173004283408, + -0.36730614081727125, + -0.26733833583392214, + 0.1641989880763703, + -0.07722958177613383, + -0.06562764593404344, + 0.24183362545327178, + -0.08261514995386539, + 0.18092959776267203, + -0.28158672716472694, + -1.7142914600779355, + 0.1503396968334292, + 0.8915786935223018, + 0.827469912009148, + -0.4147546405943871, + -0.5545769283716919 + ], + [ + -0.17325949904557789, + 0.8469931420801717, + -0.17291345747016895, + 0.7415838862619261, + 0.4274229742431583, + -0.09169997501324818, + -0.03597382792706312, + -0.13192135575319, + -0.2232770261032077, + -0.5592833175250984, + 0.5337511339882469, + -0.7015203611158959, + -0.8050378425269331, + -1.391476008727117, + -0.3735367392593157, + 2.0229440028156285, + -0.4181439506999733, + -0.36284605476876275, + -0.4915128191910597, + -0.18772225278575058, + -0.1836211986385558, + -0.160170732625766, + -0.6051851028858776, + -1.0565838516982902, + 0.5189958389469236, + -0.21433651619833852, + -0.023427702566669335, + -0.06225802709330549, + -0.2479768365131114, + 0.6440642269943153, + 0.2166100015163753, + 0.5621214112752978, + -2.313937425413541, + -0.21383821821874424, + 0.9835776683215183, + -0.2868222554936089, + -0.3627790090966197, + 1.6715362856528764, + 0.562618698865241, + 0.5171144296225592, + -0.2875537588133474, + 3.7650951394831975, + -0.8430120071606295, + -2.9135485020163494, + -0.7732932028803183, + 0.5932157539375889, + -0.2654507724150584, + 0.48514783195537947, + 0.7791418129403005, + -0.04756567767655289, + -0.9235484068748897, + -0.09163744841391439, + -0.6668721180230781, + -0.06321633127931364, + -0.6917289046302094, + -0.1305307192739786, + -1.1611593110986207, + 0.5263090658353216, + -1.4746064278386666, + 0.9460179482446475, + 2.4559982942328866, + 0.47805946230351637, + 1.1885114249751079, + -0.16691223659534524, + -0.09169997501324818, + -0.3949458468417482, + 0.474115087649099, + 1.25941806477877, + 0.15775963405235455, + -1.8365325489417232, + 1.928737362375423, + -0.3042033412226444, + -0.13268872031822843, + 0.5825827594443002, + -0.7819548619354546, + -0.3715523694687792, + 1.11683978664795, + 0.6406233034386648, + 0.8966843996933499, + -0.13192135575319, + 0.0660616293488582, + 1.3349408184184337, + -0.39160770131537814, + 0.0035731969209047464, + 1.2860627823141233, + -0.38361195906555495, + 3.785997345890054, + -2.6370503870308153, + 1.5173096973089502, + -1.7959354415295845, + -1.343767356940433, + -0.34777521277572043, + 1.3770803738799031, + 0.8465636489321146, + -0.18640547635945673, + -0.2589272346446866, + 0.5263090658353216, + 0.7753397260785132, + -0.08233430114481251, + -1.0755682097425807, + 0.08747829557375957, + -0.40249375179638763, + 6.545271985656959, + 1.6846671518257648, + -0.3048123502498132, + -0.23150009268290092, + 0.2660331927407965, + 0.3908591521610277 + ], + [ + -0.08287008635301533, + -0.1707186300864661, + -0.12411651496367082, + -0.13270980721857845, + -0.2308574863622476, + -0.340776333289237, + -0.2799539501495442, + -0.09353490554395046, + -0.11003196602952028, + 0.8370329970945711, + -0.9057550121088088, + -0.44699057472930825, + -0.5638365474312759, + 1.5143809843780474, + -0.7058026613700651, + -1.5992446723775544, + -0.39548545877201235, + -0.5818138768809792, + -1.1918930105665881, + -0.20119295958315825, + -0.4106024666342698, + -0.6084017910626903, + -0.4053078456262127, + -1.2701652804160122, + -0.9082937192503221, + -0.41358650963042953, + -0.14507759075384705, + -0.25541322585710685, + -0.2834804666647943, + -0.35866596133820716, + -0.4883764320145827, + -0.7006698082266908, + -2.394669342089395, + -0.18631140125245332, + -0.8431834537195231, + -0.11298527662620045, + -0.46579176626926616, + -4.0614990005298495, + -3.2045951451142787, + -1.5108427566999016, + 0.004582928152167648, + -3.9044112386784877, + -0.6588826838562699, + -2.3102211611673735, + -0.6601615139051208, + -0.5798142278897691, + -0.16935515654474664, + -0.2994100797642838, + -0.13545535197391778, + -0.28214898970349794, + 0.07498510488180002, + -0.09906076894705139, + 0.3030837833573295, + 0.1750985085211981, + -0.549252376368689, + 0.19508025476427163, + -0.680325815274731, + -0.441542891929835, + -1.1986281021735854, + -1.2750417431062337, + -1.3332940190069578, + -0.6893972025209948, + -0.1977405184178932, + -0.08290274818842105, + -0.340776333289237, + -0.7441344382438827, + -0.11203102845288844, + -0.7110498382506533, + -0.4371808188047473, + 2.1062550992856974, + -1.2673967495828176, + -0.4547516653443288, + -0.07847727400663201, + -1.2025943363863212, + -0.18833967483902414, + -0.22494114094975098, + -0.496679271117596, + -0.9206374373470854, + -0.8795489026728613, + -0.09353490554395046, + 0.2645294880545335, + -0.8676466201790525, + -0.5294129510334283, + -0.7650069149680953, + -0.20093881100566283, + -0.25427142474416814, + -0.5720789301099184, + -1.5271844756130357, + -0.5885493969076697, + -2.011108297941673, + 1.2077089211008882, + -0.2762513025220224, + -0.7261332226437589, + -0.5449319964956103, + 0.3749915728825021, + -0.2782562410203223, + -0.441542891929835, + -0.7834555744093303, + -0.14867935969258925, + 0.7397541876426704, + -0.9776516885496953, + -0.22530286398490842, + -1.9790005442385892, + -0.9860056472866394, + -0.7413541914609503, + -0.18411241931805505, + -0.6485578833987582, + -0.25343404875508874 + ] + ], + "config": { + "data_augmentation_config": { + "add_builtin_entities_examples": false, + "max_unknown_words": null, + "min_utterances": 20, + "noise_factor": 5, + "unknown_word_prob": 0.0, + "unknown_words_replacement_string": null + }, + "featurizer_config": { + "added_cooccurrence_feature_ratio": 0.0, + "cooccurrence_vectorizer_config": { + "filter_stop_words": true, + "keep_order": true, + "unit_name": "cooccurrence_vectorizer", + "unknown_words_replacement_string": null, + "window_size": null + }, + "pvalue_threshold": 0.4, + "tfidf_vectorizer_config": { + "unit_name": "tfidf_vectorizer", + "use_stemming": false, + "word_clusters_name": null + }, + "unit_name": "featurizer" + }, + "noise_reweight_factor": 1, + "unit_name": "log_reg_intent_classifier" + }, + "featurizer": "featurizer", + "intent_list": [ + "HVACFanSpeed", + "HVACTemperature", + "VolumeControl", + null + ], + "intercept": [ + -2.0426926790934385, + -2.0967218978636635, + -2.263067120777316, + 1.0460915926972372 + ], + "t_": 7281.0 +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_classifier/metadata.json b/model/probabilistic_intent_parser/intent_classifier/metadata.json new file mode 100644 index 0000000..0c890bd --- /dev/null +++ b/model/probabilistic_intent_parser/intent_classifier/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "log_reg_intent_classifier" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/intent_parser.json b/model/probabilistic_intent_parser/intent_parser.json new file mode 100644 index 0000000..b86c94a --- /dev/null +++ b/model/probabilistic_intent_parser/intent_parser.json @@ -0,0 +1,201 @@ +{ + "config": { + "intent_classifier_config": { + "data_augmentation_config": { + "add_builtin_entities_examples": false, + "max_unknown_words": null, + "min_utterances": 20, + "noise_factor": 5, + "unknown_word_prob": 0.0, + "unknown_words_replacement_string": null + }, + "featurizer_config": { + "added_cooccurrence_feature_ratio": 0.0, + "cooccurrence_vectorizer_config": { + "filter_stop_words": true, + "keep_order": true, + "unit_name": "cooccurrence_vectorizer", + "unknown_words_replacement_string": null, + "window_size": null + }, + "pvalue_threshold": 0.4, + "tfidf_vectorizer_config": { + "unit_name": "tfidf_vectorizer", + "use_stemming": false, + "word_clusters_name": null + }, + "unit_name": "featurizer" + }, + "noise_reweight_factor": 1, + "unit_name": "log_reg_intent_classifier" + }, + "slot_filler_config": { + "crf_args": { + "algorithm": "lbfgs", + "c1": 0.1, + "c2": 0.1 + }, + "data_augmentation_config": { + "add_builtin_entities_examples": true, + "capitalization_ratio": 0.2, + "min_utterances": 200 + }, + "feature_factory_configs": [ + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "n": 1, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + -1, + 0, + 1, + 2 + ] + }, + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "n": 2, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_digit", + "offsets": [ + -1, + 0, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_first", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": {}, + "factory_name": "is_last", + "offsets": [ + 0, + 1, + 2 + ] + }, + { + "args": { + "n": 1 + }, + "factory_name": "shape_ngram", + "offsets": [ + 0 + ] + }, + { + "args": { + "n": 2 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1, + 0 + ] + }, + { + "args": { + "n": 3 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1 + ] + }, + { + "args": { + "entity_filter": { + "automatically_extensible": false + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "entity_filter": { + "automatically_extensible": true + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "drop_out": 0.5, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "tagging_scheme_code": 1 + }, + "factory_name": "builtin_entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "cluster_name": "brown_clusters", + "use_stemming": false + }, + "factory_name": "word_cluster", + "offsets": [ + -2, + -1, + 0, + 1 + ] + } + ], + "tagging_scheme": 1, + "unit_name": "crf_slot_filler" + }, + "unit_name": "probabilistic_intent_parser" + }, + "slot_fillers": [ + { + "intent": "HVACFanSpeed", + "slot_filler_name": "slot_filler_0" + }, + { + "intent": "HVACTemperature", + "slot_filler_name": "slot_filler_1" + }, + { + "intent": "VolumeControl", + "slot_filler_name": "slot_filler_2" + } + ] +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/metadata.json b/model/probabilistic_intent_parser/metadata.json new file mode 100644 index 0000000..59777ca --- /dev/null +++ b/model/probabilistic_intent_parser/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "probabilistic_intent_parser" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/slot_filler_0/metadata.json b/model/probabilistic_intent_parser/slot_filler_0/metadata.json new file mode 100644 index 0000000..18ccb30 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_0/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "crf_slot_filler" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/slot_filler_0/model.crfsuite b/model/probabilistic_intent_parser/slot_filler_0/model.crfsuite Binary files differnew file mode 100644 index 0000000..ffc3f12 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_0/model.crfsuite diff --git a/model/probabilistic_intent_parser/slot_filler_0/slot_filler.json b/model/probabilistic_intent_parser/slot_filler_0/slot_filler.json new file mode 100644 index 0000000..9972c21 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_0/slot_filler.json @@ -0,0 +1,188 @@ +{ + "config": { + "crf_args": { + "algorithm": "lbfgs", + "c1": 0.1, + "c2": 0.1 + }, + "data_augmentation_config": { + "add_builtin_entities_examples": true, + "capitalization_ratio": 0.2, + "min_utterances": 200 + }, + "feature_factory_configs": [ + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "language_code": "en", + "n": 1, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + -1, + 0, + 1, + 2 + ] + }, + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "language_code": "en", + "n": 2, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_digit", + "offsets": [ + -1, + 0, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_first", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": {}, + "factory_name": "is_last", + "offsets": [ + 0, + 1, + 2 + ] + }, + { + "args": { + "language_code": "en", + "n": 1 + }, + "factory_name": "shape_ngram", + "offsets": [ + 0 + ] + }, + { + "args": { + "language_code": "en", + "n": 2 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1, + 0 + ] + }, + { + "args": { + "language_code": "en", + "n": 3 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1 + ] + }, + { + "args": { + "entities": [ + "to_or_by", + "numeric_value", + "hvac_fan_speed_action" + ], + "entity_filter": { + "automatically_extensible": false + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "entities": [], + "entity_filter": { + "automatically_extensible": true + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "drop_out": 0.5, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "entity_labels": [ + "snips/amountOfMoney", + "snips/date", + "snips/datePeriod", + "snips/datetime", + "snips/duration", + "snips/number", + "snips/ordinal", + "snips/percentage", + "snips/temperature", + "snips/time", + "snips/timePeriod" + ], + "language_code": "en", + "tagging_scheme_code": 1 + }, + "factory_name": "builtin_entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "cluster_name": "brown_clusters", + "use_stemming": false + }, + "factory_name": "word_cluster", + "offsets": [ + -2, + -1, + 0, + 1 + ] + } + ], + "tagging_scheme": 1, + "unit_name": "crf_slot_filler" + }, + "crf_model_file": "model.crfsuite", + "intent": "HVACFanSpeed", + "language_code": "en", + "slot_name_mapping": { + "hvac_fan_speed_action": "hvac_fan_speed_action", + "numeric_value": "numeric_value", + "to_or_by": "to_or_by" + } +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/slot_filler_1/metadata.json b/model/probabilistic_intent_parser/slot_filler_1/metadata.json new file mode 100644 index 0000000..18ccb30 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_1/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "crf_slot_filler" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/slot_filler_1/model.crfsuite b/model/probabilistic_intent_parser/slot_filler_1/model.crfsuite Binary files differnew file mode 100644 index 0000000..d0a2123 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_1/model.crfsuite diff --git a/model/probabilistic_intent_parser/slot_filler_1/slot_filler.json b/model/probabilistic_intent_parser/slot_filler_1/slot_filler.json new file mode 100644 index 0000000..bbc51a4 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_1/slot_filler.json @@ -0,0 +1,188 @@ +{ + "config": { + "crf_args": { + "algorithm": "lbfgs", + "c1": 0.1, + "c2": 0.1 + }, + "data_augmentation_config": { + "add_builtin_entities_examples": true, + "capitalization_ratio": 0.2, + "min_utterances": 200 + }, + "feature_factory_configs": [ + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "language_code": "en", + "n": 1, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + -1, + 0, + 1, + 2 + ] + }, + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "language_code": "en", + "n": 2, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_digit", + "offsets": [ + -1, + 0, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_first", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": {}, + "factory_name": "is_last", + "offsets": [ + 0, + 1, + 2 + ] + }, + { + "args": { + "language_code": "en", + "n": 1 + }, + "factory_name": "shape_ngram", + "offsets": [ + 0 + ] + }, + { + "args": { + "language_code": "en", + "n": 2 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1, + 0 + ] + }, + { + "args": { + "language_code": "en", + "n": 3 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1 + ] + }, + { + "args": { + "entities": [ + "hvac_temperature_action", + "to_or_by", + "numeric_value" + ], + "entity_filter": { + "automatically_extensible": false + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "entities": [], + "entity_filter": { + "automatically_extensible": true + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "drop_out": 0.5, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "entity_labels": [ + "snips/amountOfMoney", + "snips/date", + "snips/datePeriod", + "snips/datetime", + "snips/duration", + "snips/number", + "snips/ordinal", + "snips/percentage", + "snips/temperature", + "snips/time", + "snips/timePeriod" + ], + "language_code": "en", + "tagging_scheme_code": 1 + }, + "factory_name": "builtin_entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "cluster_name": "brown_clusters", + "use_stemming": false + }, + "factory_name": "word_cluster", + "offsets": [ + -2, + -1, + 0, + 1 + ] + } + ], + "tagging_scheme": 1, + "unit_name": "crf_slot_filler" + }, + "crf_model_file": "model.crfsuite", + "intent": "HVACTemperature", + "language_code": "en", + "slot_name_mapping": { + "hvac_temperature_action": "hvac_temperature_action", + "numeric_value": "numeric_value", + "to_or_by": "to_or_by" + } +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/slot_filler_2/metadata.json b/model/probabilistic_intent_parser/slot_filler_2/metadata.json new file mode 100644 index 0000000..18ccb30 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_2/metadata.json @@ -0,0 +1,3 @@ +{ + "unit_name": "crf_slot_filler" +}
\ No newline at end of file diff --git a/model/probabilistic_intent_parser/slot_filler_2/model.crfsuite b/model/probabilistic_intent_parser/slot_filler_2/model.crfsuite Binary files differnew file mode 100644 index 0000000..65a8577 --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_2/model.crfsuite diff --git a/model/probabilistic_intent_parser/slot_filler_2/slot_filler.json b/model/probabilistic_intent_parser/slot_filler_2/slot_filler.json new file mode 100644 index 0000000..3ea6fbb --- /dev/null +++ b/model/probabilistic_intent_parser/slot_filler_2/slot_filler.json @@ -0,0 +1,188 @@ +{ + "config": { + "crf_args": { + "algorithm": "lbfgs", + "c1": 0.1, + "c2": 0.1 + }, + "data_augmentation_config": { + "add_builtin_entities_examples": true, + "capitalization_ratio": 0.2, + "min_utterances": 200 + }, + "feature_factory_configs": [ + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "language_code": "en", + "n": 1, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + -1, + 0, + 1, + 2 + ] + }, + { + "args": { + "common_words_gazetteer_name": "top_10000_words_stemmed", + "language_code": "en", + "n": 2, + "use_stemming": true + }, + "factory_name": "ngram", + "offsets": [ + -2, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_digit", + "offsets": [ + -1, + 0, + 1 + ] + }, + { + "args": {}, + "factory_name": "is_first", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": {}, + "factory_name": "is_last", + "offsets": [ + 0, + 1, + 2 + ] + }, + { + "args": { + "language_code": "en", + "n": 1 + }, + "factory_name": "shape_ngram", + "offsets": [ + 0 + ] + }, + { + "args": { + "language_code": "en", + "n": 2 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1, + 0 + ] + }, + { + "args": { + "language_code": "en", + "n": 3 + }, + "factory_name": "shape_ngram", + "offsets": [ + -1 + ] + }, + { + "args": { + "entities": [ + "to_or_by", + "numeric_value", + "volume_control_action" + ], + "entity_filter": { + "automatically_extensible": false + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "entities": [], + "entity_filter": { + "automatically_extensible": true + }, + "tagging_scheme_code": 2, + "use_stemming": true + }, + "drop_out": 0.5, + "factory_name": "entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "entity_labels": [ + "snips/amountOfMoney", + "snips/date", + "snips/datePeriod", + "snips/datetime", + "snips/duration", + "snips/number", + "snips/ordinal", + "snips/percentage", + "snips/temperature", + "snips/time", + "snips/timePeriod" + ], + "language_code": "en", + "tagging_scheme_code": 1 + }, + "factory_name": "builtin_entity_match", + "offsets": [ + -2, + -1, + 0 + ] + }, + { + "args": { + "cluster_name": "brown_clusters", + "use_stemming": false + }, + "factory_name": "word_cluster", + "offsets": [ + -2, + -1, + 0, + 1 + ] + } + ], + "tagging_scheme": 1, + "unit_name": "crf_slot_filler" + }, + "crf_model_file": "model.crfsuite", + "intent": "VolumeControl", + "language_code": "en", + "slot_name_mapping": { + "numeric_value": "numeric_value", + "to_or_by": "to_or_by", + "volume_control_action": "volume_control_action" + } +}
\ No newline at end of file |