Add gitlab issue/merge request templates
[src/snips-model-agl.git] / model / nlu_engine.json
1 {
2   "builtin_entity_parser": "builtin_entity_parser",
3   "config": {
4     "intent_parsers_configs": [
5       {
6         "ignore_stop_words": true,
7         "unit_name": "lookup_intent_parser"
8       },
9       {
10         "intent_classifier_config": {
11           "data_augmentation_config": {
12             "add_builtin_entities_examples": false,
13             "max_unknown_words": null,
14             "min_utterances": 20,
15             "noise_factor": 5,
16             "unknown_word_prob": 0.0,
17             "unknown_words_replacement_string": null
18           },
19           "featurizer_config": {
20             "added_cooccurrence_feature_ratio": 0.0,
21             "cooccurrence_vectorizer_config": {
22               "filter_stop_words": true,
23               "keep_order": true,
24               "unit_name": "cooccurrence_vectorizer",
25               "unknown_words_replacement_string": null,
26               "window_size": null
27             },
28             "pvalue_threshold": 0.4,
29             "tfidf_vectorizer_config": {
30               "unit_name": "tfidf_vectorizer",
31               "use_stemming": false,
32               "word_clusters_name": null
33             },
34             "unit_name": "featurizer"
35           },
36           "noise_reweight_factor": 1,
37           "unit_name": "log_reg_intent_classifier"
38         },
39         "slot_filler_config": {
40           "crf_args": {
41             "algorithm": "lbfgs",
42             "c1": 0.1,
43             "c2": 0.1
44           },
45           "data_augmentation_config": {
46             "add_builtin_entities_examples": true,
47             "capitalization_ratio": 0.2,
48             "min_utterances": 200
49           },
50           "feature_factory_configs": [
51             {
52               "args": {
53                 "common_words_gazetteer_name": "top_10000_words_stemmed",
54                 "n": 1,
55                 "use_stemming": true
56               },
57               "factory_name": "ngram",
58               "offsets": [
59                 -2,
60                 -1,
61                 0,
62                 1,
63                 2
64               ]
65             },
66             {
67               "args": {
68                 "common_words_gazetteer_name": "top_10000_words_stemmed",
69                 "n": 2,
70                 "use_stemming": true
71               },
72               "factory_name": "ngram",
73               "offsets": [
74                 -2,
75                 1
76               ]
77             },
78             {
79               "args": {},
80               "factory_name": "is_digit",
81               "offsets": [
82                 -1,
83                 0,
84                 1
85               ]
86             },
87             {
88               "args": {},
89               "factory_name": "is_first",
90               "offsets": [
91                 -2,
92                 -1,
93                 0
94               ]
95             },
96             {
97               "args": {},
98               "factory_name": "is_last",
99               "offsets": [
100                 0,
101                 1,
102                 2
103               ]
104             },
105             {
106               "args": {
107                 "n": 1
108               },
109               "factory_name": "shape_ngram",
110               "offsets": [
111                 0
112               ]
113             },
114             {
115               "args": {
116                 "n": 2
117               },
118               "factory_name": "shape_ngram",
119               "offsets": [
120                 -1,
121                 0
122               ]
123             },
124             {
125               "args": {
126                 "n": 3
127               },
128               "factory_name": "shape_ngram",
129               "offsets": [
130                 -1
131               ]
132             },
133             {
134               "args": {
135                 "entity_filter": {
136                   "automatically_extensible": false
137                 },
138                 "tagging_scheme_code": 2,
139                 "use_stemming": true
140               },
141               "factory_name": "entity_match",
142               "offsets": [
143                 -2,
144                 -1,
145                 0
146               ]
147             },
148             {
149               "args": {
150                 "entity_filter": {
151                   "automatically_extensible": true
152                 },
153                 "tagging_scheme_code": 2,
154                 "use_stemming": true
155               },
156               "drop_out": 0.5,
157               "factory_name": "entity_match",
158               "offsets": [
159                 -2,
160                 -1,
161                 0
162               ]
163             },
164             {
165               "args": {
166                 "tagging_scheme_code": 1
167               },
168               "factory_name": "builtin_entity_match",
169               "offsets": [
170                 -2,
171                 -1,
172                 0
173               ]
174             },
175             {
176               "args": {
177                 "cluster_name": "brown_clusters",
178                 "use_stemming": false
179               },
180               "factory_name": "word_cluster",
181               "offsets": [
182                 -2,
183                 -1,
184                 0,
185                 1
186               ]
187             }
188           ],
189           "tagging_scheme": 1,
190           "unit_name": "crf_slot_filler"
191         },
192         "unit_name": "probabilistic_intent_parser"
193       }
194     ],
195     "unit_name": "nlu_engine"
196   },
197   "custom_entity_parser": "custom_entity_parser",
198   "dataset_metadata": {
199     "entities": {
200       "hvac_fan_speed_action": {
201         "automatically_extensible": false
202       },
203       "hvac_temperature_action": {
204         "automatically_extensible": false
205       },
206       "numeric_value": {
207         "automatically_extensible": false
208       },
209       "to_or_by": {
210         "automatically_extensible": false
211       },
212       "volume_control_action": {
213         "automatically_extensible": false
214       }
215     },
216     "language_code": "en",
217     "slot_name_mappings": {
218       "HVACFanSpeed": {
219         "hvac_fan_speed_action": "hvac_fan_speed_action",
220         "numeric_value": "numeric_value",
221         "to_or_by": "to_or_by"
222       },
223       "HVACTemperature": {
224         "hvac_temperature_action": "hvac_temperature_action",
225         "numeric_value": "numeric_value",
226         "to_or_by": "to_or_by"
227       },
228       "VolumeControl": {
229         "numeric_value": "numeric_value",
230         "to_or_by": "to_or_by",
231         "volume_control_action": "volume_control_action"
232       }
233     }
234   },
235   "intent_parsers": [
236     "lookup_intent_parser",
237     "probabilistic_intent_parser"
238   ],
239   "model_version": "0.20.0",
240   "training_package_version": "0.20.2",
241   "unit_name": "nlu_engine"
242 }