rasa-pro 3.8.16__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of rasa-pro might be problematic. Click here for more details.

Files changed (644) hide show
  1. README.md +380 -0
  2. rasa/__init__.py +10 -0
  3. rasa/__main__.py +151 -0
  4. rasa/anonymization/__init__.py +2 -0
  5. rasa/anonymization/anonymisation_rule_yaml_reader.py +91 -0
  6. rasa/anonymization/anonymization_pipeline.py +287 -0
  7. rasa/anonymization/anonymization_rule_executor.py +260 -0
  8. rasa/anonymization/anonymization_rule_orchestrator.py +120 -0
  9. rasa/anonymization/schemas/config.yml +47 -0
  10. rasa/anonymization/utils.py +117 -0
  11. rasa/api.py +146 -0
  12. rasa/cli/__init__.py +5 -0
  13. rasa/cli/arguments/__init__.py +0 -0
  14. rasa/cli/arguments/data.py +81 -0
  15. rasa/cli/arguments/default_arguments.py +165 -0
  16. rasa/cli/arguments/evaluate.py +65 -0
  17. rasa/cli/arguments/export.py +51 -0
  18. rasa/cli/arguments/interactive.py +74 -0
  19. rasa/cli/arguments/run.py +204 -0
  20. rasa/cli/arguments/shell.py +13 -0
  21. rasa/cli/arguments/test.py +211 -0
  22. rasa/cli/arguments/train.py +263 -0
  23. rasa/cli/arguments/visualize.py +34 -0
  24. rasa/cli/arguments/x.py +30 -0
  25. rasa/cli/data.py +292 -0
  26. rasa/cli/e2e_test.py +566 -0
  27. rasa/cli/evaluate.py +222 -0
  28. rasa/cli/export.py +251 -0
  29. rasa/cli/inspect.py +63 -0
  30. rasa/cli/interactive.py +164 -0
  31. rasa/cli/license.py +65 -0
  32. rasa/cli/markers.py +78 -0
  33. rasa/cli/project_templates/__init__.py +0 -0
  34. rasa/cli/project_templates/calm/actions/__init__.py +0 -0
  35. rasa/cli/project_templates/calm/actions/action_template.py +27 -0
  36. rasa/cli/project_templates/calm/actions/add_contact.py +30 -0
  37. rasa/cli/project_templates/calm/actions/db.py +57 -0
  38. rasa/cli/project_templates/calm/actions/list_contacts.py +22 -0
  39. rasa/cli/project_templates/calm/actions/remove_contact.py +35 -0
  40. rasa/cli/project_templates/calm/config.yml +12 -0
  41. rasa/cli/project_templates/calm/credentials.yml +33 -0
  42. rasa/cli/project_templates/calm/data/flows/add_contact.yml +31 -0
  43. rasa/cli/project_templates/calm/data/flows/list_contacts.yml +14 -0
  44. rasa/cli/project_templates/calm/data/flows/remove_contact.yml +29 -0
  45. rasa/cli/project_templates/calm/db/contacts.json +10 -0
  46. rasa/cli/project_templates/calm/domain/add_contact.yml +33 -0
  47. rasa/cli/project_templates/calm/domain/list_contacts.yml +14 -0
  48. rasa/cli/project_templates/calm/domain/remove_contact.yml +31 -0
  49. rasa/cli/project_templates/calm/domain/shared.yml +5 -0
  50. rasa/cli/project_templates/calm/e2e_tests/cancelations/user_cancels_during_a_correction.yml +16 -0
  51. rasa/cli/project_templates/calm/e2e_tests/cancelations/user_changes_mind_on_a_whim.yml +7 -0
  52. rasa/cli/project_templates/calm/e2e_tests/corrections/user_corrects_contact_handle.yml +20 -0
  53. rasa/cli/project_templates/calm/e2e_tests/corrections/user_corrects_contact_name.yml +19 -0
  54. rasa/cli/project_templates/calm/e2e_tests/happy_paths/user_adds_contact_to_their_list.yml +15 -0
  55. rasa/cli/project_templates/calm/e2e_tests/happy_paths/user_lists_contacts.yml +5 -0
  56. rasa/cli/project_templates/calm/e2e_tests/happy_paths/user_removes_contact.yml +11 -0
  57. rasa/cli/project_templates/calm/e2e_tests/happy_paths/user_removes_contact_from_list.yml +12 -0
  58. rasa/cli/project_templates/calm/endpoints.yml +45 -0
  59. rasa/cli/project_templates/default/actions/__init__.py +0 -0
  60. rasa/cli/project_templates/default/actions/actions.py +27 -0
  61. rasa/cli/project_templates/default/config.yml +44 -0
  62. rasa/cli/project_templates/default/credentials.yml +33 -0
  63. rasa/cli/project_templates/default/data/nlu.yml +91 -0
  64. rasa/cli/project_templates/default/data/rules.yml +13 -0
  65. rasa/cli/project_templates/default/data/stories.yml +30 -0
  66. rasa/cli/project_templates/default/domain.yml +34 -0
  67. rasa/cli/project_templates/default/endpoints.yml +42 -0
  68. rasa/cli/project_templates/default/tests/test_stories.yml +91 -0
  69. rasa/cli/project_templates/tutorial/actions.py +22 -0
  70. rasa/cli/project_templates/tutorial/config.yml +11 -0
  71. rasa/cli/project_templates/tutorial/credentials.yml +33 -0
  72. rasa/cli/project_templates/tutorial/data/flows.yml +8 -0
  73. rasa/cli/project_templates/tutorial/domain.yml +17 -0
  74. rasa/cli/project_templates/tutorial/endpoints.yml +45 -0
  75. rasa/cli/run.py +136 -0
  76. rasa/cli/scaffold.py +268 -0
  77. rasa/cli/shell.py +141 -0
  78. rasa/cli/studio/__init__.py +0 -0
  79. rasa/cli/studio/download.py +51 -0
  80. rasa/cli/studio/studio.py +110 -0
  81. rasa/cli/studio/train.py +59 -0
  82. rasa/cli/studio/upload.py +85 -0
  83. rasa/cli/telemetry.py +90 -0
  84. rasa/cli/test.py +280 -0
  85. rasa/cli/train.py +260 -0
  86. rasa/cli/utils.py +453 -0
  87. rasa/cli/visualize.py +40 -0
  88. rasa/cli/x.py +205 -0
  89. rasa/constants.py +37 -0
  90. rasa/core/__init__.py +17 -0
  91. rasa/core/actions/__init__.py +0 -0
  92. rasa/core/actions/action.py +1450 -0
  93. rasa/core/actions/action_clean_stack.py +59 -0
  94. rasa/core/actions/action_run_slot_rejections.py +207 -0
  95. rasa/core/actions/action_trigger_chitchat.py +31 -0
  96. rasa/core/actions/action_trigger_flow.py +109 -0
  97. rasa/core/actions/action_trigger_search.py +31 -0
  98. rasa/core/actions/constants.py +2 -0
  99. rasa/core/actions/forms.py +737 -0
  100. rasa/core/actions/loops.py +111 -0
  101. rasa/core/actions/two_stage_fallback.py +186 -0
  102. rasa/core/agent.py +557 -0
  103. rasa/core/auth_retry_tracker_store.py +122 -0
  104. rasa/core/brokers/__init__.py +0 -0
  105. rasa/core/brokers/broker.py +126 -0
  106. rasa/core/brokers/file.py +58 -0
  107. rasa/core/brokers/kafka.py +322 -0
  108. rasa/core/brokers/pika.py +387 -0
  109. rasa/core/brokers/sql.py +86 -0
  110. rasa/core/channels/__init__.py +55 -0
  111. rasa/core/channels/audiocodes.py +463 -0
  112. rasa/core/channels/botframework.py +339 -0
  113. rasa/core/channels/callback.py +85 -0
  114. rasa/core/channels/channel.py +419 -0
  115. rasa/core/channels/console.py +243 -0
  116. rasa/core/channels/development_inspector.py +93 -0
  117. rasa/core/channels/facebook.py +422 -0
  118. rasa/core/channels/hangouts.py +335 -0
  119. rasa/core/channels/inspector/.eslintrc.cjs +25 -0
  120. rasa/core/channels/inspector/.gitignore +23 -0
  121. rasa/core/channels/inspector/README.md +54 -0
  122. rasa/core/channels/inspector/assets/favicon.ico +0 -0
  123. rasa/core/channels/inspector/assets/rasa-chat.js +2 -0
  124. rasa/core/channels/inspector/custom.d.ts +3 -0
  125. rasa/core/channels/inspector/dist/assets/arc-5623b6dc.js +1 -0
  126. rasa/core/channels/inspector/dist/assets/array-9f3ba611.js +1 -0
  127. rasa/core/channels/inspector/dist/assets/c4Diagram-d0fbc5ce-685c106a.js +10 -0
  128. rasa/core/channels/inspector/dist/assets/classDiagram-936ed81e-8cbed007.js +2 -0
  129. rasa/core/channels/inspector/dist/assets/classDiagram-v2-c3cb15f1-5889cf12.js +2 -0
  130. rasa/core/channels/inspector/dist/assets/createText-62fc7601-24c249d7.js +7 -0
  131. rasa/core/channels/inspector/dist/assets/edges-f2ad444c-7dd06a75.js +4 -0
  132. rasa/core/channels/inspector/dist/assets/erDiagram-9d236eb7-62c1e54c.js +51 -0
  133. rasa/core/channels/inspector/dist/assets/flowDb-1972c806-ce49b86f.js +6 -0
  134. rasa/core/channels/inspector/dist/assets/flowDiagram-7ea5b25a-4067e48f.js +4 -0
  135. rasa/core/channels/inspector/dist/assets/flowDiagram-v2-855bc5b3-85583a23.js +1 -0
  136. rasa/core/channels/inspector/dist/assets/flowchart-elk-definition-abe16c3d-59fe4051.js +139 -0
  137. rasa/core/channels/inspector/dist/assets/ganttDiagram-9b5ea136-47e3a43b.js +266 -0
  138. rasa/core/channels/inspector/dist/assets/gitGraphDiagram-99d0ae7c-5a2ac0d9.js +70 -0
  139. rasa/core/channels/inspector/dist/assets/ibm-plex-mono-v4-latin-regular-128cfa44.ttf +0 -0
  140. rasa/core/channels/inspector/dist/assets/ibm-plex-mono-v4-latin-regular-21dbcb97.woff +0 -0
  141. rasa/core/channels/inspector/dist/assets/ibm-plex-mono-v4-latin-regular-222b5e26.svg +329 -0
  142. rasa/core/channels/inspector/dist/assets/ibm-plex-mono-v4-latin-regular-9ad89b2a.woff2 +0 -0
  143. rasa/core/channels/inspector/dist/assets/index-268a75c0.js +1040 -0
  144. rasa/core/channels/inspector/dist/assets/index-2c4b9a3b-dfb8efc4.js +1 -0
  145. rasa/core/channels/inspector/dist/assets/index-3ee28881.css +1 -0
  146. rasa/core/channels/inspector/dist/assets/infoDiagram-736b4530-b0c470f2.js +7 -0
  147. rasa/core/channels/inspector/dist/assets/init-77b53fdd.js +1 -0
  148. rasa/core/channels/inspector/dist/assets/journeyDiagram-df861f2b-2edb829a.js +139 -0
  149. rasa/core/channels/inspector/dist/assets/lato-v14-latin-700-60c05ee4.woff +0 -0
  150. rasa/core/channels/inspector/dist/assets/lato-v14-latin-700-8335d9b8.svg +438 -0
  151. rasa/core/channels/inspector/dist/assets/lato-v14-latin-700-9cc39c75.ttf +0 -0
  152. rasa/core/channels/inspector/dist/assets/lato-v14-latin-700-ead13ccf.woff2 +0 -0
  153. rasa/core/channels/inspector/dist/assets/lato-v14-latin-regular-16705655.woff2 +0 -0
  154. rasa/core/channels/inspector/dist/assets/lato-v14-latin-regular-5aeb07f9.woff +0 -0
  155. rasa/core/channels/inspector/dist/assets/lato-v14-latin-regular-9c459044.ttf +0 -0
  156. rasa/core/channels/inspector/dist/assets/lato-v14-latin-regular-9e2898a4.svg +435 -0
  157. rasa/core/channels/inspector/dist/assets/layout-b6873d69.js +1 -0
  158. rasa/core/channels/inspector/dist/assets/line-1efc5781.js +1 -0
  159. rasa/core/channels/inspector/dist/assets/linear-661e9b94.js +1 -0
  160. rasa/core/channels/inspector/dist/assets/mindmap-definition-beec6740-2d2e727f.js +109 -0
  161. rasa/core/channels/inspector/dist/assets/ordinal-ba9b4969.js +1 -0
  162. rasa/core/channels/inspector/dist/assets/path-53f90ab3.js +1 -0
  163. rasa/core/channels/inspector/dist/assets/pieDiagram-dbbf0591-9d3ea93d.js +35 -0
  164. rasa/core/channels/inspector/dist/assets/quadrantDiagram-4d7f4fd6-06a178a2.js +7 -0
  165. rasa/core/channels/inspector/dist/assets/requirementDiagram-6fc4c22a-0bfedffc.js +52 -0
  166. rasa/core/channels/inspector/dist/assets/sankeyDiagram-8f13d901-d76d0a04.js +8 -0
  167. rasa/core/channels/inspector/dist/assets/sequenceDiagram-b655622a-37bb4341.js +122 -0
  168. rasa/core/channels/inspector/dist/assets/stateDiagram-59f0c015-f52f7f57.js +1 -0
  169. rasa/core/channels/inspector/dist/assets/stateDiagram-v2-2b26beab-4a986a20.js +1 -0
  170. rasa/core/channels/inspector/dist/assets/styles-080da4f6-7dd9ae12.js +110 -0
  171. rasa/core/channels/inspector/dist/assets/styles-3dcbcfbf-46e1ca14.js +159 -0
  172. rasa/core/channels/inspector/dist/assets/styles-9c745c82-4a97439a.js +207 -0
  173. rasa/core/channels/inspector/dist/assets/svgDrawCommon-4835440b-823917a3.js +1 -0
  174. rasa/core/channels/inspector/dist/assets/timeline-definition-5b62e21b-9ea72896.js +61 -0
  175. rasa/core/channels/inspector/dist/assets/xychartDiagram-2b33534f-b631a8b6.js +7 -0
  176. rasa/core/channels/inspector/dist/index.html +39 -0
  177. rasa/core/channels/inspector/index.html +37 -0
  178. rasa/core/channels/inspector/jest.config.ts +13 -0
  179. rasa/core/channels/inspector/package.json +48 -0
  180. rasa/core/channels/inspector/setupTests.ts +2 -0
  181. rasa/core/channels/inspector/src/App.tsx +170 -0
  182. rasa/core/channels/inspector/src/components/DiagramFlow.tsx +97 -0
  183. rasa/core/channels/inspector/src/components/DialogueInformation.tsx +187 -0
  184. rasa/core/channels/inspector/src/components/DialogueStack.tsx +151 -0
  185. rasa/core/channels/inspector/src/components/ExpandIcon.tsx +16 -0
  186. rasa/core/channels/inspector/src/components/FullscreenButton.tsx +45 -0
  187. rasa/core/channels/inspector/src/components/LoadingSpinner.tsx +19 -0
  188. rasa/core/channels/inspector/src/components/NoActiveFlow.tsx +21 -0
  189. rasa/core/channels/inspector/src/components/RasaLogo.tsx +32 -0
  190. rasa/core/channels/inspector/src/components/SaraDiagrams.tsx +39 -0
  191. rasa/core/channels/inspector/src/components/Slots.tsx +91 -0
  192. rasa/core/channels/inspector/src/components/Welcome.tsx +54 -0
  193. rasa/core/channels/inspector/src/helpers/formatters.test.ts +385 -0
  194. rasa/core/channels/inspector/src/helpers/formatters.ts +239 -0
  195. rasa/core/channels/inspector/src/helpers/utils.ts +42 -0
  196. rasa/core/channels/inspector/src/main.tsx +13 -0
  197. rasa/core/channels/inspector/src/theme/Button/Button.ts +29 -0
  198. rasa/core/channels/inspector/src/theme/Heading/Heading.ts +31 -0
  199. rasa/core/channels/inspector/src/theme/Input/Input.ts +27 -0
  200. rasa/core/channels/inspector/src/theme/Link/Link.ts +10 -0
  201. rasa/core/channels/inspector/src/theme/Modal/Modal.ts +47 -0
  202. rasa/core/channels/inspector/src/theme/Table/Table.tsx +38 -0
  203. rasa/core/channels/inspector/src/theme/Tooltip/Tooltip.ts +12 -0
  204. rasa/core/channels/inspector/src/theme/base/breakpoints.ts +8 -0
  205. rasa/core/channels/inspector/src/theme/base/colors.ts +88 -0
  206. rasa/core/channels/inspector/src/theme/base/fonts/fontFaces.css +29 -0
  207. rasa/core/channels/inspector/src/theme/base/fonts/ibm-plex-mono-v4-latin/ibm-plex-mono-v4-latin-regular.eot +0 -0
  208. rasa/core/channels/inspector/src/theme/base/fonts/ibm-plex-mono-v4-latin/ibm-plex-mono-v4-latin-regular.svg +329 -0
  209. rasa/core/channels/inspector/src/theme/base/fonts/ibm-plex-mono-v4-latin/ibm-plex-mono-v4-latin-regular.ttf +0 -0
  210. rasa/core/channels/inspector/src/theme/base/fonts/ibm-plex-mono-v4-latin/ibm-plex-mono-v4-latin-regular.woff +0 -0
  211. rasa/core/channels/inspector/src/theme/base/fonts/ibm-plex-mono-v4-latin/ibm-plex-mono-v4-latin-regular.woff2 +0 -0
  212. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-700.eot +0 -0
  213. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-700.svg +438 -0
  214. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-700.ttf +0 -0
  215. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-700.woff +0 -0
  216. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-700.woff2 +0 -0
  217. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-regular.eot +0 -0
  218. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-regular.svg +435 -0
  219. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-regular.ttf +0 -0
  220. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-regular.woff +0 -0
  221. rasa/core/channels/inspector/src/theme/base/fonts/lato-v14-latin/lato-v14-latin-regular.woff2 +0 -0
  222. rasa/core/channels/inspector/src/theme/base/radii.ts +9 -0
  223. rasa/core/channels/inspector/src/theme/base/shadows.ts +7 -0
  224. rasa/core/channels/inspector/src/theme/base/sizes.ts +7 -0
  225. rasa/core/channels/inspector/src/theme/base/space.ts +15 -0
  226. rasa/core/channels/inspector/src/theme/base/styles.ts +13 -0
  227. rasa/core/channels/inspector/src/theme/base/typography.ts +24 -0
  228. rasa/core/channels/inspector/src/theme/base/zIndices.ts +19 -0
  229. rasa/core/channels/inspector/src/theme/index.ts +101 -0
  230. rasa/core/channels/inspector/src/types.ts +64 -0
  231. rasa/core/channels/inspector/src/vite-env.d.ts +1 -0
  232. rasa/core/channels/inspector/tests/__mocks__/fileMock.ts +1 -0
  233. rasa/core/channels/inspector/tests/__mocks__/matchMedia.ts +16 -0
  234. rasa/core/channels/inspector/tests/__mocks__/styleMock.ts +1 -0
  235. rasa/core/channels/inspector/tests/renderWithProviders.tsx +14 -0
  236. rasa/core/channels/inspector/tsconfig.json +26 -0
  237. rasa/core/channels/inspector/tsconfig.node.json +10 -0
  238. rasa/core/channels/inspector/vite.config.ts +8 -0
  239. rasa/core/channels/inspector/yarn.lock +6156 -0
  240. rasa/core/channels/mattermost.py +229 -0
  241. rasa/core/channels/rasa_chat.py +126 -0
  242. rasa/core/channels/rest.py +210 -0
  243. rasa/core/channels/rocketchat.py +175 -0
  244. rasa/core/channels/slack.py +620 -0
  245. rasa/core/channels/socketio.py +274 -0
  246. rasa/core/channels/telegram.py +298 -0
  247. rasa/core/channels/twilio.py +169 -0
  248. rasa/core/channels/twilio_voice.py +367 -0
  249. rasa/core/channels/vier_cvg.py +374 -0
  250. rasa/core/channels/webexteams.py +135 -0
  251. rasa/core/concurrent_lock_store.py +210 -0
  252. rasa/core/constants.py +107 -0
  253. rasa/core/evaluation/__init__.py +0 -0
  254. rasa/core/evaluation/marker.py +267 -0
  255. rasa/core/evaluation/marker_base.py +925 -0
  256. rasa/core/evaluation/marker_stats.py +294 -0
  257. rasa/core/evaluation/marker_tracker_loader.py +103 -0
  258. rasa/core/exceptions.py +29 -0
  259. rasa/core/exporter.py +284 -0
  260. rasa/core/featurizers/__init__.py +0 -0
  261. rasa/core/featurizers/precomputation.py +410 -0
  262. rasa/core/featurizers/single_state_featurizer.py +402 -0
  263. rasa/core/featurizers/tracker_featurizers.py +1172 -0
  264. rasa/core/http_interpreter.py +89 -0
  265. rasa/core/information_retrieval/__init__.py +0 -0
  266. rasa/core/information_retrieval/faiss.py +116 -0
  267. rasa/core/information_retrieval/information_retrieval.py +72 -0
  268. rasa/core/information_retrieval/milvus.py +59 -0
  269. rasa/core/information_retrieval/qdrant.py +102 -0
  270. rasa/core/jobs.py +63 -0
  271. rasa/core/lock.py +139 -0
  272. rasa/core/lock_store.py +344 -0
  273. rasa/core/migrate.py +404 -0
  274. rasa/core/nlg/__init__.py +3 -0
  275. rasa/core/nlg/callback.py +147 -0
  276. rasa/core/nlg/contextual_response_rephraser.py +270 -0
  277. rasa/core/nlg/generator.py +230 -0
  278. rasa/core/nlg/interpolator.py +143 -0
  279. rasa/core/nlg/response.py +155 -0
  280. rasa/core/nlg/summarize.py +69 -0
  281. rasa/core/policies/__init__.py +0 -0
  282. rasa/core/policies/ensemble.py +329 -0
  283. rasa/core/policies/enterprise_search_policy.py +717 -0
  284. rasa/core/policies/enterprise_search_prompt_template.jinja2 +62 -0
  285. rasa/core/policies/flow_policy.py +205 -0
  286. rasa/core/policies/flows/__init__.py +0 -0
  287. rasa/core/policies/flows/flow_exceptions.py +44 -0
  288. rasa/core/policies/flows/flow_executor.py +582 -0
  289. rasa/core/policies/flows/flow_step_result.py +43 -0
  290. rasa/core/policies/intentless_policy.py +924 -0
  291. rasa/core/policies/intentless_prompt_template.jinja2 +22 -0
  292. rasa/core/policies/memoization.py +538 -0
  293. rasa/core/policies/policy.py +716 -0
  294. rasa/core/policies/rule_policy.py +1276 -0
  295. rasa/core/policies/ted_policy.py +2146 -0
  296. rasa/core/policies/unexpected_intent_policy.py +1015 -0
  297. rasa/core/processor.py +1331 -0
  298. rasa/core/run.py +315 -0
  299. rasa/core/secrets_manager/__init__.py +0 -0
  300. rasa/core/secrets_manager/constants.py +32 -0
  301. rasa/core/secrets_manager/endpoints.py +391 -0
  302. rasa/core/secrets_manager/factory.py +233 -0
  303. rasa/core/secrets_manager/secret_manager.py +262 -0
  304. rasa/core/secrets_manager/vault.py +576 -0
  305. rasa/core/test.py +1337 -0
  306. rasa/core/tracker_store.py +1664 -0
  307. rasa/core/train.py +107 -0
  308. rasa/core/training/__init__.py +89 -0
  309. rasa/core/training/converters/__init__.py +0 -0
  310. rasa/core/training/converters/responses_prefix_converter.py +119 -0
  311. rasa/core/training/interactive.py +1742 -0
  312. rasa/core/training/story_conflict.py +381 -0
  313. rasa/core/training/training.py +93 -0
  314. rasa/core/utils.py +344 -0
  315. rasa/core/visualize.py +70 -0
  316. rasa/dialogue_understanding/__init__.py +0 -0
  317. rasa/dialogue_understanding/coexistence/__init__.py +0 -0
  318. rasa/dialogue_understanding/coexistence/constants.py +4 -0
  319. rasa/dialogue_understanding/coexistence/intent_based_router.py +189 -0
  320. rasa/dialogue_understanding/coexistence/llm_based_router.py +261 -0
  321. rasa/dialogue_understanding/coexistence/router_template.jinja2 +12 -0
  322. rasa/dialogue_understanding/commands/__init__.py +45 -0
  323. rasa/dialogue_understanding/commands/can_not_handle_command.py +61 -0
  324. rasa/dialogue_understanding/commands/cancel_flow_command.py +116 -0
  325. rasa/dialogue_understanding/commands/chit_chat_answer_command.py +48 -0
  326. rasa/dialogue_understanding/commands/clarify_command.py +77 -0
  327. rasa/dialogue_understanding/commands/command.py +85 -0
  328. rasa/dialogue_understanding/commands/correct_slots_command.py +288 -0
  329. rasa/dialogue_understanding/commands/error_command.py +67 -0
  330. rasa/dialogue_understanding/commands/free_form_answer_command.py +9 -0
  331. rasa/dialogue_understanding/commands/handle_code_change_command.py +64 -0
  332. rasa/dialogue_understanding/commands/human_handoff_command.py +57 -0
  333. rasa/dialogue_understanding/commands/knowledge_answer_command.py +48 -0
  334. rasa/dialogue_understanding/commands/noop_command.py +45 -0
  335. rasa/dialogue_understanding/commands/set_slot_command.py +125 -0
  336. rasa/dialogue_understanding/commands/skip_question_command.py +66 -0
  337. rasa/dialogue_understanding/commands/start_flow_command.py +98 -0
  338. rasa/dialogue_understanding/generator/__init__.py +6 -0
  339. rasa/dialogue_understanding/generator/command_generator.py +257 -0
  340. rasa/dialogue_understanding/generator/command_prompt_template.jinja2 +57 -0
  341. rasa/dialogue_understanding/generator/flow_document_template.jinja2 +4 -0
  342. rasa/dialogue_understanding/generator/flow_retrieval.py +410 -0
  343. rasa/dialogue_understanding/generator/llm_command_generator.py +637 -0
  344. rasa/dialogue_understanding/generator/nlu_command_adapter.py +157 -0
  345. rasa/dialogue_understanding/patterns/__init__.py +0 -0
  346. rasa/dialogue_understanding/patterns/cancel.py +111 -0
  347. rasa/dialogue_understanding/patterns/cannot_handle.py +43 -0
  348. rasa/dialogue_understanding/patterns/chitchat.py +37 -0
  349. rasa/dialogue_understanding/patterns/clarify.py +97 -0
  350. rasa/dialogue_understanding/patterns/code_change.py +41 -0
  351. rasa/dialogue_understanding/patterns/collect_information.py +90 -0
  352. rasa/dialogue_understanding/patterns/completed.py +40 -0
  353. rasa/dialogue_understanding/patterns/continue_interrupted.py +42 -0
  354. rasa/dialogue_understanding/patterns/correction.py +278 -0
  355. rasa/dialogue_understanding/patterns/default_flows_for_patterns.yml +243 -0
  356. rasa/dialogue_understanding/patterns/human_handoff.py +37 -0
  357. rasa/dialogue_understanding/patterns/internal_error.py +47 -0
  358. rasa/dialogue_understanding/patterns/search.py +37 -0
  359. rasa/dialogue_understanding/patterns/skip_question.py +38 -0
  360. rasa/dialogue_understanding/processor/__init__.py +0 -0
  361. rasa/dialogue_understanding/processor/command_processor.py +578 -0
  362. rasa/dialogue_understanding/processor/command_processor_component.py +39 -0
  363. rasa/dialogue_understanding/stack/__init__.py +0 -0
  364. rasa/dialogue_understanding/stack/dialogue_stack.py +178 -0
  365. rasa/dialogue_understanding/stack/frames/__init__.py +19 -0
  366. rasa/dialogue_understanding/stack/frames/chit_chat_frame.py +27 -0
  367. rasa/dialogue_understanding/stack/frames/dialogue_stack_frame.py +137 -0
  368. rasa/dialogue_understanding/stack/frames/flow_stack_frame.py +157 -0
  369. rasa/dialogue_understanding/stack/frames/pattern_frame.py +10 -0
  370. rasa/dialogue_understanding/stack/frames/search_frame.py +27 -0
  371. rasa/dialogue_understanding/stack/utils.py +211 -0
  372. rasa/e2e_test/__init__.py +0 -0
  373. rasa/e2e_test/constants.py +10 -0
  374. rasa/e2e_test/e2e_test_case.py +322 -0
  375. rasa/e2e_test/e2e_test_result.py +34 -0
  376. rasa/e2e_test/e2e_test_runner.py +659 -0
  377. rasa/e2e_test/e2e_test_schema.yml +67 -0
  378. rasa/engine/__init__.py +0 -0
  379. rasa/engine/caching.py +464 -0
  380. rasa/engine/constants.py +17 -0
  381. rasa/engine/exceptions.py +14 -0
  382. rasa/engine/graph.py +625 -0
  383. rasa/engine/loader.py +36 -0
  384. rasa/engine/recipes/__init__.py +0 -0
  385. rasa/engine/recipes/config_files/default_config.yml +44 -0
  386. rasa/engine/recipes/default_components.py +99 -0
  387. rasa/engine/recipes/default_recipe.py +1252 -0
  388. rasa/engine/recipes/graph_recipe.py +79 -0
  389. rasa/engine/recipes/recipe.py +93 -0
  390. rasa/engine/runner/__init__.py +0 -0
  391. rasa/engine/runner/dask.py +256 -0
  392. rasa/engine/runner/interface.py +49 -0
  393. rasa/engine/storage/__init__.py +0 -0
  394. rasa/engine/storage/local_model_storage.py +248 -0
  395. rasa/engine/storage/resource.py +110 -0
  396. rasa/engine/storage/storage.py +203 -0
  397. rasa/engine/training/__init__.py +0 -0
  398. rasa/engine/training/components.py +176 -0
  399. rasa/engine/training/fingerprinting.py +64 -0
  400. rasa/engine/training/graph_trainer.py +256 -0
  401. rasa/engine/training/hooks.py +164 -0
  402. rasa/engine/validation.py +839 -0
  403. rasa/env.py +5 -0
  404. rasa/exceptions.py +69 -0
  405. rasa/graph_components/__init__.py +0 -0
  406. rasa/graph_components/converters/__init__.py +0 -0
  407. rasa/graph_components/converters/nlu_message_converter.py +48 -0
  408. rasa/graph_components/providers/__init__.py +0 -0
  409. rasa/graph_components/providers/domain_for_core_training_provider.py +87 -0
  410. rasa/graph_components/providers/domain_provider.py +71 -0
  411. rasa/graph_components/providers/flows_provider.py +74 -0
  412. rasa/graph_components/providers/forms_provider.py +44 -0
  413. rasa/graph_components/providers/nlu_training_data_provider.py +56 -0
  414. rasa/graph_components/providers/responses_provider.py +44 -0
  415. rasa/graph_components/providers/rule_only_provider.py +49 -0
  416. rasa/graph_components/providers/story_graph_provider.py +43 -0
  417. rasa/graph_components/providers/training_tracker_provider.py +55 -0
  418. rasa/graph_components/validators/__init__.py +0 -0
  419. rasa/graph_components/validators/default_recipe_validator.py +552 -0
  420. rasa/graph_components/validators/finetuning_validator.py +302 -0
  421. rasa/hooks.py +113 -0
  422. rasa/jupyter.py +63 -0
  423. rasa/keys +1 -0
  424. rasa/markers/__init__.py +0 -0
  425. rasa/markers/marker.py +269 -0
  426. rasa/markers/marker_base.py +828 -0
  427. rasa/markers/upload.py +74 -0
  428. rasa/markers/validate.py +21 -0
  429. rasa/model.py +118 -0
  430. rasa/model_testing.py +457 -0
  431. rasa/model_training.py +535 -0
  432. rasa/nlu/__init__.py +7 -0
  433. rasa/nlu/classifiers/__init__.py +3 -0
  434. rasa/nlu/classifiers/classifier.py +5 -0
  435. rasa/nlu/classifiers/diet_classifier.py +1874 -0
  436. rasa/nlu/classifiers/fallback_classifier.py +192 -0
  437. rasa/nlu/classifiers/keyword_intent_classifier.py +188 -0
  438. rasa/nlu/classifiers/llm_intent_classifier.py +519 -0
  439. rasa/nlu/classifiers/logistic_regression_classifier.py +240 -0
  440. rasa/nlu/classifiers/mitie_intent_classifier.py +156 -0
  441. rasa/nlu/classifiers/regex_message_handler.py +56 -0
  442. rasa/nlu/classifiers/sklearn_intent_classifier.py +309 -0
  443. rasa/nlu/constants.py +77 -0
  444. rasa/nlu/convert.py +40 -0
  445. rasa/nlu/emulators/__init__.py +0 -0
  446. rasa/nlu/emulators/dialogflow.py +55 -0
  447. rasa/nlu/emulators/emulator.py +49 -0
  448. rasa/nlu/emulators/luis.py +86 -0
  449. rasa/nlu/emulators/no_emulator.py +10 -0
  450. rasa/nlu/emulators/wit.py +56 -0
  451. rasa/nlu/extractors/__init__.py +0 -0
  452. rasa/nlu/extractors/crf_entity_extractor.py +672 -0
  453. rasa/nlu/extractors/duckling_entity_extractor.py +206 -0
  454. rasa/nlu/extractors/entity_synonyms.py +178 -0
  455. rasa/nlu/extractors/extractor.py +470 -0
  456. rasa/nlu/extractors/mitie_entity_extractor.py +293 -0
  457. rasa/nlu/extractors/regex_entity_extractor.py +220 -0
  458. rasa/nlu/extractors/spacy_entity_extractor.py +95 -0
  459. rasa/nlu/featurizers/__init__.py +0 -0
  460. rasa/nlu/featurizers/dense_featurizer/__init__.py +0 -0
  461. rasa/nlu/featurizers/dense_featurizer/convert_featurizer.py +449 -0
  462. rasa/nlu/featurizers/dense_featurizer/dense_featurizer.py +57 -0
  463. rasa/nlu/featurizers/dense_featurizer/lm_featurizer.py +772 -0
  464. rasa/nlu/featurizers/dense_featurizer/mitie_featurizer.py +170 -0
  465. rasa/nlu/featurizers/dense_featurizer/spacy_featurizer.py +132 -0
  466. rasa/nlu/featurizers/featurizer.py +89 -0
  467. rasa/nlu/featurizers/sparse_featurizer/__init__.py +0 -0
  468. rasa/nlu/featurizers/sparse_featurizer/count_vectors_featurizer.py +840 -0
  469. rasa/nlu/featurizers/sparse_featurizer/lexical_syntactic_featurizer.py +539 -0
  470. rasa/nlu/featurizers/sparse_featurizer/regex_featurizer.py +269 -0
  471. rasa/nlu/featurizers/sparse_featurizer/sparse_featurizer.py +9 -0
  472. rasa/nlu/model.py +24 -0
  473. rasa/nlu/persistor.py +240 -0
  474. rasa/nlu/run.py +27 -0
  475. rasa/nlu/selectors/__init__.py +0 -0
  476. rasa/nlu/selectors/response_selector.py +990 -0
  477. rasa/nlu/test.py +1943 -0
  478. rasa/nlu/tokenizers/__init__.py +0 -0
  479. rasa/nlu/tokenizers/jieba_tokenizer.py +148 -0
  480. rasa/nlu/tokenizers/mitie_tokenizer.py +75 -0
  481. rasa/nlu/tokenizers/spacy_tokenizer.py +72 -0
  482. rasa/nlu/tokenizers/tokenizer.py +239 -0
  483. rasa/nlu/tokenizers/whitespace_tokenizer.py +106 -0
  484. rasa/nlu/utils/__init__.py +35 -0
  485. rasa/nlu/utils/bilou_utils.py +462 -0
  486. rasa/nlu/utils/hugging_face/__init__.py +0 -0
  487. rasa/nlu/utils/hugging_face/registry.py +108 -0
  488. rasa/nlu/utils/hugging_face/transformers_pre_post_processors.py +311 -0
  489. rasa/nlu/utils/mitie_utils.py +113 -0
  490. rasa/nlu/utils/pattern_utils.py +168 -0
  491. rasa/nlu/utils/spacy_utils.py +312 -0
  492. rasa/plugin.py +90 -0
  493. rasa/server.py +1536 -0
  494. rasa/shared/__init__.py +0 -0
  495. rasa/shared/constants.py +181 -0
  496. rasa/shared/core/__init__.py +0 -0
  497. rasa/shared/core/constants.py +168 -0
  498. rasa/shared/core/conversation.py +46 -0
  499. rasa/shared/core/domain.py +2106 -0
  500. rasa/shared/core/events.py +2507 -0
  501. rasa/shared/core/flows/__init__.py +7 -0
  502. rasa/shared/core/flows/flow.py +353 -0
  503. rasa/shared/core/flows/flow_step.py +146 -0
  504. rasa/shared/core/flows/flow_step_links.py +319 -0
  505. rasa/shared/core/flows/flow_step_sequence.py +70 -0
  506. rasa/shared/core/flows/flows_list.py +211 -0
  507. rasa/shared/core/flows/flows_yaml_schema.json +217 -0
  508. rasa/shared/core/flows/nlu_trigger.py +117 -0
  509. rasa/shared/core/flows/steps/__init__.py +24 -0
  510. rasa/shared/core/flows/steps/action.py +51 -0
  511. rasa/shared/core/flows/steps/call.py +64 -0
  512. rasa/shared/core/flows/steps/collect.py +112 -0
  513. rasa/shared/core/flows/steps/constants.py +5 -0
  514. rasa/shared/core/flows/steps/continuation.py +36 -0
  515. rasa/shared/core/flows/steps/end.py +22 -0
  516. rasa/shared/core/flows/steps/internal.py +44 -0
  517. rasa/shared/core/flows/steps/link.py +51 -0
  518. rasa/shared/core/flows/steps/no_operation.py +48 -0
  519. rasa/shared/core/flows/steps/set_slots.py +50 -0
  520. rasa/shared/core/flows/steps/start.py +30 -0
  521. rasa/shared/core/flows/validation.py +527 -0
  522. rasa/shared/core/flows/yaml_flows_io.py +278 -0
  523. rasa/shared/core/generator.py +907 -0
  524. rasa/shared/core/slot_mappings.py +235 -0
  525. rasa/shared/core/slots.py +647 -0
  526. rasa/shared/core/trackers.py +1159 -0
  527. rasa/shared/core/training_data/__init__.py +0 -0
  528. rasa/shared/core/training_data/loading.py +90 -0
  529. rasa/shared/core/training_data/story_reader/__init__.py +0 -0
  530. rasa/shared/core/training_data/story_reader/story_reader.py +129 -0
  531. rasa/shared/core/training_data/story_reader/story_step_builder.py +168 -0
  532. rasa/shared/core/training_data/story_reader/yaml_story_reader.py +888 -0
  533. rasa/shared/core/training_data/story_writer/__init__.py +0 -0
  534. rasa/shared/core/training_data/story_writer/story_writer.py +76 -0
  535. rasa/shared/core/training_data/story_writer/yaml_story_writer.py +442 -0
  536. rasa/shared/core/training_data/structures.py +838 -0
  537. rasa/shared/core/training_data/visualization.html +146 -0
  538. rasa/shared/core/training_data/visualization.py +603 -0
  539. rasa/shared/data.py +192 -0
  540. rasa/shared/engine/__init__.py +0 -0
  541. rasa/shared/engine/caching.py +26 -0
  542. rasa/shared/exceptions.py +129 -0
  543. rasa/shared/importers/__init__.py +0 -0
  544. rasa/shared/importers/importer.py +705 -0
  545. rasa/shared/importers/multi_project.py +203 -0
  546. rasa/shared/importers/rasa.py +100 -0
  547. rasa/shared/importers/utils.py +34 -0
  548. rasa/shared/nlu/__init__.py +0 -0
  549. rasa/shared/nlu/constants.py +45 -0
  550. rasa/shared/nlu/interpreter.py +10 -0
  551. rasa/shared/nlu/training_data/__init__.py +0 -0
  552. rasa/shared/nlu/training_data/entities_parser.py +209 -0
  553. rasa/shared/nlu/training_data/features.py +374 -0
  554. rasa/shared/nlu/training_data/formats/__init__.py +10 -0
  555. rasa/shared/nlu/training_data/formats/dialogflow.py +162 -0
  556. rasa/shared/nlu/training_data/formats/luis.py +87 -0
  557. rasa/shared/nlu/training_data/formats/rasa.py +135 -0
  558. rasa/shared/nlu/training_data/formats/rasa_yaml.py +605 -0
  559. rasa/shared/nlu/training_data/formats/readerwriter.py +245 -0
  560. rasa/shared/nlu/training_data/formats/wit.py +52 -0
  561. rasa/shared/nlu/training_data/loading.py +137 -0
  562. rasa/shared/nlu/training_data/lookup_tables_parser.py +30 -0
  563. rasa/shared/nlu/training_data/message.py +477 -0
  564. rasa/shared/nlu/training_data/schemas/__init__.py +0 -0
  565. rasa/shared/nlu/training_data/schemas/data_schema.py +85 -0
  566. rasa/shared/nlu/training_data/schemas/nlu.yml +53 -0
  567. rasa/shared/nlu/training_data/schemas/responses.yml +70 -0
  568. rasa/shared/nlu/training_data/synonyms_parser.py +42 -0
  569. rasa/shared/nlu/training_data/training_data.py +732 -0
  570. rasa/shared/nlu/training_data/util.py +223 -0
  571. rasa/shared/providers/__init__.py +0 -0
  572. rasa/shared/providers/openai/__init__.py +0 -0
  573. rasa/shared/providers/openai/clients.py +43 -0
  574. rasa/shared/providers/openai/session_handler.py +110 -0
  575. rasa/shared/utils/__init__.py +0 -0
  576. rasa/shared/utils/cli.py +72 -0
  577. rasa/shared/utils/common.py +308 -0
  578. rasa/shared/utils/constants.py +1 -0
  579. rasa/shared/utils/io.py +403 -0
  580. rasa/shared/utils/llm.py +405 -0
  581. rasa/shared/utils/pykwalify_extensions.py +26 -0
  582. rasa/shared/utils/schemas/__init__.py +0 -0
  583. rasa/shared/utils/schemas/config.yml +2 -0
  584. rasa/shared/utils/schemas/domain.yml +142 -0
  585. rasa/shared/utils/schemas/events.py +212 -0
  586. rasa/shared/utils/schemas/model_config.yml +46 -0
  587. rasa/shared/utils/schemas/stories.yml +173 -0
  588. rasa/shared/utils/yaml.py +777 -0
  589. rasa/studio/__init__.py +0 -0
  590. rasa/studio/auth.py +252 -0
  591. rasa/studio/config.py +127 -0
  592. rasa/studio/constants.py +16 -0
  593. rasa/studio/data_handler.py +352 -0
  594. rasa/studio/download.py +350 -0
  595. rasa/studio/train.py +136 -0
  596. rasa/studio/upload.py +408 -0
  597. rasa/telemetry.py +1583 -0
  598. rasa/tracing/__init__.py +0 -0
  599. rasa/tracing/config.py +338 -0
  600. rasa/tracing/constants.py +38 -0
  601. rasa/tracing/instrumentation/__init__.py +0 -0
  602. rasa/tracing/instrumentation/attribute_extractors.py +663 -0
  603. rasa/tracing/instrumentation/instrumentation.py +939 -0
  604. rasa/tracing/instrumentation/intentless_policy_instrumentation.py +142 -0
  605. rasa/tracing/instrumentation/metrics.py +206 -0
  606. rasa/tracing/metric_instrument_provider.py +125 -0
  607. rasa/utils/__init__.py +0 -0
  608. rasa/utils/beta.py +83 -0
  609. rasa/utils/cli.py +27 -0
  610. rasa/utils/common.py +635 -0
  611. rasa/utils/converter.py +53 -0
  612. rasa/utils/endpoints.py +303 -0
  613. rasa/utils/io.py +326 -0
  614. rasa/utils/licensing.py +319 -0
  615. rasa/utils/log_utils.py +174 -0
  616. rasa/utils/mapper.py +210 -0
  617. rasa/utils/ml_utils.py +145 -0
  618. rasa/utils/plotting.py +362 -0
  619. rasa/utils/singleton.py +23 -0
  620. rasa/utils/tensorflow/__init__.py +0 -0
  621. rasa/utils/tensorflow/callback.py +112 -0
  622. rasa/utils/tensorflow/constants.py +116 -0
  623. rasa/utils/tensorflow/crf.py +492 -0
  624. rasa/utils/tensorflow/data_generator.py +440 -0
  625. rasa/utils/tensorflow/environment.py +161 -0
  626. rasa/utils/tensorflow/exceptions.py +5 -0
  627. rasa/utils/tensorflow/layers.py +1565 -0
  628. rasa/utils/tensorflow/layers_utils.py +113 -0
  629. rasa/utils/tensorflow/metrics.py +281 -0
  630. rasa/utils/tensorflow/model_data.py +991 -0
  631. rasa/utils/tensorflow/model_data_utils.py +500 -0
  632. rasa/utils/tensorflow/models.py +936 -0
  633. rasa/utils/tensorflow/rasa_layers.py +1094 -0
  634. rasa/utils/tensorflow/transformer.py +640 -0
  635. rasa/utils/tensorflow/types.py +6 -0
  636. rasa/utils/train_utils.py +572 -0
  637. rasa/utils/yaml.py +54 -0
  638. rasa/validator.py +1035 -0
  639. rasa/version.py +3 -0
  640. rasa_pro-3.8.16.dist-info/METADATA +528 -0
  641. rasa_pro-3.8.16.dist-info/NOTICE +5 -0
  642. rasa_pro-3.8.16.dist-info/RECORD +644 -0
  643. rasa_pro-3.8.16.dist-info/WHEEL +4 -0
  644. rasa_pro-3.8.16.dist-info/entry_points.txt +3 -0
@@ -0,0 +1,539 @@
1
+ from __future__ import annotations
2
+ import logging
3
+ from collections import OrderedDict
4
+
5
+ import scipy.sparse
6
+ import numpy as np
7
+ from typing import (
8
+ Any,
9
+ Dict,
10
+ Text,
11
+ List,
12
+ Tuple,
13
+ Callable,
14
+ Set,
15
+ Optional,
16
+ Type,
17
+ Union,
18
+ )
19
+
20
+ from rasa.engine.graph import ExecutionContext, GraphComponent
21
+ from rasa.engine.recipes.default_recipe import DefaultV1Recipe
22
+ from rasa.engine.storage.resource import Resource
23
+ from rasa.engine.storage.storage import ModelStorage
24
+ from rasa.nlu.tokenizers.spacy_tokenizer import POS_TAG_KEY, SpacyTokenizer
25
+ from rasa.nlu.tokenizers.tokenizer import Token, Tokenizer
26
+ from rasa.nlu.featurizers.sparse_featurizer.sparse_featurizer import SparseFeaturizer
27
+ from rasa.nlu.constants import TOKENS_NAMES
28
+ from rasa.shared.constants import DOCS_URL_COMPONENTS
29
+ from rasa.shared.nlu.training_data.training_data import TrainingData
30
+ from rasa.shared.nlu.training_data.message import Message
31
+ from rasa.shared.nlu.constants import TEXT
32
+ from rasa.shared.exceptions import InvalidConfigException
33
+ import rasa.shared.utils.io
34
+ import rasa.utils.io
35
+
36
+ logger = logging.getLogger(__name__)
37
+
38
+
39
+ END_OF_SENTENCE = "EOS"
40
+ BEGIN_OF_SENTENCE = "BOS"
41
+
42
+ FEATURES = "features"
43
+
44
+
45
+ @DefaultV1Recipe.register(
46
+ DefaultV1Recipe.ComponentType.MESSAGE_FEATURIZER, is_trainable=True
47
+ )
48
+ class LexicalSyntacticFeaturizer(SparseFeaturizer, GraphComponent):
49
+ """Extracts and encodes lexical syntactic features.
50
+
51
+ Given a sequence of tokens, this featurizer produces a sequence of features
52
+ where the `t`-th feature encodes lexical and syntactic information about the `t`-th
53
+ token and it's surrounding tokens.
54
+
55
+ In detail: The lexical syntactic features can be specified via a list of
56
+ configurations `[c_0, c_1, ..., c_n]` where each `c_i` is a list of names of
57
+ lexical and syntactic features (e.g. `low`, `suffix2`, `digit`).
58
+ For a given tokenized text, the featurizer will consider a window of size `n`
59
+ around each token and evaluate the given list of configurations as follows:
60
+ - It will extract the features listed in `c_m` where `m = (n-1)/2` if n is even and
61
+ `n/2` from token `t`
62
+ - It will extract the features listed in `c_{m-1}`,`c_{m-2}` ... , from the last,
63
+ second to last, ... token before token `t`, respectively.
64
+ - It will extract the features listed `c_{m+1}`, `c_{m+1}`, ... for the first,
65
+ second, ... token `t`, respectively.
66
+ It will then combine all these features into one feature for position `t`.
67
+
68
+ Example:
69
+ If we specify `[['low'], ['upper'], ['prefix2']]`, then for each position `t`
70
+ the `t`-th feature will encode whether the token at position `t` is upper case,
71
+ where the token at position `t-1` is lower case and the first two characters
72
+ of the token at position `t+1`.
73
+ """
74
+
75
+ FILENAME_FEATURE_TO_IDX_DICT = "feature_to_idx_dict.pkl"
76
+
77
+ # NOTE: "suffix5" of the token "is" will be "is". Hence, when combining multiple
78
+ # prefixes, short words will be represented/encoded repeatedly.
79
+ _FUNCTION_DICT: Dict[
80
+ Text, Callable[[Token], Union[Text, bool, None]]
81
+ ] = { # noqa: RUF012
82
+ "low": lambda token: token.text.islower(),
83
+ "title": lambda token: token.text.istitle(),
84
+ "prefix5": lambda token: token.text[:5],
85
+ "prefix2": lambda token: token.text[:2],
86
+ "suffix5": lambda token: token.text[-5:],
87
+ "suffix3": lambda token: token.text[-3:],
88
+ "suffix2": lambda token: token.text[-2:],
89
+ "suffix1": lambda token: token.text[-1:],
90
+ "pos": lambda token: token.data.get(POS_TAG_KEY, None),
91
+ "pos2": lambda token: token.data.get(POS_TAG_KEY, [])[:2]
92
+ if POS_TAG_KEY in token.data
93
+ else None,
94
+ "upper": lambda token: token.text.isupper(),
95
+ "digit": lambda token: token.text.isdigit(),
96
+ }
97
+
98
+ SUPPORTED_FEATURES = sorted(
99
+ set(_FUNCTION_DICT.keys()).union([END_OF_SENTENCE, BEGIN_OF_SENTENCE])
100
+ )
101
+
102
+ @classmethod
103
+ def _extract_raw_features_from_token(
104
+ cls, feature_name: Text, token: Token, token_position: int, num_tokens: int
105
+ ) -> Text:
106
+ """Extracts a raw feature from the token at the given position.
107
+
108
+ Args:
109
+ feature_name: the name of a supported feature
110
+ token: the token from which we want to extract the feature
111
+ token_position: the position of the token inside the tokenized text
112
+ num_tokens: the total number of tokens in the tokenized text
113
+ Returns:
114
+ the raw feature value as text
115
+ """
116
+ if feature_name not in cls.SUPPORTED_FEATURES:
117
+ raise InvalidConfigException(
118
+ f"Configured feature '{feature_name}' not valid. Please check "
119
+ f"'{DOCS_URL_COMPONENTS}' for valid configuration parameters."
120
+ )
121
+ if feature_name == END_OF_SENTENCE:
122
+ return str(token_position == num_tokens - 1)
123
+ if feature_name == BEGIN_OF_SENTENCE:
124
+ return str(token_position == 0)
125
+ return str(cls._FUNCTION_DICT[feature_name](token))
126
+
127
+ @classmethod
128
+ def required_components(cls) -> List[Type]:
129
+ """Components that should be included in the pipeline before this component."""
130
+ return [Tokenizer]
131
+
132
+ @staticmethod
133
+ def get_default_config() -> Dict[Text, Any]:
134
+ """Returns the component's default config."""
135
+ return {
136
+ **SparseFeaturizer.get_default_config(),
137
+ FEATURES: [
138
+ ["low", "title", "upper"],
139
+ ["BOS", "EOS", "low", "upper", "title", "digit"],
140
+ ["low", "title", "upper"],
141
+ ],
142
+ }
143
+
144
+ def __init__(
145
+ self,
146
+ config: Dict[Text, Any],
147
+ model_storage: ModelStorage,
148
+ resource: Resource,
149
+ execution_context: ExecutionContext,
150
+ feature_to_idx_dict: Optional[Dict[Tuple[int, Text], Dict[Text, int]]] = None,
151
+ ) -> None:
152
+ """Instantiates a new `LexicalSyntacticFeaturizer` instance."""
153
+ super().__init__(execution_context.node_name, config)
154
+ # graph component
155
+ self._model_storage = model_storage
156
+ self._resource = resource
157
+ self._execution_context = execution_context
158
+ # featurizer specific
159
+ self._feature_config = self._config[FEATURES]
160
+ self._set_feature_to_idx_dict(
161
+ feature_to_idx_dict or {}, check_consistency_with_config=True
162
+ )
163
+
164
+ @classmethod
165
+ def validate_config(cls, config: Dict[Text, Any]) -> None:
166
+ """Validates that the component is configured properly."""
167
+ if FEATURES not in config:
168
+ return # will be replaced with default
169
+ feature_config = config[FEATURES]
170
+ message = (
171
+ f"Expected configuration of `features` to be a list of lists that "
172
+ f"that contain names of lexical and syntactic features "
173
+ f"(i.e. {cls.SUPPORTED_FEATURES}). "
174
+ f"Received {feature_config} instead. "
175
+ )
176
+ try:
177
+ configured_feature_names = set(
178
+ feature_name
179
+ for pos_config in feature_config
180
+ for feature_name in pos_config
181
+ )
182
+ except TypeError as e:
183
+ raise InvalidConfigException(message) from e
184
+ if configured_feature_names.difference(cls.SUPPORTED_FEATURES):
185
+ raise InvalidConfigException(message)
186
+
187
+ def _set_feature_to_idx_dict(
188
+ self,
189
+ feature_to_idx_dict: Dict[Tuple[int, Text], Dict[Text, int]],
190
+ check_consistency_with_config: bool = False,
191
+ ) -> None:
192
+ """Sets the "feature" to index mapping.
193
+
194
+ Here, "feature" denotes the combination of window position, feature name,
195
+ and feature_value.
196
+
197
+ Args:
198
+ feature_to_idx_dict: mapping from tuples of window position and feature name
199
+ to a mapping from feature values to indices
200
+ check_consistency_with_config: whether the consistency with the current
201
+ `self.config` should be checked
202
+ """
203
+ self._feature_to_idx_dict = feature_to_idx_dict
204
+ self._number_of_features = sum(
205
+ [
206
+ len(feature_values.values())
207
+ for feature_values in self._feature_to_idx_dict.values()
208
+ ]
209
+ )
210
+ if check_consistency_with_config:
211
+ known_features = set(self._feature_to_idx_dict.keys())
212
+ not_in_config = known_features.difference(
213
+ (
214
+ (window_idx, feature_name)
215
+ for window_idx, feature_names in enumerate(self._feature_config)
216
+ for feature_name in feature_names
217
+ )
218
+ )
219
+ if not_in_config:
220
+ rasa.shared.utils.io.raise_warning(
221
+ f"A feature to index mapping has been loaded that does not match "
222
+ f"the configured features. The given mapping configures "
223
+ f" (position in window, feature_name): {not_in_config}. "
224
+ f" These are not specified in the given config "
225
+ f" {self._feature_config}. "
226
+ f"Continuing with constant values for these features. "
227
+ )
228
+
229
+ def train(self, training_data: TrainingData) -> Resource:
230
+ """Trains the featurizer.
231
+
232
+ Args:
233
+ training_data: the training data
234
+
235
+ Returns:
236
+ the resource from which this trained component can be loaded
237
+ """
238
+ self.warn_if_pos_features_cannot_be_computed(training_data)
239
+ feature_to_idx_dict = self._create_feature_to_idx_dict(training_data)
240
+ self._set_feature_to_idx_dict(feature_to_idx_dict=feature_to_idx_dict)
241
+ if not self._feature_to_idx_dict:
242
+ rasa.shared.utils.io.raise_warning(
243
+ "No lexical syntactic features could be extracted from the training "
244
+ "data. In order for this component to work you need to define "
245
+ "`features` that can be found in the given training data."
246
+ )
247
+ self.persist()
248
+ return self._resource
249
+
250
+ def warn_if_pos_features_cannot_be_computed(
251
+ self, training_data: TrainingData
252
+ ) -> None:
253
+ """Warn if part-of-speech features are needed but not given."""
254
+ training_example = next(
255
+ (
256
+ message
257
+ for message in training_data.training_examples
258
+ if message.get(TOKENS_NAMES[TEXT], [])
259
+ ),
260
+ Message(),
261
+ )
262
+ tokens_example = training_example.get(TOKENS_NAMES[TEXT], [])
263
+
264
+ configured_feature_names = set(
265
+ feature_name
266
+ for pos_config in self._feature_config
267
+ for feature_name in pos_config
268
+ )
269
+ if {"pos", "pos2"}.intersection(
270
+ configured_feature_names
271
+ ) and not tokens_example[0].data.get(POS_TAG_KEY, []):
272
+ rasa.shared.utils.io.raise_warning(
273
+ f"Expected training data to include tokens with part-of-speech tags"
274
+ f"because the given configuration includes part-of-speech features "
275
+ f"`pos` and/or `pos2`. "
276
+ f"Please add a {SpacyTokenizer.__name__} to your "
277
+ f"configuration if you want to use the part-of-speech-features in the"
278
+ f"{self.__class__.__name__}. "
279
+ f"Continuing without the part-of-speech-features."
280
+ )
281
+
282
+ def _create_feature_to_idx_dict(
283
+ self, training_data: TrainingData
284
+ ) -> Dict[Tuple[int, Text], Dict[Text, int]]:
285
+ """Create a nested dictionary of all feature values.
286
+
287
+ Returns:
288
+ a nested mapping that maps from tuples of positions (in the window) and
289
+ supported feature names to "raw feature to index" mappings, i.e.
290
+ mappings that map the respective raw feature values to unique indices
291
+ (where `unique` means unique with respect to all indices in the
292
+ *nested* mapping)
293
+ """
294
+ # collect all raw feature values
295
+ feature_vocabulary: Dict[Tuple[int, Text], Set[Text]] = dict()
296
+ for example in training_data.training_examples:
297
+ tokens = example.get(TOKENS_NAMES[TEXT], [])
298
+ sentence_features = self._map_tokens_to_raw_features(tokens)
299
+ for token_features in sentence_features:
300
+ for position_and_feature_name, feature_value in token_features.items():
301
+ feature_vocabulary.setdefault(position_and_feature_name, set()).add(
302
+ feature_value
303
+ )
304
+ # assign a unique index to each feature value
305
+ return self._build_feature_to_index_map(feature_vocabulary)
306
+
307
+ def _map_tokens_to_raw_features(
308
+ self, tokens: List[Token]
309
+ ) -> List[Dict[Tuple[int, Text], Text]]:
310
+ """Extracts the raw feature values.
311
+
312
+ Args:
313
+ tokens: a tokenized text
314
+ Returns:
315
+ a list of feature dictionaries for each token in the given list
316
+ where each feature dictionary maps a tuple containing
317
+ - a position (in the window) and
318
+ - a supported feature name
319
+ to the corresponding raw feature value
320
+ """
321
+ sentence_features = []
322
+
323
+ # in case of an even number we will look at one more word before,
324
+ # e.g. window size 4 will result in a window range of
325
+ # [-2, -1, 0, 1] (0 = current word in sentence)
326
+ window_size = len(self._feature_config)
327
+ half_window_size = window_size // 2
328
+ window_range = range(-half_window_size, half_window_size + window_size % 2)
329
+ assert len(window_range) == window_size
330
+
331
+ for anchor in range(len(tokens)):
332
+
333
+ token_features: Dict[Tuple[int, Text], Text] = {}
334
+
335
+ for window_position, relative_position in enumerate(window_range):
336
+ absolute_position = anchor + relative_position
337
+
338
+ # skip, if current_idx is pointing to a non-existing token
339
+ if absolute_position < 0 or absolute_position >= len(tokens):
340
+ continue
341
+
342
+ token = tokens[absolute_position]
343
+ for feature_name in self._feature_config[window_position]:
344
+ token_features[
345
+ (window_position, feature_name)
346
+ ] = self._extract_raw_features_from_token(
347
+ token=token,
348
+ feature_name=feature_name,
349
+ token_position=absolute_position,
350
+ num_tokens=len(tokens),
351
+ )
352
+
353
+ sentence_features.append(token_features)
354
+
355
+ return sentence_features
356
+
357
+ @staticmethod
358
+ def _build_feature_to_index_map(
359
+ feature_vocabulary: Dict[Tuple[int, Text], Set[Text]]
360
+ ) -> Dict[Tuple[int, Text], Dict[Text, int]]:
361
+ """Creates a nested dictionary for mapping raw features to indices.
362
+
363
+ Args:
364
+ feature_vocabulary: a mapping from tuples of positions (in the window) and
365
+ supported feature names to the set of possible feature values
366
+ Returns:
367
+ a nested mapping that maps from tuples of positions (in the window) and
368
+ supported feature names to "raw feature to index" mappings, i.e.
369
+ mappings that map the respective raw feature values to unique indices
370
+ (where `unique` means unique with respect to all indices in the
371
+ *nested* mapping)
372
+ """
373
+ # Note that this will only sort the top level keys - and we keep
374
+ # doing it to ensure consistently with what was done before)
375
+ ordered_feature_vocabulary: Dict[Tuple[int, Text], Set[Text]] = OrderedDict(
376
+ sorted(feature_vocabulary.items())
377
+ )
378
+
379
+ # create the nested mapping
380
+ feature_to_idx_dict: Dict[Tuple[int, Text], Dict[Text, int]] = {}
381
+ offset = 0
382
+ for (
383
+ position_and_feature_name,
384
+ feature_values,
385
+ ) in ordered_feature_vocabulary.items():
386
+ sorted_feature_values = sorted(feature_values)
387
+ feature_to_idx_dict[position_and_feature_name] = {
388
+ feature_value: feature_idx
389
+ for feature_idx, feature_value in enumerate(
390
+ sorted_feature_values, start=offset
391
+ )
392
+ }
393
+ offset += len(feature_values)
394
+
395
+ return feature_to_idx_dict
396
+
397
+ def process(self, messages: List[Message]) -> List[Message]:
398
+ """Featurizes all given messages in-place.
399
+
400
+ Args:
401
+ messages: messages to be featurized.
402
+
403
+ Returns:
404
+ The same list with the same messages after featurization.
405
+ """
406
+ for message in messages:
407
+ self._process_message(message)
408
+ return messages
409
+
410
+ def process_training_data(self, training_data: TrainingData) -> TrainingData:
411
+ """Processes the training examples in the given training data in-place.
412
+
413
+ Args:
414
+ training_data: the training data
415
+
416
+ Returns:
417
+ same training data after processing
418
+ """
419
+ self.process(training_data.training_examples)
420
+ return training_data
421
+
422
+ def _process_message(self, message: Message) -> None:
423
+ """Featurizes the given message in-place.
424
+
425
+ Args:
426
+ message: a message to be featurized
427
+ """
428
+ if not self._feature_to_idx_dict:
429
+ rasa.shared.utils.io.raise_warning(
430
+ f"The {self.__class__.__name__} {self._identifier} has not been "
431
+ f"trained properly yet. "
432
+ f"Continuing without adding features from this featurizer."
433
+ )
434
+ return
435
+ tokens = message.get(TOKENS_NAMES[TEXT])
436
+ if tokens:
437
+ sentence_features = self._map_tokens_to_raw_features(tokens)
438
+ sparse_matrix = self._map_raw_features_to_indices(sentence_features)
439
+ self.add_features_to_message(
440
+ # FIXME: create sentence feature and make `sentence` non optional
441
+ sequence=sparse_matrix,
442
+ sentence=None,
443
+ attribute=TEXT,
444
+ message=message,
445
+ )
446
+
447
+ def _map_raw_features_to_indices(
448
+ self, sentence_features: List[Dict[Tuple[int, Text], Any]]
449
+ ) -> scipy.sparse.coo_matrix:
450
+ """Converts the raw features to one-hot encodings.
451
+
452
+ Requires the "feature" to index dictionary, i.e. the featurizer must have
453
+ been trained.
454
+
455
+ Args:
456
+ sentence_features: a list of feature dictionaries where the `t`-th feature
457
+ dictionary maps a tuple containing
458
+ - a position (in the window) and
459
+ - a supported feature name
460
+ to the raw feature value extracted from the window around the `t`-th token.
461
+
462
+ Returns:
463
+ a sparse matrix where the `i`-th row is a multi-hot vector that encodes the
464
+ raw features extracted from the window around the `i`-th token
465
+ """
466
+ rows = []
467
+ cols = []
468
+ shape = (len(sentence_features), self._number_of_features)
469
+ for token_idx, token_features in enumerate(sentence_features):
470
+ for position_and_feature_name, feature_value in token_features.items():
471
+ mapping = self._feature_to_idx_dict.get(position_and_feature_name)
472
+ if not mapping:
473
+ continue
474
+ feature_idx = mapping.get(feature_value, -1)
475
+ if feature_idx > -1:
476
+ rows.append(token_idx)
477
+ cols.append(feature_idx)
478
+ data = np.ones(len(rows))
479
+ return scipy.sparse.coo_matrix(
480
+ (data, (np.array(rows), np.array(cols))), shape=shape
481
+ )
482
+
483
+ @classmethod
484
+ def create(
485
+ cls,
486
+ config: Dict[Text, Any],
487
+ model_storage: ModelStorage,
488
+ resource: Resource,
489
+ execution_context: ExecutionContext,
490
+ ) -> LexicalSyntacticFeaturizer:
491
+ """Creates a new untrained component (see parent class for full docstring)."""
492
+ return cls(config, model_storage, resource, execution_context)
493
+
494
+ @classmethod
495
+ def load(
496
+ cls,
497
+ config: Dict[Text, Any],
498
+ model_storage: ModelStorage,
499
+ resource: Resource,
500
+ execution_context: ExecutionContext,
501
+ **kwargs: Any,
502
+ ) -> LexicalSyntacticFeaturizer:
503
+ """Loads trained component (see parent class for full docstring)."""
504
+ try:
505
+ with model_storage.read_from(resource) as model_path:
506
+ feature_to_idx_dict = rasa.utils.io.json_unpickle(
507
+ model_path / cls.FILENAME_FEATURE_TO_IDX_DICT,
508
+ encode_non_string_keys=True,
509
+ )
510
+ return cls(
511
+ config=config,
512
+ model_storage=model_storage,
513
+ resource=resource,
514
+ execution_context=execution_context,
515
+ feature_to_idx_dict=feature_to_idx_dict,
516
+ )
517
+ except ValueError:
518
+ logger.debug(
519
+ f"Failed to load `{cls.__class__.__name__}` from model storage. "
520
+ f"Resource '{resource.name}' doesn't exist."
521
+ )
522
+ return cls(
523
+ config=config,
524
+ model_storage=model_storage,
525
+ resource=resource,
526
+ execution_context=execution_context,
527
+ )
528
+
529
+ def persist(self) -> None:
530
+ """Persist this model (see parent class for full docstring)."""
531
+ if not self._feature_to_idx_dict:
532
+ return None
533
+
534
+ with self._model_storage.write_to(self._resource) as model_path:
535
+ rasa.utils.io.json_pickle(
536
+ model_path / self.FILENAME_FEATURE_TO_IDX_DICT,
537
+ self._feature_to_idx_dict,
538
+ encode_non_string_keys=True,
539
+ )