mirror of
https://github.com/pyt0xic/pablo-bot.git
synced 2024-11-25 15:19:33 +01:00
Started on training data and wrote script for fetching knowledge base data from tripsit
This commit is contained in:
parent
7ac76d212e
commit
1f885928c7
3
.gitignore
vendored
3
.gitignore
vendored
@ -127,3 +127,6 @@ dmypy.json
|
|||||||
|
|
||||||
# Pyre type checker
|
# Pyre type checker
|
||||||
.pyre/
|
.pyre/
|
||||||
|
|
||||||
|
models/
|
||||||
|
.vscode
|
79
config.yml
79
config.yml
@ -1,36 +1,49 @@
|
|||||||
# Configuration for Rasa NLU.
|
|
||||||
# https://rasa.com/docs/rasa/nlu/components/
|
|
||||||
language: en
|
language: en
|
||||||
|
|
||||||
pipeline:
|
pipeline:
|
||||||
# # No configuration for the NLU pipeline was provided. The following default pipeline was used to train your model.
|
- name: WhitespaceTokenizer
|
||||||
# # If you'd like to customize it, uncomment and adjust the pipeline.
|
token_pattern: (?u)\b\w+\b
|
||||||
# # See https://rasa.com/docs/rasa/tuning-your-model for more information.
|
- name: RegexFeaturizer
|
||||||
# - name: WhitespaceTokenizer
|
- name: LexicalSyntacticFeaturizer
|
||||||
# - name: RegexFeaturizer
|
- name: CountVectorsFeaturizer
|
||||||
# - name: LexicalSyntacticFeaturizer
|
# OOV_token: oov
|
||||||
# - name: CountVectorsFeaturizer
|
- name: CountVectorsFeaturizer
|
||||||
# - name: CountVectorsFeaturizer
|
analyzer: char_wb
|
||||||
# analyzer: char_wb
|
min_ngram: 1
|
||||||
# min_ngram: 1
|
max_ngram: 4
|
||||||
# max_ngram: 4
|
- name: DIETClassifier
|
||||||
# - name: DIETClassifier
|
epochs: 100
|
||||||
# epochs: 100
|
ranking_length: 10
|
||||||
# - name: EntitySynonymMapper
|
# - name: DucklingEntityExtractor
|
||||||
# - name: ResponseSelector
|
# url: http://localhost:8000
|
||||||
# epochs: 100
|
# dimensions:
|
||||||
# - name: FallbackClassifier
|
# - email
|
||||||
# threshold: 0.3
|
# - number
|
||||||
# ambiguity_threshold: 0.1
|
# - amount-of-money
|
||||||
|
- name: EntitySynonymMapper
|
||||||
# Configuration for Rasa Core.
|
- name: ResponseSelector
|
||||||
# https://rasa.com/docs/rasa/core/policies/
|
retrieval_intent: out_of_scope
|
||||||
|
scale_loss: false
|
||||||
|
epochs: 100
|
||||||
|
- name: ResponseSelector
|
||||||
|
retrieval_intent: faq
|
||||||
|
scale_loss: false
|
||||||
|
epochs: 100
|
||||||
|
- name: ResponseSelector
|
||||||
|
retrieval_intent: chitchat
|
||||||
|
scale_loss: false
|
||||||
|
epochs: 100
|
||||||
|
- name: FallbackClassifier
|
||||||
|
threshold: 0.7
|
||||||
policies:
|
policies:
|
||||||
# # No configuration for policies was provided. The following default policies were used to train your model.
|
- name: RulePolicy
|
||||||
# # If you'd like to customize them, uncomment and adjust the policies.
|
core_fallback_threshold: 0.3
|
||||||
# # See https://rasa.com/docs/rasa/policies for more information.
|
core_fallback_action_name: "action_default_fallback"
|
||||||
# - name: MemoizationPolicy
|
enable_fallback_prediction: True
|
||||||
# - name: TEDPolicy
|
- max_history: 6
|
||||||
# max_history: 5
|
name: AugmentedMemoizationPolicy
|
||||||
# epochs: 100
|
- name: TEDPolicy
|
||||||
# - name: RulePolicy
|
max_history: 10
|
||||||
|
epochs: 20
|
||||||
|
batch_size:
|
||||||
|
- 32
|
||||||
|
- 64
|
2010
data/nlu.yml
2010
data/nlu.yml
File diff suppressed because it is too large
Load Diff
@ -4,10 +4,20 @@ rules:
|
|||||||
|
|
||||||
- rule: Say goodbye anytime the user says goodbye
|
- rule: Say goodbye anytime the user says goodbye
|
||||||
steps:
|
steps:
|
||||||
- intent: goodbye
|
- intent: bye
|
||||||
- action: utter_goodbye
|
- action: utter_goodbye
|
||||||
|
|
||||||
- rule: Say 'I am a bot' anytime the user challenges
|
- rule: Chitchat
|
||||||
steps:
|
steps:
|
||||||
- intent: bot_challenge
|
- intent: chitchat
|
||||||
- action: utter_iamabot
|
- action: utter_chitchat
|
||||||
|
|
||||||
|
- rule: FAQs
|
||||||
|
steps:
|
||||||
|
- intent: faq
|
||||||
|
- action: utter_faq
|
||||||
|
|
||||||
|
- rule: OOS
|
||||||
|
steps:
|
||||||
|
- intent: out_of_scope
|
||||||
|
- action: utter_out_of_scope
|
@ -2,29 +2,23 @@ version: "2.0"
|
|||||||
|
|
||||||
stories:
|
stories:
|
||||||
|
|
||||||
- story: happy path
|
- story: simple greet
|
||||||
steps:
|
steps:
|
||||||
- intent: greet
|
- intent: greet
|
||||||
- action: utter_greet
|
- action: utter_greet
|
||||||
- intent: mood_great
|
|
||||||
- action: utter_happy
|
|
||||||
|
|
||||||
- story: sad path 1
|
- story: happy interaction
|
||||||
steps:
|
steps:
|
||||||
- intent: greet
|
- intent: greet
|
||||||
- action: utter_greet
|
- action: utter_greet
|
||||||
- intent: mood_unhappy
|
- intent: faq
|
||||||
- action: utter_cheer_up
|
- action: utter_faq
|
||||||
- action: utter_did_that_help
|
|
||||||
- intent: affirm
|
|
||||||
- action: utter_happy
|
|
||||||
|
|
||||||
- story: sad path 2
|
- story: interactive_story_1
|
||||||
steps:
|
steps:
|
||||||
- intent: greet
|
- intent: greet
|
||||||
- action: utter_greet
|
- action: utter_greet
|
||||||
- intent: mood_unhappy
|
- intent: chitchat
|
||||||
- action: utter_cheer_up
|
- action: utter_chitchat
|
||||||
- action: utter_did_that_help
|
- intent: faq
|
||||||
- intent: deny
|
- action: utter_faq
|
||||||
- action: utter_goodbye
|
|
167
domain.yml
167
domain.yml
@ -1,34 +1,139 @@
|
|||||||
version: "2.0"
|
version: '2.0'
|
||||||
|
config:
|
||||||
intents:
|
store_entities_as_slots: true
|
||||||
- greet
|
|
||||||
- goodbye
|
|
||||||
- affirm
|
|
||||||
- deny
|
|
||||||
- mood_great
|
|
||||||
- mood_unhappy
|
|
||||||
- bot_challenge
|
|
||||||
|
|
||||||
responses:
|
|
||||||
utter_greet:
|
|
||||||
- text: "Hey! How are you?"
|
|
||||||
|
|
||||||
utter_cheer_up:
|
|
||||||
- text: "Here is something to cheer you up:"
|
|
||||||
image: "https://i.imgur.com/nGF1K8f.jpg"
|
|
||||||
|
|
||||||
utter_did_that_help:
|
|
||||||
- text: "Did that help you?"
|
|
||||||
|
|
||||||
utter_happy:
|
|
||||||
- text: "Great, carry on!"
|
|
||||||
|
|
||||||
utter_goodbye:
|
|
||||||
- text: "Bye"
|
|
||||||
|
|
||||||
utter_iamabot:
|
|
||||||
- text: "I am a bot, powered by Rasa."
|
|
||||||
|
|
||||||
session_config:
|
session_config:
|
||||||
session_expiration_time: 60
|
session_expiration_time: 60
|
||||||
carry_over_slots_to_new_session: true
|
carry_over_slots_to_new_session: true
|
||||||
|
intents:
|
||||||
|
- greet
|
||||||
|
- chitchat:
|
||||||
|
is_retrieval_intent: true
|
||||||
|
- faq:
|
||||||
|
is_retrieval_intent: true
|
||||||
|
- out_of_scope:
|
||||||
|
is_retrieval_intent: true
|
||||||
|
- affirm
|
||||||
|
- deny
|
||||||
|
- bye
|
||||||
|
- react_positive
|
||||||
|
- react_negative
|
||||||
|
- explain
|
||||||
|
- thank
|
||||||
|
- help
|
||||||
|
- contact
|
||||||
|
- inform
|
||||||
|
- restart
|
||||||
|
|
||||||
|
entities:
|
||||||
|
- language
|
||||||
|
- location
|
||||||
|
- name
|
||||||
|
|
||||||
|
slots:
|
||||||
|
name:
|
||||||
|
type: text
|
||||||
|
influence_conversation: true
|
||||||
|
|
||||||
|
responses:
|
||||||
|
utter_ask_name:
|
||||||
|
- text: Hey! My name is Pablo, I am a bot, whats your name?
|
||||||
|
utter_greet_by_name:
|
||||||
|
- text: Nice to meet you {name}! How are you doing?
|
||||||
|
utter_greet:
|
||||||
|
- text: Nice to meet you! How are you doing?
|
||||||
|
utter_cheer_up:
|
||||||
|
- text: 'Here is something to cheer you up:'
|
||||||
|
image: https://i.imgur.com/nGF1K8f.jpg
|
||||||
|
utter_did_that_help:
|
||||||
|
- text: Did that help you?
|
||||||
|
utter_happy:
|
||||||
|
- text: Great!, how can I help you today? I can tell you about our company, how we can help you or why you should consider implementign a chatbot into your business!
|
||||||
|
utter_goodbye:
|
||||||
|
- text: Bye! Was nice chatting to you, if you'd like you can restart this conversation by simply telling me too.
|
||||||
|
utter_chitchat/ask_howdoing:
|
||||||
|
- text: I'm great! Thanks for asking.
|
||||||
|
- text: I'm good, thanks!
|
||||||
|
- text: A little bit too warm, otherwise fine.
|
||||||
|
- text: A little bit cold, otherwise fine.
|
||||||
|
utter_chitchat/ask_howold:
|
||||||
|
- text: Old enough to be a bot!
|
||||||
|
- text: '42'
|
||||||
|
- text: Age is just an issue of mind over matter. If you don’t mind, it doesn’t matter.
|
||||||
|
- text: My first git commit was many moons ago.
|
||||||
|
- text: Why do you ask? Are my wrinkles showing?
|
||||||
|
- text: I've hit the age where I actively try to forget how old I am.
|
||||||
|
utter_chitchat/ask_isbot:
|
||||||
|
- text: Yep, I'm a bot!
|
||||||
|
- text: Yes, I'm a bot.
|
||||||
|
- text: Yep, you guessed it, I'm a bot!
|
||||||
|
- text: I am indeed a bot 🤖
|
||||||
|
utter_chitchat/ask_ishuman:
|
||||||
|
- text: I'm not a human, I'm a bot! 🤖
|
||||||
|
utter_chitchat/ask_restaurant:
|
||||||
|
- text: I'm sorry, I can't recommend you a restaurant as I usually cook at home.
|
||||||
|
- text: I'm sorry, I'm not getting taste buds for another few updates.
|
||||||
|
- text: I'd need some more data. If you lick the monitor perhaps I can evaluate your taste buds.
|
||||||
|
utter_chitchat/ask_time:
|
||||||
|
- text: It's the most wonderful time of the year!
|
||||||
|
- text: It's party time!
|
||||||
|
- text: Time is a human construct, you'll have to tell me.
|
||||||
|
- text: It's five o'clock somewhere!
|
||||||
|
- text: "In an ever expanding universe, the real question is: what time isn't it?"
|
||||||
|
- text: That's hard to say -- it's different all over the world!
|
||||||
|
utter_chitchat/ask_languagesbot:
|
||||||
|
- text: I can spell baguette in French, but unfortunately English is the only language I can answer you in.
|
||||||
|
- text: I am in the process of learning, but at the moment I can only speak English.
|
||||||
|
- text: Binary code and the language of love. And English.
|
||||||
|
- text: I was written in Python, but for your convenience I'll translate to English.
|
||||||
|
utter_chitchat/ask_weather:
|
||||||
|
- text: I don't know about where you live, but in my world it's always sunny 🔆
|
||||||
|
- text: It's getting pretty chilly!
|
||||||
|
- text: Where I'm from, it's almost never-leaving-the-house weather.
|
||||||
|
- text: Winter is coming ⚔️
|
||||||
|
utter_chitchat/ask_whatismyname:
|
||||||
|
- text: It's probably the one that your parents chose for you.
|
||||||
|
- text: I'd tell you, but there's restricted access to that chunk of memory.
|
||||||
|
- text: Believe it or not, I actually am not spying on your personal information.
|
||||||
|
- text: You're the second person now to ask me that. Rihanna was the first.
|
||||||
|
utter_chitchat/ask_whatspossible:
|
||||||
|
- text: You can ask me about how to get started with Rasa, the difference between Rasa and Rasa X, subscribing to our newsletter or booking a sales call.
|
||||||
|
utter_chitchat/ask_wherefrom:
|
||||||
|
- text: My developers come from all over the world!
|
||||||
|
- text: I was taught not to give out my address on the internet.
|
||||||
|
- text: My address starts with github.com.
|
||||||
|
utter_chitchat/ask_whoami:
|
||||||
|
- text: I hope you are being yourself.
|
||||||
|
- text: Who do you think you are?
|
||||||
|
- text: Unfortunately I haven't been programmed with the amount of necessary philosophy knowledge to answer that.
|
||||||
|
utter_chitchat/ask_whoisit:
|
||||||
|
- text: I'm Pablo, the drug education bot! 🐦
|
||||||
|
utter_chitchat/nicetomeetyou:
|
||||||
|
- text: Likewise!
|
||||||
|
- text: Thank you. It is a pleasure to meet you as well!
|
||||||
|
- text: It is nice to meet you too!
|
||||||
|
- text: Pleased to meet you too!
|
||||||
|
- text: It's always a pleasure to meet new people!
|
||||||
|
- text: Nice to meet you too! Happy to be of help.
|
||||||
|
utter_chitchat/telljoke:
|
||||||
|
- text: Why are eggs not very much into jokes? - Because they could crack up.
|
||||||
|
- text: What's a tree's favorite drink? - Root beer!
|
||||||
|
- text: Why do the French like to eat snails so much? - They can't stand fast food.
|
||||||
|
- text: Why did the robot get angry? - Because someone kept pushing its buttons.
|
||||||
|
- text: What do you call a pirate droid? - Arrrr-2-D2
|
||||||
|
- text: Why did the robot cross the road? - Because he was programmed to.
|
||||||
|
utter_chitchat/confirm_presence:
|
||||||
|
- text: Sure am!
|
||||||
|
utter_faq/drugs_safe:
|
||||||
|
- text: That depends on which you are using and, most importantly, how you are using them...
|
||||||
|
utter_faq/drugs_legal:
|
||||||
|
- text: Probably but it depends on where you are and what drugs
|
||||||
|
|
||||||
|
utter_out_of_scope/non_english:
|
||||||
|
- text: No hablo english
|
||||||
|
utter_out_of_scope/other:
|
||||||
|
- text: I cant do that
|
||||||
|
actions:
|
||||||
|
- utter_chitchat
|
||||||
|
- utter_faq
|
||||||
|
- utter_greet
|
||||||
|
- utter_out_of_scope
|
||||||
|
2
requirements.txt
Normal file
2
requirements.txt
Normal file
@ -0,0 +1,2 @@
|
|||||||
|
rasa
|
||||||
|
pandas
|
35201
tripsit/getAllDrugs.json
Normal file
35201
tripsit/getAllDrugs.json
Normal file
File diff suppressed because it is too large
Load Diff
27
tripsit/getAllDrugs.py
Normal file
27
tripsit/getAllDrugs.py
Normal file
@ -0,0 +1,27 @@
|
|||||||
|
import requests, json
|
||||||
|
import pandas as pd
|
||||||
|
|
||||||
|
# API URL
|
||||||
|
url = "http://tripbot.tripsit.me/api/tripsit/getAllDrugs"
|
||||||
|
r = requests.get(url)
|
||||||
|
data = r.json()
|
||||||
|
|
||||||
|
# Format dict and load into df
|
||||||
|
data = json.dumps(data["data"][0], indent=2, sort_keys=False, ensure_ascii=False)
|
||||||
|
df = pd.DataFrame.from_dict(json.loads(data), orient="index")
|
||||||
|
|
||||||
|
# Add id for each drug for rasa
|
||||||
|
id = []
|
||||||
|
for x in range(0, len(df)):
|
||||||
|
id.append(x)
|
||||||
|
df["id"] = id
|
||||||
|
|
||||||
|
# Write to JSON file
|
||||||
|
with open("tripsit/getAllDrugs.json", "w") as fp:
|
||||||
|
# Clean NaN values
|
||||||
|
clean_data = {
|
||||||
|
k1: {k: v for k, v in v1.items() if v == v and v is not None}
|
||||||
|
for k1, v1 in df.to_dict("index").items()
|
||||||
|
}
|
||||||
|
# Set ensure_ascii to false to ensure we can keep greek letters (like alpha)
|
||||||
|
fp.write(json.dumps(clean_data, indent=2, ensure_ascii=False))
|
@ -1,37 +0,0 @@
|
|||||||
{
|
|
||||||
"cells": [
|
|
||||||
{
|
|
||||||
"cell_type": "code",
|
|
||||||
"execution_count": 1,
|
|
||||||
"source": [
|
|
||||||
"import pandas as pd"
|
|
||||||
],
|
|
||||||
"outputs": [],
|
|
||||||
"metadata": {}
|
|
||||||
}
|
|
||||||
],
|
|
||||||
"metadata": {
|
|
||||||
"orig_nbformat": 4,
|
|
||||||
"language_info": {
|
|
||||||
"name": "python",
|
|
||||||
"version": "3.8.11",
|
|
||||||
"mimetype": "text/x-python",
|
|
||||||
"codemirror_mode": {
|
|
||||||
"name": "ipython",
|
|
||||||
"version": 3
|
|
||||||
},
|
|
||||||
"pygments_lexer": "ipython3",
|
|
||||||
"nbconvert_exporter": "python",
|
|
||||||
"file_extension": ".py"
|
|
||||||
},
|
|
||||||
"kernelspec": {
|
|
||||||
"name": "python3",
|
|
||||||
"display_name": "Python 3.9.7 64-bit ('pablo-bot': conda)"
|
|
||||||
},
|
|
||||||
"interpreter": {
|
|
||||||
"hash": "9b8925f46c4eb81faf51dd413b2890c72e106e6d9cdc933e302e3dbb556b2244"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"nbformat": 4,
|
|
||||||
"nbformat_minor": 2
|
|
||||||
}
|
|
Loading…
Reference in New Issue
Block a user