diff --git a/docker-compose.yml b/docker-compose.yml index 2bccc02a..96126e02 100644 --- a/docker-compose.yml +++ b/docker-compose.yml @@ -73,7 +73,20 @@ services: env_file: - docker/notebooks.env volumes: - - ./bot:/work/bot + - ./coach:/work/coach - ./notebooks:/work/notebooks + - notebook_models:/models:ro ports: - 8888:8888 + depends_on: + - coach + + # =============================== Coach ================================= + coach: + image: botcoach:latest + volumes: + - notebook_models:/notebook_models + command: sh -c "cp -r /src_models/* /notebook_models" + +volumes: + notebook_models: diff --git a/docker/notebooks.env b/docker/notebooks.env index 3bc123ee..61af9af3 100644 --- a/docker/notebooks.env +++ b/docker/notebooks.env @@ -1,8 +1,8 @@ -BOT_DIR_PATH=../../bot/ -BOT_DOMAIN_PATH=../../bot/domain.yml -BOT_NLU_CONFIG_PATH=../../bot/nlu_config.yml -BOT_STORIES_PATH=../../bot/data/stories/ -BOT_INTENTS_PATH=../../bot/data/intents/ -BOT_MODELS_PATH=../../bot/models/ -BOT_MODELS_NLU_PATH=../../bot/models/nlu/current/ -BOT_MODELS_DIALOGUE_PATH=../../bot/models/dialogue +COACH_DIR_PATH=../../coach/ +COACH_DOMAIN_PATH=../../coach/domain.yml +COACH_NLU_CONFIG_PATH=../../coach/nlu_config.yml +COACH_STORIES_PATH=../../coach/data/stories/ +COACH_INTENTS_PATH=../../coach/data/intents/ +COACH_MODELS_PATH=/models/ +COACH_MODELS_NLU_PATH=/models/nlu/current/ +COACH_MODELS_DIALOGUE_PATH=/models/dialogue \ No newline at end of file diff --git a/docs/README-en.md b/docs/README-en.md index 2e3d7d91..345a907b 100644 --- a/docs/README-en.md +++ b/docs/README-en.md @@ -16,7 +16,7 @@ Various technologies are used in boilerplate that interact with each other to ob The user interacts with Boilerplate via RocketChat or Telegram, which sends the messages to the Rasa NLU via -connectors, where it identifies the * intent *, and responds to the Rasa Core, according to *stories* and *actions*. 
+connectors, where it identifies the *intent*, and responds to the Rasa Core, according to *stories* and *actions*. The *models* used for the conversation were generated by the *trainer* module and then transferred to the bot, these models can be versioned and evolved between bots. Notebooks evaluate the operation according to the format of *intents* and *stories*. diff --git a/notebooks/intents/.ipynb_checkpoints/intents-analysis-checkpoint.ipynb b/notebooks/intents/.ipynb_checkpoints/intents-analysis-checkpoint.ipynb index ad9c062e..c15cddbf 100644 --- a/notebooks/intents/.ipynb_checkpoints/intents-analysis-checkpoint.ipynb +++ b/notebooks/intents/.ipynb_checkpoints/intents-analysis-checkpoint.ipynb @@ -7,541 +7,487 @@ "id": "kO9wt2g3okLS" }, "source": [ - "# Analisando o bot\n", + "# Análise das Intents\n", "\n", - "Este jupyter-notebook vai auxiliar na análise de detecção de intenções da Taís." + "Este jupyter-notebook vai auxiliar na análise de detecção de intenções de seu chatbot." 
] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "## Instalação\n", - "\n", - "### Configurando jupyter" + "### Configurando e Imports" ] }, { "cell_type": "code", "execution_count": 1, "metadata": { - "scrolled": true + "scrolled": false }, - "outputs": [], + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "rasa_nlu: 0.15.0\n" + ] + } + ], "source": [ - "%matplotlib inline\n", - "\n", - "import logging, io, json, warnings\n", - "logging.basicConfig(level=\"INFO\")\n", - "warnings.filterwarnings('ignore')\n", + "from IPython.display import IFrame\n", "\n", - "def pprint(o):\n", - " # small helper to make dict dumps a bit prettier\n", - " print(json.dumps(o, indent=2))" + "import rasa_nlu\n", + "print(\"rasa_nlu: {}\".format(rasa_nlu.__version__))" ] }, { "cell_type": "markdown", - "metadata": {}, + "metadata": { + "colab_type": "text", + "id": "1xeXgpdwzOAl" + }, "source": [ - "### Listando versões" + "### Treinando o modelo do Rasa NLU\n", + "\n", + "* Para avaliar o bot o primeiro passo é treinar o seu chatbot. 
Mas não é necessário treinar a parte de conversão completa (rasa_core) apenas a parte de interpretação de mensagens (rasa_nlu).\n", + "\n", + "* O comando `train-nlu` do Makefile executa o treinamento apenas do `rasa_nlu`" ] }, { "cell_type": "code", "execution_count": 2, "metadata": { - "scrolled": true + "scrolled": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "rasa_nlu: 0.13.7\n" + "make: Entering directory '/work/coach'\n", + "python3 -m rasa_nlu.train -c nlu_config.yml --fixed_model_name current \\\n", + "--data data/intents/ -o /src_models --project nlu --verbose\n", + "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.train' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.train'; this may result in unpredictable behaviour\n", + " warn(RuntimeWarning(msg))\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/geral.md is md\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 85 (7 distinct intents)\n", + "\t- Found intents: 'elogios', 'negar', 'despedir', 'diga_mais', 'tudo_bem', 'out_of_scope', 'cumprimentar'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + "\t- found entities: \n", + "\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/aleatorio.md is md\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 197 (24 distinct intents)\n", + "\t- Found intents: 'bff', 'filhos', 'license', 'de_onde_voce_eh', 'triste', 'religiao', 'playlist', 'signo', 'risada', 'time', 'comida', 'star_wars', 'cor', 'onde_voce_mora', 'esporte', 'piada', 'me', 'historia', 'linguagens', 
'filme', 'hobby', 'relationship', 'como_estou', 'genero'\n", + "\t- entity examples: 172 (22 distinct entities)\n", + "\t- found entities: 'filhos', 'starwars', 'license', 'triste', 'live', 'religiao', 'signo', 'cor', 'how', 'esporte', 'piada', 'me', 'historia', 'hobby', 'relationship', 'bff', 'playlist', 'comida', 'filme', 'linguagens', 'genero', 'where'\n", + "\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/actions.md is md\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 6 (1 distinct intents)\n", + "\t- Found intents: 'action_test'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + "\t- found entities: \n", + "\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 288 (32 distinct intents)\n", + "\t- Found intents: 'filhos', 'license', 'negar', 'action_test', 'triste', 'religiao', 'signo', 'time', 'star_wars', 'cor', 'elogios', 'esporte', 'piada', 'me', 'historia', 'hobby', 'relationship', 'tudo_bem', 'como_estou', 'cumprimentar', 'bff', 'despedir', 'de_onde_voce_eh', 'playlist', 'risada', 'comida', 'onde_voce_mora', 'linguagens', 'filme', 'diga_mais', 'out_of_scope', 'genero'\n", + "\t- entity examples: 172 (22 distinct entities)\n", + "\t- found entities: 'filhos', 'starwars', 'license', 'triste', 'live', 'religiao', 'signo', 'cor', 'how', 'esporte', 'piada', 'me', 'historia', 'hobby', 'relationship', 'bff', 'playlist', 'comida', 'filme', 'linguagens', 'genero', 'where'\n", + "\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + 
"2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", + "2019-07-17 16:30:03 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:03 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", + "\n", + "WARNING: The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", + "For more information, please see:\n", + " * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md\n", + " * https://github.com/tensorflow/addons\n", + "If you depend on functionality not listed there, please file an issue.\n", + "\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Use keras.layers.dense instead.\u001b[0m\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + 
"Colocations handled automatically by placer.\u001b[0m\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Use keras.layers.dropout instead.\u001b[0m\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.\u001b[0m\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Use tf.cast instead.\u001b[0m\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Deprecated in favor of operator or tf.math.divide.\u001b[0m\n", + "2019-07-17 16:30:06.320809: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:30:06.344961: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:30:06.345414: I 
tensorflow/compiler/xla/service/service.cc:150] XLA service 0x563c2cae7710 executing computations on platform Host. Devices:\n", + "2019-07-17 16:30:06.345467: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:30:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", + "Epochs: 100%|██████████| 300/300 [00:14<00:00, 25.65it/s, loss=0.101, acc=0.993]\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.101, train accuracy=0.993\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Successfully saved model into '/src_models/nlu/current'\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished training\n", + "make: Leaving directory '/work/coach'\n" ] } ], "source": [ - "import rasa_nlu\n", - "\n", - "print(\"rasa_nlu: {}\".format(rasa_nlu.__version__))" + "!make train-nlu -C $COACH_DIR_PATH" ] }, { "cell_type": "markdown", - "metadata": { - "colab_type": "text", - "id": "1xeXgpdwzOAl" - }, + "metadata": {}, "source": [ - "### Treinando o modelo do Rasa NLU" + "### Métodos de avaliação do chatbot\n", + "\n", + "* O Rasa fornece vários métodos de avaliação e validação das `intents`, para verificar como utiliza-los, cada método fornece um log, imagem, gráfico ou arquivo com dados relevantes para interpretação do chatbot." 
] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "Na celula abaixo todas as intents na pasta `../data/intents/` serão utilizadas para gerar a matrix de confuzão para de avaliação do bot.\n", + "* O comando `!python -m rasa_nlu.test` é a base para a avaliação do chatbot.\n", + "\n", + "* Na célula abaixo a flag `-h` foi utilizada para mostrar as funções e a forma de uso de cada uma delas, mude seus valores e flags para ter as informações desejadas na sua análise.\n", "\n", - "Ela irá treinar o modelo e executar a avaliação que pode ser verificada na saída da célula abaixo." + "* Atualmente o Rasa possui 2 modos, `evaluation` e `crossvalidation` que têm seções dedicadas a eles neste jupyter notebook." ] }, { "cell_type": "code", "execution_count": 3, "metadata": { - "colab": { - "autoexec": { - "startup": false, - "wait_interval": 0 - }, - "base_uri": "https://localhost:8080/", - "height": 377 - }, - "colab_type": "code", - "executionInfo": { - "elapsed": 2821, - "status": "ok", - "timestamp": 1521380062879, - "user": { - "displayName": "Alexander Weidauer", - "photoUrl": "//lh6.googleusercontent.com/-j4xnI5_PFWA/AAAAAAAAAAI/AAAAAAAAAAo/wPT2w5Bl3xg/s50-c-k-no/photo.jpg", - "userId": "100444450157165144272" - }, - "user_tz": -60 - }, - "id": "qHsAH49OePcM", - "outputId": "f840c42d-acf2-4fbf-b439-e5a239ffb32b", - "scrolled": false + "scrolled": true }, "outputs": [ { - "name": "stderr", + "name": "stdout", "output_type": "stream", "text": [ - "INFO:rasa_nlu.training_data.loading:Training data format of ../../bot/data/intents/random.md is md\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 237 (30 distinct intents)\n", - "\t- Found intents: 'me', 'religion', 'its_ok', 'playlist', 'where_u_liv', 'license', 'weather', 'towel', 'laugh', 'genre', 'book', 'sons', 'relationship', 'name', 'sport', 'color', 'food', 'story', 'how_am_i', 'languages', 'sad', 'movie', 'team', 'star_wars', 'where_r_u_from', 'joke', 
'bff', 'sign', 'creators', 'hobby'\n", - "\t- entity examples: 208 (28 distinct entities)\n", - "\t- found entities: 'religion', 'how', 'genre', 'book', 'relationship', 'name', 'ok', 'story', 'sad', 'movie', 'where', 'weather', 'bff', 'creators', 'hobby', 'me', 'playlist', 'license', 'towel', 'sons', 'sport', 'color', 'food', 'starwars', 'languages', 'joke', 'sign', 'live'\n", - "\n", - "INFO:rasa_nlu.training_data.loading:Training data format of ../../bot/data/intents/lappis.md is md\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 169 (14 distinct intents)\n", - "\t- Found intents: 'salic_api', 'meu_signo', 'software_livre', 'quem_eh_lappisudo', 'promova_cultura', 'como_contratar', 'pessoa_mais_cool', 'chatbot_tais', 'quais_tecnologias', 'o_que_eh_lappis', 'quais_projetos', 'zoacao_java', 'empurrando_juntos', 'salic_ml'\n", - "\t- entity examples: 0 (0 distinct entities)\n", - "\t- found entities: \n", - "\n", - "INFO:rasa_nlu.training_data.loading:Training data format of ../../bot/data/intents/general.md is md\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 125 (10 distinct intents)\n", - "\t- Found intents: 'despedir', 'tudo_bem', 'negar', 'erro_resposta_utter', 'diga_mais', 'quem_eh_voce', 'cumprimentar', 'out_of_scope', 'elogios', 'afirmar'\n", - "\t- entity examples: 0 (0 distinct entities)\n", - "\t- found entities: \n", - "\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 531 (54 distinct intents)\n", - "\t- Found intents: 'software_livre', 'religion', 'its_ok', 'where_u_liv', 'quais_tecnologias', 'cumprimentar', 'genre', 'book', 'relationship', 'name', 'salic_api', 'meu_signo', 'story', 'negar', 'out_of_scope', 'sad', 'movie', 'chatbot_tais', 'diga_mais', 'where_r_u_from', 'weather', 'bff', 'empurrando_juntos', 'creators', 'hobby', 'salic_ml', 'me', 'despedir', 'quem_eh_lappisudo', 'como_contratar', 
'playlist', 'pessoa_mais_cool', 'license', 'towel', 'quem_eh_voce', 'laugh', 'elogios', 'sons', 'zoacao_java', 'afirmar', 'sport', 'color', 'food', 'tudo_bem', 'promova_cultura', 'how_am_i', 'languages', 'erro_resposta_utter', 'team', 'star_wars', 'o_que_eh_lappis', 'quais_projetos', 'joke', 'sign'\n", - "\t- entity examples: 208 (28 distinct entities)\n", - "\t- found entities: 'religion', 'how', 'genre', 'book', 'relationship', 'name', 'ok', 'story', 'sad', 'movie', 'where', 'weather', 'bff', 'creators', 'hobby', 'me', 'playlist', 'license', 'towel', 'sons', 'sport', 'color', 'food', 'starwars', 'languages', 'joke', 'sign', 'live'\n", - "\n", - "INFO:rasa_nlu.model:Starting to train component tokenizer_whitespace\n", - "INFO:rasa_nlu.model:Finished training component.\n", - "INFO:rasa_nlu.model:Starting to train component ner_crf\n", - "INFO:rasa_nlu.model:Finished training component.\n", - "INFO:rasa_nlu.model:Starting to train component ner_synonyms\n", - "INFO:rasa_nlu.model:Finished training component.\n", - "INFO:rasa_nlu.model:Starting to train component intent_featurizer_count_vectors\n", - "INFO:rasa_nlu.model:Finished training component.\n", - "INFO:rasa_nlu.model:Starting to train component intent_classifier_tensorflow_embedding\n", - "INFO:rasa_nlu.classifiers.embedding_intent_classifier:Accuracy is updated every 10 epochs\n", - "Epochs: 100%|██████████| 300/300 [00:20<00:00, 14.71it/s, loss=0.143, acc=0.976]\n", - "INFO:rasa_nlu.classifiers.embedding_intent_classifier:Finished training embedding policy, loss=0.143, train accuracy=0.976\n", - "INFO:rasa_nlu.model:Finished training component.\n", - "INFO:rasa_nlu.model:Successfully saved model into '/work/notebooks/intents/models/nlu/default/current'\n" + "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.test' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.test'; this may result in unpredictable behaviour\r\n", + " 
warn(RuntimeWarning(msg))\r\n", + "usage: test.py [-h] [--debug] [-v] -d DATA [--mode MODE] [-c CONFIG]\r\n", + " [-m MODEL] [-f FOLDS] [--report [REPORT]]\r\n", + " [--successes [SUCCESSES]] [--errors ERRORS]\r\n", + " [--histogram HISTOGRAM] [--confmat CONFMAT]\r\n", + "\r\n", + "evaluate a Rasa NLU pipeline with cross validation or on external data\r\n", + "\r\n", + "optional arguments:\r\n", + " -h, --help show this help message and exit\r\n", + " --debug Print lots of debugging statements. Sets logging level\r\n", + " to DEBUG\r\n", + " -v, --verbose Be verbose. Sets logging level to INFO\r\n", + " -d DATA, --data DATA file containing training/evaluation data\r\n", + " --mode MODE evaluation|crossvalidation (evaluate pretrained model\r\n", + " or train model by crossvalidation)\r\n", + " -c CONFIG, --config CONFIG\r\n", + " model configuration file (crossvalidation only)\r\n", + " -m MODEL, --model MODEL\r\n", + " path to model (evaluation only)\r\n", + " -f FOLDS, --folds FOLDS\r\n", + " number of CV folds (crossvalidation only)\r\n", + " --report [REPORT] output path to save the intent/entitymetrics report\r\n", + " --successes [SUCCESSES]\r\n", + " output path to save successful predictions\r\n", + " --errors ERRORS output path to save model errors\r\n", + " --histogram HISTOGRAM\r\n", + " output path for the confidence histogram\r\n", + " --confmat CONFMAT output path for the confusion matrix plot\r\n" ] } ], "source": [ - "import os\n", - "\n", - "from rasa_nlu.training_data import load_data\n", - "from rasa_nlu.model import Trainer\n", - "from rasa_nlu import config\n", - "\n", - "\n", - "intents_directory = '../../bot/data/intents/'\n", - "\n", - "intents = {}\n", - "\n", - "for intent_file in os.listdir(intents_directory):\n", - " intent_file_path = os.path.join(intents_directory, intent_file)\n", - "\n", - " intents[intent_file] = {}\n", - "\n", - " intent_list = []\n", - " intent_name = None\n", - "\n", - " with open(intent_file_path) as f:\n", - " 
lines = f.readlines()\n", - "\n", - " for line in lines:\n", - " line = line.strip()\n", - "\n", - " if line.startswith('##'):\n", - " if intent_name is not None:\n", - " intents[intent_file][intent_name] = intent_list\n", - " intent_name = line.replace('## intent:', '') \n", - " intent_list = []\n", - "\n", - " elif line.startswith('- '):\n", - " intent_list.append(line.replace('- ', ''))\n", - "\n", - "\n", - "# loading the nlu training samples\n", - "training_data = load_data(intents_directory)\n", - "\n", - "# trainer to educate our pipeline\n", - "trainer = Trainer(config.load(\"../../bot/nlu_config.yml\"))\n", - "\n", - "# train the model!\n", - "interpreter = trainer.train(training_data)\n", - "\n", - "# store it for future use\n", - "model_directory = trainer.persist(\"./models/nlu\", fixed_model_name=\"current\")" + "!python -m rasa_nlu.test -h" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Evaluation" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "* O comando abaixo gera informações relevates para a validação das `intents` são elas:\n", + " * Matriz de confusão\n", + " * Histograma\n", + " * Erros de intents" ] }, { "cell_type": "code", "execution_count": 4, - "metadata": {}, + "metadata": { + "scrolled": true + }, "outputs": [ { - "name": "stderr", + "name": "stdout", "output_type": "stream", "text": [ - "INFO:tensorflow:Restoring parameters from /work/notebooks/intents/./models/nlu/default/current/intent_classifier_tensorflow_embedding.ckpt\n", - "INFO:rasa_nlu.training_data.loading:Training data format of ../../bot/data/intents/random.md is md\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 237 (30 distinct intents)\n", - "\t- Found intents: 'me', 'religion', 'its_ok', 'playlist', 'where_u_liv', 'license', 'weather', 'towel', 'laugh', 'genre', 'book', 'sons', 'relationship', 'name', 'sport', 'color', 'food', 'story', 'how_am_i', 'languages', 
'sad', 'movie', 'team', 'star_wars', 'where_r_u_from', 'joke', 'bff', 'sign', 'creators', 'hobby'\n", - "\t- entity examples: 208 (28 distinct entities)\n", - "\t- found entities: 'religion', 'how', 'genre', 'book', 'relationship', 'name', 'ok', 'story', 'sad', 'movie', 'where', 'weather', 'bff', 'creators', 'hobby', 'me', 'playlist', 'license', 'towel', 'sons', 'sport', 'color', 'food', 'starwars', 'languages', 'joke', 'sign', 'live'\n", - "\n", - "INFO:rasa_nlu.training_data.loading:Training data format of ../../bot/data/intents/lappis.md is md\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 169 (14 distinct intents)\n", - "\t- Found intents: 'salic_api', 'meu_signo', 'software_livre', 'quem_eh_lappisudo', 'promova_cultura', 'como_contratar', 'pessoa_mais_cool', 'chatbot_tais', 'quais_tecnologias', 'o_que_eh_lappis', 'quais_projetos', 'zoacao_java', 'empurrando_juntos', 'salic_ml'\n", + "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.test' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.test'; this may result in unpredictable behaviour\n", + " warn(RuntimeWarning(msg))\n", + "2019-07-17 16:31:33.800517: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:31:33.828980: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:31:33.829499: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x55c71b5187e0 executing computations on platform Host. 
Devices:\n", + "2019-07-17 16:31:33.829554: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:31:34 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/training/saver.py:1266: checkpoint_exists (from tensorflow.python.training.checkpoint_management) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Use standard file APIs to check for files with this prefix.\u001b[0m\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mtensorflow\u001b[0m - Restoring parameters from /models/nlu/current/component_4_EmbeddingIntentClassifier.ckpt\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/geral.md is md\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 85 (7 distinct intents)\n", + "\t- Found intents: 'cumprimentar', 'diga_mais', 'out_of_scope', 'despedir', 'tudo_bem', 'negar', 'elogios'\n", "\t- entity examples: 0 (0 distinct entities)\n", "\t- found entities: \n", "\n", - "INFO:rasa_nlu.training_data.loading:Training data format of ../../bot/data/intents/general.md is md\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 125 (10 distinct intents)\n", - "\t- Found intents: 'despedir', 'tudo_bem', 'negar', 'erro_resposta_utter', 'diga_mais', 'quem_eh_voce', 'cumprimentar', 'out_of_scope', 'elogios', 'afirmar'\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/aleatorio.md is md\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent 
examples: 197 (24 distinct intents)\n", + "\t- Found intents: 'relationship', 'me', 'time', 'bff', 'religiao', 'license', 'esporte', 'filhos', 'risada', 'historia', 'de_onde_voce_eh', 'piada', 'genero', 'linguagens', 'cor', 'signo', 'onde_voce_mora', 'playlist', 'filme', 'star_wars', 'triste', 'comida', 'como_estou', 'hobby'\n", + "\t- entity examples: 172 (22 distinct entities)\n", + "\t- found entities: 'me', 'bff', 'religiao', 'license', 'piada', 'cor', 'filme', 'triste', 'comida', 'where', 'relationship', 'how', 'live', 'esporte', 'historia', 'filhos', 'genero', 'linguagens', 'signo', 'starwars', 'playlist', 'hobby'\n", + "\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/actions.md is md\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 6 (1 distinct intents)\n", + "\t- Found intents: 'action_test'\n", "\t- entity examples: 0 (0 distinct entities)\n", "\t- found entities: \n", "\n", - "INFO:rasa_nlu.training_data.training_data:Training data stats: \n", - "\t- intent examples: 531 (54 distinct intents)\n", - "\t- Found intents: 'software_livre', 'religion', 'its_ok', 'where_u_liv', 'quais_tecnologias', 'cumprimentar', 'genre', 'book', 'relationship', 'name', 'salic_api', 'meu_signo', 'story', 'negar', 'out_of_scope', 'sad', 'movie', 'chatbot_tais', 'diga_mais', 'where_r_u_from', 'weather', 'bff', 'empurrando_juntos', 'creators', 'hobby', 'salic_ml', 'me', 'despedir', 'quem_eh_lappisudo', 'como_contratar', 'playlist', 'pessoa_mais_cool', 'license', 'towel', 'quem_eh_voce', 'laugh', 'elogios', 'sons', 'zoacao_java', 'afirmar', 'sport', 'color', 'food', 'tudo_bem', 'promova_cultura', 'how_am_i', 'languages', 'erro_resposta_utter', 'team', 'star_wars', 'o_que_eh_lappis', 'quais_projetos', 'joke', 'sign'\n", - "\t- entity examples: 208 (28 distinct 
entities)\n", - "\t- found entities: 'religion', 'how', 'genre', 'book', 'relationship', 'name', 'ok', 'story', 'sad', 'movie', 'where', 'weather', 'bff', 'creators', 'hobby', 'me', 'playlist', 'license', 'towel', 'sons', 'sport', 'color', 'food', 'starwars', 'languages', 'joke', 'sign', 'live'\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 288 (32 distinct intents)\n", + "\t- Found intents: 'me', 'cumprimentar', 'out_of_scope', 'bff', 'religiao', 'license', 'negar', 'elogios', 'risada', 'de_onde_voce_eh', 'piada', 'cor', 'filme', 'triste', 'comida', 'como_estou', 'relationship', 'action_test', 'despedir', 'hobby', 'esporte', 'filhos', 'historia', 'genero', 'linguagens', 'signo', 'diga_mais', 'playlist', 'tudo_bem', 'onde_voce_mora', 'time', 'star_wars'\n", + "\t- entity examples: 172 (22 distinct entities)\n", + "\t- found entities: 'me', 'bff', 'religiao', 'license', 'piada', 'cor', 'filme', 'triste', 'comida', 'where', 'relationship', 'how', 'live', 'esporte', 'historia', 'filhos', 'genero', 'linguagens', 'signo', 'starwars', 'playlist', 'hobby'\n", "\n", - "INFO:rasa_nlu.evaluate:Intent evaluation results:\n", - "INFO:rasa_nlu.evaluate:Intent Evaluation: Only considering those 531 examples that have a defined intent out of 531 examples\n", - "INFO:rasa_nlu.evaluate:F1-Score: 0.9747239685377217\n", - "INFO:rasa_nlu.evaluate:Precision: 0.9778755247681801\n", - "INFO:rasa_nlu.evaluate:Accuracy: 0.9736346516007532\n", - "INFO:rasa_nlu.evaluate:Classification report: \n", - " precision recall f1-score support\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 288/288 [00:00<00:00, 429.64it/s]\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent evaluation results:\n", + "2019-07-17 16:31:34 
\u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent Evaluation: Only considering those 288 examples that have a defined intent out of 288 examples\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - F1-Score: 0.9914054566832343\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Precision: 0.9942129629629629\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Accuracy: 0.9895833333333334\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Classification report: \n", + " precision recall f1-score support\n", "\n", - " 0.00 0.00 0.00 0\n", - " afirmar 0.87 1.00 0.93 13\n", - " bff 1.00 1.00 1.00 11\n", - " book 1.00 1.00 1.00 5\n", - " chatbot_tais 1.00 1.00 1.00 10\n", - " color 1.00 1.00 1.00 6\n", - " como_contratar 1.00 1.00 1.00 19\n", - " creators 1.00 0.83 0.91 6\n", - " cumprimentar 1.00 0.91 0.95 22\n", - " despedir 1.00 1.00 1.00 16\n", - " diga_mais 1.00 1.00 1.00 9\n", - " elogios 1.00 1.00 1.00 4\n", - " empurrando_juntos 1.00 1.00 1.00 6\n", - "erro_resposta_utter 1.00 1.00 1.00 6\n", - " food 1.00 1.00 1.00 8\n", - " genre 1.00 1.00 1.00 8\n", - " hobby 1.00 1.00 1.00 7\n", - " how_am_i 1.00 1.00 1.00 8\n", - " its_ok 1.00 0.90 0.95 10\n", - " joke 1.00 1.00 1.00 7\n", - " languages 0.93 0.93 0.93 14\n", - " laugh 1.00 1.00 1.00 13\n", - " license 1.00 0.91 0.95 11\n", - " me 1.00 1.00 1.00 7\n", - " meu_signo 0.94 0.94 0.94 17\n", - " movie 1.00 
1.00 1.00 4\n", - " name 1.00 1.00 1.00 4\n", - " negar 1.00 1.00 1.00 19\n", - " o_que_eh_lappis 0.77 1.00 0.87 10\n", - " out_of_scope 1.00 1.00 1.00 5\n", - " pessoa_mais_cool 1.00 1.00 1.00 19\n", - " playlist 1.00 1.00 1.00 8\n", - " promova_cultura 1.00 1.00 1.00 8\n", - " quais_projetos 1.00 1.00 1.00 20\n", - " quais_tecnologias 1.00 1.00 1.00 17\n", - " quem_eh_lappisudo 1.00 0.89 0.94 9\n", - " quem_eh_voce 0.90 0.90 0.90 21\n", - " relationship 1.00 1.00 1.00 10\n", - " religion 1.00 1.00 1.00 16\n", - " sad 1.00 1.00 1.00 7\n", - " salic_api 1.00 1.00 1.00 10\n", - " salic_ml 1.00 1.00 1.00 10\n", - " sign 0.67 0.67 0.67 3\n", - " software_livre 0.89 1.00 0.94 8\n", - " sons 1.00 1.00 1.00 11\n", - " sport 1.00 1.00 1.00 6\n", - " star_wars 1.00 1.00 1.00 10\n", - " story 1.00 1.00 1.00 6\n", - " team 1.00 1.00 1.00 7\n", - " towel 1.00 1.00 1.00 4\n", - " tudo_bem 0.82 0.90 0.86 10\n", - " weather 1.00 1.00 1.00 8\n", - " where_r_u_from 1.00 0.75 0.86 4\n", - " where_u_liv 1.00 1.00 1.00 8\n", - " zoacao_java 1.00 0.83 0.91 6\n", + " 0.00 0.00 0.00 0\n", + " action_test 1.00 1.00 1.00 6\n", + " bff 1.00 1.00 1.00 11\n", + " comida 1.00 1.00 1.00 8\n", + " como_estou 1.00 1.00 1.00 8\n", + " cor 1.00 1.00 1.00 6\n", + " cumprimentar 1.00 0.91 0.95 22\n", + "de_onde_voce_eh 1.00 1.00 1.00 4\n", + " despedir 1.00 1.00 1.00 16\n", + " diga_mais 1.00 1.00 1.00 9\n", + " elogios 1.00 1.00 1.00 4\n", + " esporte 1.00 1.00 1.00 6\n", + " filhos 1.00 1.00 1.00 11\n", + " filme 1.00 1.00 1.00 4\n", + " genero 1.00 1.00 1.00 8\n", + " historia 1.00 1.00 1.00 6\n", + " hobby 1.00 1.00 1.00 7\n", + " license 1.00 1.00 1.00 11\n", + " linguagens 1.00 0.93 0.96 14\n", + " me 1.00 1.00 1.00 6\n", + " negar 1.00 1.00 1.00 19\n", + " onde_voce_mora 1.00 1.00 1.00 8\n", + " out_of_scope 1.00 1.00 1.00 5\n", + " piada 1.00 1.00 1.00 7\n", + " playlist 1.00 1.00 1.00 8\n", + " relationship 1.00 1.00 1.00 10\n", + " religiao 1.00 1.00 1.00 16\n", + " risada 1.00 1.00 1.00 
13\n", + " signo 1.00 1.00 1.00 3\n", + " star_wars 1.00 1.00 1.00 10\n", + " time 1.00 1.00 1.00 5\n", + " triste 1.00 1.00 1.00 7\n", + " tudo_bem 0.83 1.00 0.91 10\n", "\n", - " avg / total 0.98 0.97 0.97 531\n", + " micro avg 0.99 0.99 0.99 288\n", + " macro avg 0.96 0.96 0.96 288\n", + " weighted avg 0.99 0.99 0.99 288\n", "\n", - "INFO:rasa_nlu.evaluate:There were some nlu intent classification errors. Use `--verbose` to show them in the log.\n", - "INFO:rasa_nlu.evaluate:Model prediction errors saved to errors.json.\n", - "INFO:rasa_nlu.evaluate:Confusion matrix, without normalization: \n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Model prediction errors saved to errors.json.\n", + "2019-07-17 16:31:35 \u001b[1;30mINFO \u001b[0m \u001b[34mmatplotlib.font_manager\u001b[0m - font search path ['/usr/local/lib/python3.6/site-packages/matplotlib/mpl-data/fonts/ttf', '/usr/local/lib/python3.6/site-packages/matplotlib/mpl-data/fonts/afm', '/usr/local/lib/python3.6/site-packages/matplotlib/mpl-data/fonts/pdfcorefonts']\n", + "2019-07-17 16:31:36 \u001b[1;30mINFO \u001b[0m \u001b[34mmatplotlib.font_manager\u001b[0m - generated new fontManager\n", + "2019-07-17 16:31:38 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Confusion matrix, without normalization: \n", "[[ 0 0 0 ... 0 0 0]\n", - " [ 0 13 0 ... 0 0 0]\n", + " [ 0 6 0 ... 0 0 0]\n", " [ 0 0 11 ... 0 0 0]\n", " ...\n", - " [ 0 0 0 ... 3 0 0]\n", - " [ 0 0 0 ... 0 8 0]\n", - " [ 0 0 0 ... 0 0 5]]\n" + " [ 0 0 0 ... 5 0 0]\n", + " [ 0 0 0 ... 0 7 0]\n", + " [ 0 0 0 ... 0 0 10]]\n", + "Figure(2000x2000)\n", + "Figure(1000x1000)\n", + "2019-07-17 16:31:43 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity evaluation results:\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Evaluation for entity extractor: CRFEntityExtractor \n" ] }, { - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - }, - { - "data": { - "image/png": "\n", - "text/plain": [ - "
" - ] - }, - "metadata": { - "needs_background": "light" - }, - "output_type": "display_data" - }, - { - "name": "stderr", + "name": "stdout", "output_type": "stream", "text": [ - "INFO:rasa_nlu.evaluate:Entity evaluation results:\n", - "INFO:rasa_nlu.evaluate:Evaluation for entity extractor: ner_crf \n", - "INFO:rasa_nlu.evaluate:F1-Score: 0.9907693995778069\n", - "INFO:rasa_nlu.evaluate:Precision: 0.9915729577474618\n", - "INFO:rasa_nlu.evaluate:Accuracy: 0.9909584086799277\n", - "INFO:rasa_nlu.evaluate:Classification report: \n", - " precision recall f1-score support\n", - "\n", - " bff 1.00 1.00 1.00 17\n", - " book 1.00 1.00 1.00 5\n", - " color 1.00 1.00 1.00 13\n", - " creators 1.00 0.86 0.92 7\n", - " food 1.00 1.00 1.00 17\n", - " genre 0.83 1.00 0.91 15\n", - " hobby 1.00 1.00 1.00 11\n", - " how 1.00 1.00 1.00 24\n", - " joke 1.00 1.00 1.00 7\n", - " languages 1.00 0.93 0.96 14\n", - " license 1.00 0.86 0.92 14\n", - " live 1.00 1.00 1.00 13\n", - " me 1.00 0.86 0.92 7\n", - " movie 1.00 1.00 1.00 4\n", - " name 1.00 1.00 1.00 4\n", - " no_entity 0.99 1.00 0.99 1379\n", - " ok 0.93 0.93 0.93 15\n", - " playlist 1.00 1.00 1.00 7\n", - "relationship 1.00 1.00 1.00 9\n", - " religion 1.00 1.00 1.00 16\n", - " sad 1.00 1.00 1.00 7\n", - " sign 0.50 0.67 0.57 3\n", - " sons 1.00 1.00 1.00 11\n", - " sport 1.00 1.00 1.00 6\n", - " starwars 1.00 1.00 1.00 13\n", - " story 1.00 1.00 1.00 6\n", - " towel 1.00 1.00 1.00 4\n", - " weather 1.00 1.00 1.00 8\n", - " where 1.00 0.33 0.50 3\n", - "\n", - " avg / total 0.99 0.99 0.99 1659\n", - "\n" + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - F1-Score: 1.0\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Precision: 1.0\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Accuracy: 1.0\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Classification report: \r\n", + " precision 
recall f1-score support\r\n", + "\r\n", + " bff 1.00 1.00 1.00 17\r\n", + " comida 1.00 1.00 1.00 17\r\n", + " cor 1.00 1.00 1.00 13\r\n", + " esporte 1.00 1.00 1.00 6\r\n", + " filhos 1.00 1.00 1.00 11\r\n", + " filme 1.00 1.00 1.00 4\r\n", + " genero 1.00 1.00 1.00 15\r\n", + " historia 1.00 1.00 1.00 6\r\n", + " hobby 1.00 1.00 1.00 11\r\n", + " how 1.00 1.00 1.00 24\r\n", + " license 1.00 1.00 1.00 14\r\n", + " linguagens 1.00 1.00 1.00 14\r\n", + " live 1.00 1.00 1.00 13\r\n", + " me 1.00 1.00 1.00 6\r\n", + " no_entity 1.00 1.00 1.00 613\r\n", + " piada 1.00 1.00 1.00 7\r\n", + " playlist 1.00 1.00 1.00 7\r\n", + "relationship 1.00 1.00 1.00 9\r\n", + " religiao 1.00 1.00 1.00 16\r\n", + " signo 1.00 1.00 1.00 3\r\n", + " starwars 1.00 1.00 1.00 13\r\n", + " triste 1.00 1.00 1.00 7\r\n", + " where 1.00 1.00 1.00 3\r\n", + "\r\n", + " micro avg 1.00 1.00 1.00 849\r\n", + " macro avg 1.00 1.00 1.00 849\r\n", + "weighted avg 1.00 1.00 1.00 849\r\n", + "\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished evaluation\r\n" ] } ], "source": [ - "from rasa_nlu.evaluate import run_evaluation\n", - "run_evaluation('../../bot/data/intents/', model_directory)" + "!python -m rasa_nlu.test -d $COACH_INTENTS_PATH -m $COACH_MODELS_NLU_PATH --mode evaluation" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "### Lista de Problemas\n", - "\n", - "O arquivo `erros,json` mostra os erros encontrados após executar o comando `rasa_nlu.evaluate.run_evaluation`.\n", - "\n", - "Normalmente os erros mostrados são textos repetidos nos exemplos de diferrentes `intents`.\n", - "\n", - "Caso o arquivo não seja gerado significa que não foram encontrados erros." 
+ "#### Matriz de Confusão\n", + "* A matriz de confusão mostra a correlação entre as intents.\n", + "* A diagonal principal tem forte correlação pois mostra a relação de uma intent **com ela mesma**\n", + "* O ideal é que não haja **nenhum valor** diferente de **0 fora da diagonal principal**." ] }, { "cell_type": "code", "execution_count": 5, + "metadata": { + "scrolled": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " \n", + " " + ], + "text/plain": [ + "" + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "IFrame(src='./confmat.png', width=900, height=700)" + ] + }, + { + "cell_type": "markdown", "metadata": {}, + "source": [ + "#### Erros\n", + "* O arquivo `errors.json` mostra os erros encontrados. Este arquivo lista os mesmos erros mostrados na **matriz de confusão**, então caso ela fique muito grande, não se preocupe, pois você pode apenas procurar os erros no arquivo gerado.\n", + "* Os erros mostrados são textos repetidos nos exemplos de diferentes `intents`.\n", + "* Caso o arquivo não seja gerado significa que não foram encontrados erros."
+ ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "scrolled": true + }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "{\r\n", - " \"intent_errors\": [\r\n", - " {\r\n", - " \"text\": \"software livre\",\r\n", - " \"intent\": \"license\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"software_livre\",\r\n", - " \"confidence\": 0.8758267164230347\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"e o c#\",\r\n", - " \"intent\": \"languages\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"\",\r\n", - " \"confidence\": 0.0\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"Tudo bem?\",\r\n", - " \"intent\": \"its_ok\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"afirmar\",\r\n", - " \"confidence\": 0.6227023005485535\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"onde voce nasceu?\",\r\n", - " \"intent\": \"where_r_u_from\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"quem_eh_voce\",\r\n", - " \"confidence\": 0.7670958042144775\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"Quem te fez?\",\r\n", - " \"intent\": \"creators\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"o_que_eh_lappis\",\r\n", - " \"confidence\": 0.8802075982093811\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"Qual o seu signo?\",\r\n", - " \"intent\": \"sign\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"meu_signo\",\r\n", - " \"confidence\": 0.7709224820137024\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"chatbot\",\r\n", - " \"intent\": \"quem_eh_lappisudo\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"quem_eh_voce\",\r\n", - " \"confidence\": 0.8417193293571472\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"signo\",\r\n", - " \"intent\": \"meu_signo\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"sign\",\r\n", - " \"confidence\": 0.7748193740844727\r\n", - " }\r\n", - " 
},\r\n", - " {\r\n", - " \"text\": \"java\",\r\n", - " \"intent\": \"zoacao_java\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"languages\",\r\n", - " \"confidence\": 0.7685664892196655\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"como vai\",\r\n", - " \"intent\": \"cumprimentar\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"tudo_bem\",\r\n", - " \"confidence\": 0.7766595482826233\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"tudo bom\",\r\n", - " \"intent\": \"cumprimentar\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"tudo_bem\",\r\n", - " \"confidence\": 0.777603030204773\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"Tudo bem\",\r\n", - " \"intent\": \"tudo_bem\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"afirmar\",\r\n", - " \"confidence\": 0.6227023005485535\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"Quem te criou?\",\r\n", - " \"intent\": \"quem_eh_voce\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"o_que_eh_lappis\",\r\n", - " \"confidence\": 0.8640211820602417\r\n", - " }\r\n", - " },\r\n", - " {\r\n", - " \"text\": \"Quem te desenvolveu?\",\r\n", - " \"intent\": \"quem_eh_voce\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"o_que_eh_lappis\",\r\n", - " \"confidence\": 0.8942159414291382\r\n", - " }\r\n", + "[\r\n", + " {\r\n", + " \"text\": \"como vai\",\r\n", + " \"intent\": \"cumprimentar\",\r\n", + " \"intent_prediction\": {\r\n", + " \"name\": \"tudo_bem\",\r\n", + " \"confidence\": 0.7145657539367676\r\n", + " }\r\n", + " },\r\n", + " {\r\n", + " \"text\": \"tudo bom\",\r\n", + " \"intent\": \"cumprimentar\",\r\n", + " \"intent_prediction\": {\r\n", + " \"name\": \"tudo_bem\",\r\n", + " \"confidence\": 0.7155274152755737\r\n", + " }\r\n", + " },\r\n", + " {\r\n", + " \"text\": \"e o c#\",\r\n", + " \"intent\": \"linguagens\",\r\n", + " \"intent_prediction\": {\r\n", + " \"name\": \"\",\r\n", + " \"confidence\": 
0.0\r\n", " }\r\n", - " ]\r\n", - "}" + " }\r\n", + "]" ] } ], @@ -551,86 +497,254 @@ }, { "cell_type": "markdown", - "metadata": { - "colab_type": "text", - "id": "1xeXgpdwzOAl" - }, + "metadata": {}, "source": [ - "### Avaliação do modelo de NLU treinado\n", + "#### Histograma\n", "\n", - "Caso queira testar mensagens específicas mande a mensagem na célula seguinte:" + "* O histograma contém a distribuição das predições das `intents`" ] }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 7, + "metadata": { + "scrolled": false + }, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " \n", + " " + ], + "text/plain": [ + "" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "IFrame(src='./hist.png', width=900, height=700)" + ] + }, + { + "cell_type": "markdown", "metadata": {}, + "source": [ + "### Crossvalidation" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": { + "scrolled": true + }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "{\n", - " \"intent\": {\n", - " \"name\": \"quem_eh_voce\",\n", - " \"confidence\": 0.8361726403236389\n", - " },\n", - " \"entities\": [],\n", - " \"intent_ranking\": [\n", - " {\n", - " \"name\": \"quem_eh_voce\",\n", - " \"confidence\": 0.8361726403236389\n", - " },\n", - " {\n", - " \"name\": \"where_r_u_from\",\n", - " \"confidence\": 0.3619411289691925\n", - " },\n", - " {\n", - " \"name\": \"despedir\",\n", - " \"confidence\": 0.3474047780036926\n", - " },\n", - " {\n", - " \"name\": \"genre\",\n", - " \"confidence\": 0.2647324502468109\n", - " },\n", - " {\n", - " \"name\": \"sign\",\n", - " \"confidence\": 0.2186793088912964\n", - " },\n", - " {\n", - " \"name\": \"cumprimentar\",\n", - " \"confidence\": 0.20706906914710999\n", - " },\n", - " {\n", - " \"name\": \"meu_signo\",\n", - " \"confidence\": 0.19841191172599792\n", - " },\n", - " {\n", - " \"name\": \"story\",\n", - " \"confidence\":
0.18699833750724792\n", - " },\n", - " {\n", - " \"name\": \"laugh\",\n", - " \"confidence\": 0.1862882375717163\n", - " },\n", - " {\n", - " \"name\": \"erro_resposta_utter\",\n", - " \"confidence\": 0.15251879394054413\n", - " }\n", - " ],\n", - " \"text\": \"O que \\u00e9 um bot?\"\n", - "}\n" + "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.test' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.test'; this may result in unpredictable behaviour\n", + " warn(RuntimeWarning(msg))\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/geral.md is md\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 85 (7 distinct intents)\n", + "\t- Found intents: 'cumprimentar', 'tudo_bem', 'negar', 'elogios', 'despedir', 'out_of_scope', 'diga_mais'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + "\t- found entities: \n", + "\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/aleatorio.md is md\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 197 (24 distinct intents)\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'comida', 'cor', 'historia', 'triste', 'como_estou', 'filme', 'star_wars', 'relationship', 'esporte', 'signo', 'me', 'linguagens', 'de_onde_voce_eh', 'religiao', 'hobby', 'playlist', 'license', 'onde_voce_mora'\n", + "\t- entity examples: 172 (22 distinct entities)\n", + "\t- found entities: 'live', 'filhos', 'genero', 'relationship', 'linguagens', 'me', 'hobby', 'starwars', 'playlist', 'license', 'bff', 'piada', 'comida', 'cor', 'historia', 
'triste', 'where', 'filme', 'how', 'esporte', 'signo', 'religiao'\n", + "\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/actions.md is md\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 6 (1 distinct intents)\n", + "\t- Found intents: 'action_test'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + "\t- found entities: \n", + "\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 288 (32 distinct intents)\n", + "\t- Found intents: 'filhos', 'genero', 'time', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'tudo_bem', 'linguagens', 'me', 'hobby', 'playlist', 'license', 'onde_voce_mora', 'bff', 'risada', 'piada', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'elogios', 'filme', 'action_test', 'esporte', 'signo', 'de_onde_voce_eh', 'despedir', 'religiao', 'diga_mais'\n", + "\t- entity examples: 172 (22 distinct entities)\n", + "\t- found entities: 'live', 'filhos', 'genero', 'relationship', 'linguagens', 'me', 'hobby', 'starwars', 'playlist', 'license', 'bff', 'piada', 'comida', 'cor', 'historia', 'triste', 'where', 'filme', 'how', 'esporte', 'signo', 'religiao'\n", + "\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 273 (28 distinct intents)\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- 
entity examples: 162 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", + "\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 131 (28 distinct intents)\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 79 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", + "\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 142 (28 distinct intents)\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 83 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", + "\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - 
Starting to train component WhitespaceTokenizer\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", + "\n", + "WARNING: The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", + "For more information, please see:\n", + " * https://github.com/tensorflow/community/blob/master/rfcs/20180907-contrib-sunset.md\n", + " * https://github.com/tensorflow/addons\n", + "If you depend on functionality not listed there, please file an issue.\n", + "\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Use keras.layers.dense instead.\u001b[0m\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom 
/usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Colocations handled automatically by placer.\u001b[0m\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Use keras.layers.dropout instead.\u001b[0m\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Please use `rate` instead of `keep_prob`. 
Rate should be set to `rate = 1 - keep_prob`.\u001b[0m\n", + "2019-07-17 16:32:22 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Use tf.cast instead.\u001b[0m\n", + "2019-07-17 16:32:22 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "Instructions for updating:\n", + "Deprecated in favor of operator or tf.math.divide.\u001b[0m\n" + ] + }, + { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-07-17 16:32:22.678227: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:32:22.700933: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:32:22.701522: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x55be5a7c66c0 executing computations on platform Host. 
Devices:\n", + "2019-07-17 16:32:22.701579: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:32:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", + "Epochs: 100%|██████████| 300/300 [00:05<00:00, 53.69it/s, loss=0.194, acc=0.992]\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.194, train accuracy=0.992\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 131/131 [00:00<00:00, 435.20it/s]\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 142/142 [00:00<00:00, 527.33it/s]\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in 
labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 142 (28 distinct intents)\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 83 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", + "\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 131 (28 distinct intents)\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 79 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", + "\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO 
\u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", + "2019-07-17 16:32:30 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", + "Epochs: 100%|██████████| 300/300 [00:06<00:00, 45.43it/s, loss=0.188, acc=1.000]\n", + "2019-07-17 16:32:36 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.188, train accuracy=1.000\n", + "2019-07-17 16:32:36 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:36 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 142/142 [00:00<00:00, 433.04it/s]\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: 
UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 131/131 [00:00<00:00, 569.47it/s]\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - CV evaluation (n=2)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent evaluation results\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Accuracy: 0.993 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train F1-score: 0.994 (0.002)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Precision: 0.997 (0.003)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Accuracy: 
0.536 (0.029)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test F1-score: 0.561 (0.031)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Precision: 0.681 (0.027)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity evaluation results\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity extractor: CRFEntityExtractor\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Accuracy: 1.000 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train F1-score: 1.000 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Precision: 1.000 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity extractor: CRFEntityExtractor\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Accuracy: 0.826 (0.004)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test F1-score: 0.776 (0.001)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Precision: 0.810 (0.033)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished evaluation\n" ] } ], "source": [ - "pprint(interpreter.parse('O que é um bot?'))" + "!python -m rasa_nlu.test -d $COACH_INTENTS_PATH -c $COACH_NLU_CONFIG_PATH --mode crossvalidation --folds 2 --report" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Referências:\n", + "\n", + "O Rasa está em constante evolução, alguns links úteis para a construção deste jupyter-notebook e para a análise das `intents` são:\n", + "\n", + "* [Evaluation](https://rasa.com/docs/nlu/evaluation/)" ] }, { "cell_type": "code", "execution_count": null, - "metadata": {}, + "metadata": { + "scrolled": true + }, "outputs": 
[], "source": [] } @@ -670,7 +784,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.8" + "version": "3.6.9" } }, "nbformat": 4, diff --git a/notebooks/intents/intents-analysis.ipynb b/notebooks/intents/intents-analysis.ipynb index ca6900e0..c15cddbf 100644 --- a/notebooks/intents/intents-analysis.ipynb +++ b/notebooks/intents/intents-analysis.ipynb @@ -32,14 +32,6 @@ "text": [ "rasa_nlu: 0.15.0\n" ] - }, - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n" - ] } ], "source": [ @@ -67,56 +59,54 @@ "cell_type": "code", "execution_count": 2, "metadata": { - "scrolled": true + "scrolled": false }, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ - "make: Entering directory '/work/bot'\n", + "make: Entering directory '/work/coach'\n", "python3 -m rasa_nlu.train -c nlu_config.yml --fixed_model_name current \\\n", - " --data data/intents/ -o models --project nlu --verbose\n", - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", + "--data data/intents/ -o /src_models --project nlu --verbose\n", "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.train' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.train'; this may result in unpredictable behaviour\n", " warn(RuntimeWarning(msg))\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/aleatorio.md is md\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + 
"2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/geral.md is md\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 85 (7 distinct intents)\n", + "\t- Found intents: 'elogios', 'negar', 'despedir', 'diga_mais', 'tudo_bem', 'out_of_scope', 'cumprimentar'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + "\t- found entities: \n", + "\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/aleatorio.md is md\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 197 (24 distinct intents)\n", - "\t- Found intents: 'historia', 'de_onde_voce_eh', 'triste', 'filhos', 'hobby', 'signo', 'como_estou', 'piada', 'playlist', 'time', 'genero', 'relationship', 'bff', 'esporte', 'risada', 'star_wars', 'religiao', 'cor', 'linguagens', 'filme', 'me', 'onde_voce_mora', 'comida', 'license'\n", + "\t- Found intents: 'bff', 'filhos', 'license', 'de_onde_voce_eh', 'triste', 'religiao', 'playlist', 'signo', 'risada', 'time', 'comida', 'star_wars', 'cor', 'onde_voce_mora', 'esporte', 'piada', 'me', 'historia', 'linguagens', 'filme', 'hobby', 'relationship', 'como_estou', 'genero'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- found entities: 'historia', 'filhos', 'hobby', 'playlist', 'genero', 'esporte', 'linguagens', 'filme', 'me', 'where', 'comida', 'triste', 'signo', 'starwars', 'piada', 'how', 'relationship', 'bff', 'live', 'religiao', 'cor', 'license'\n", + "\t- found entities: 'filhos', 'starwars', 'license', 'triste', 'live', 'religiao', 'signo', 'cor', 'how', 'esporte', 'piada', 'me', 'historia', 'hobby', 'relationship', 'bff', 'playlist', 'comida', 'filme', 'linguagens', 
'genero', 'where'\n", "\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/actions.md is md\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/actions.md is md\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 6 (1 distinct intents)\n", "\t- Found intents: 'action_test'\n", "\t- entity examples: 0 (0 distinct entities)\n", "\t- found entities: \n", "\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/geral.md is md\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", - "\t- intent examples: 85 (7 distinct intents)\n", - "\t- Found intents: 'elogios', 'out_of_scope', 'negar', 'despedir', 'diga_mais', 'cumprimentar', 'tudo_bem'\n", - "\t- entity examples: 0 (0 distinct entities)\n", - "\t- found entities: \n", - "\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 288 (32 distinct intents)\n", - "\t- Found intents: 'historia', 'de_onde_voce_eh', 'out_of_scope', 'filhos', 'hobby', 'playlist', 'diga_mais', 'genero', 'esporte', 'star_wars', 'negar', 'linguagens', 'filme', 'me', 'comida', 'elogios', 'triste', 'signo', 'como_estou', 'piada', 'time', 'relationship', 'tudo_bem', 'bff', 'risada', 'action_test', 'religiao', 'despedir', 'cor', 
'onde_voce_mora', 'cumprimentar', 'license'\n", + "\t- Found intents: 'filhos', 'license', 'negar', 'action_test', 'triste', 'religiao', 'signo', 'time', 'star_wars', 'cor', 'elogios', 'esporte', 'piada', 'me', 'historia', 'hobby', 'relationship', 'tudo_bem', 'como_estou', 'cumprimentar', 'bff', 'despedir', 'de_onde_voce_eh', 'playlist', 'risada', 'comida', 'onde_voce_mora', 'linguagens', 'filme', 'diga_mais', 'out_of_scope', 'genero'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- found entities: 'historia', 'filhos', 'hobby', 'playlist', 'genero', 'esporte', 'linguagens', 'filme', 'me', 'where', 'comida', 'triste', 'signo', 'starwars', 'piada', 'how', 'relationship', 'bff', 'live', 'religiao', 'cor', 'license'\n", + "\t- found entities: 'filhos', 'starwars', 'license', 'triste', 'live', 'religiao', 'signo', 'cor', 'how', 'esporte', 'piada', 'me', 'historia', 'hobby', 'relationship', 'bff', 'playlist', 'comida', 'filme', 'linguagens', 'genero', 'where'\n", "\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:31 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", - "2019-05-03 21:20:32 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished 
training component.\n", - "2019-05-03 21:20:32 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:02 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", + "2019-07-17 16:30:03 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:03 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", "\n", "WARNING: The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", "For more information, please see:\n", @@ -124,40 +114,40 @@ " * https://github.com/tensorflow/addons\n", "If you depend on functionality not listed there, please file an issue.\n", "\n", - "2019-05-03 21:20:32 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m 
\u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use keras.layers.dense instead.\u001b[0m\n", - "2019-05-03 21:20:32 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Colocations handled automatically by placer.\u001b[0m\n", - "2019-05-03 21:20:32 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use keras.layers.dropout instead.\u001b[0m\n", - "2019-05-03 21:20:32 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future 
version.\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.\u001b[0m\n", - "2019-05-03 21:20:32 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use tf.cast instead.\u001b[0m\n", - "2019-05-03 21:20:32 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:30:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Deprecated in favor of operator or tf.math.divide.\u001b[0m\n", - "2019-05-03 21:20:33.153976: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", - "2019-05-03 21:20:33.173206: I 
tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2905000000 Hz\n", - "2019-05-03 21:20:33.173981: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x559bc71337e0 executing computations on platform Host. Devices:\n", - "2019-05-03 21:20:33.174055: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", - "2019-05-03 21:20:33 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", - "Epochs: 100%|██████████| 300/300 [00:09<00:00, 30.99it/s, loss=0.115, acc=0.993]\n", - "2019-05-03 21:20:42 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.115, train accuracy=0.993\n", - "2019-05-03 21:20:42 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:43 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Successfully saved model into '/work/bot/models/nlu/current'\n", - "2019-05-03 21:20:43 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished training\n", - "make: Leaving directory '/work/bot'\n" + "2019-07-17 16:30:06.320809: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:30:06.344961: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:30:06.345414: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x563c2cae7710 executing computations on platform Host. 
Devices:\n", + "2019-07-17 16:30:06.345467: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:30:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", + "Epochs: 100%|██████████| 300/300 [00:14<00:00, 25.65it/s, loss=0.101, acc=0.993]\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.101, train accuracy=0.993\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Successfully saved model into '/src_models/nlu/current'\n", + "2019-07-17 16:30:20 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished training\n", + "make: Leaving directory '/work/coach'\n" ] } ], "source": [ - "!make train-nlu -C $BOT_DIR_PATH" + "!make train-nlu -C $COACH_DIR_PATH" ] }, { @@ -191,38 +181,36 @@ "name": "stdout", "output_type": "stream", "text": [ - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", - "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.test' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.test'; this may result in unpredictable behaviour\n", - " warn(RuntimeWarning(msg))\n", - "usage: test.py [-h] [--debug] [-v] -d DATA [--mode MODE] [-c CONFIG]\n", - " [-m MODEL] [-f FOLDS] [--report [REPORT]]\n", - " [--successes [SUCCESSES]] [--errors ERRORS]\n", - " [--histogram HISTOGRAM] [--confmat CONFMAT]\n", - "\n", - "evaluate a Rasa NLU pipeline with cross validation or on external data\n", - "\n", - "optional arguments:\n", - " -h, --help show this 
help message and exit\n", - " --debug Print lots of debugging statements. Sets logging level\n", - " to DEBUG\n", - " -v, --verbose Be verbose. Sets logging level to INFO\n", - " -d DATA, --data DATA file containing training/evaluation data\n", - " --mode MODE evaluation|crossvalidation (evaluate pretrained model\n", - " or train model by crossvalidation)\n", - " -c CONFIG, --config CONFIG\n", - " model configuration file (crossvalidation only)\n", - " -m MODEL, --model MODEL\n", - " path to model (evaluation only)\n", - " -f FOLDS, --folds FOLDS\n", - " number of CV folds (crossvalidation only)\n", - " --report [REPORT] output path to save the intent/entitymetrics report\n", - " --successes [SUCCESSES]\n", - " output path to save successful predictions\n", - " --errors ERRORS output path to save model errors\n", - " --histogram HISTOGRAM\n", - " output path for the confidence histogram\n", - " --confmat CONFMAT output path for the confusion matrix plot\n" + "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.test' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.test'; this may result in unpredictable behaviour\r\n", + " warn(RuntimeWarning(msg))\r\n", + "usage: test.py [-h] [--debug] [-v] -d DATA [--mode MODE] [-c CONFIG]\r\n", + " [-m MODEL] [-f FOLDS] [--report [REPORT]]\r\n", + " [--successes [SUCCESSES]] [--errors ERRORS]\r\n", + " [--histogram HISTOGRAM] [--confmat CONFMAT]\r\n", + "\r\n", + "evaluate a Rasa NLU pipeline with cross validation or on external data\r\n", + "\r\n", + "optional arguments:\r\n", + " -h, --help show this help message and exit\r\n", + " --debug Print lots of debugging statements. Sets logging level\r\n", + " to DEBUG\r\n", + " -v, --verbose Be verbose. 
Sets logging level to INFO\r\n", + " -d DATA, --data DATA file containing training/evaluation data\r\n", + " --mode MODE evaluation|crossvalidation (evaluate pretrained model\r\n", + " or train model by crossvalidation)\r\n", + " -c CONFIG, --config CONFIG\r\n", + " model configuration file (crossvalidation only)\r\n", + " -m MODEL, --model MODEL\r\n", + " path to model (evaluation only)\r\n", + " -f FOLDS, --folds FOLDS\r\n", + " number of CV folds (crossvalidation only)\r\n", + " --report [REPORT] output path to save the intent/entitymetrics report\r\n", + " --successes [SUCCESSES]\r\n", + " output path to save successful predictions\r\n", + " --errors ERRORS output path to save model errors\r\n", + " --histogram HISTOGRAM\r\n", + " output path for the confidence histogram\r\n", + " --confmat CONFMAT output path for the confusion matrix plot\r\n" ] } ], @@ -242,7 +230,7 @@ "metadata": {}, "source": [ "* O comando abaixo gera informações relevates para a validação das `intents` são elas:\n", - " * Matriz de confuzão\n", + " * Matriz de confusão\n", " * Histograma\n", " * Erros de intents" ] @@ -258,57 +246,55 @@ "name": "stdout", "output_type": "stream", "text": [ - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.test' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.test'; this may result in unpredictable behaviour\n", " warn(RuntimeWarning(msg))\n", - "2019-05-03 21:20:46.960890: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", - "2019-05-03 21:20:46.979691: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2905000000 Hz\n", - "2019-05-03 21:20:46.979956: I 
tensorflow/compiler/xla/service/service.cc:150] XLA service 0x565180f44560 executing computations on platform Host. Devices:\n", - "2019-05-03 21:20:46.979989: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", - "2019-05-03 21:20:47 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/training/saver.py:1266: checkpoint_exists (from tensorflow.python.training.checkpoint_management) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:31:33.800517: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:31:33.828980: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:31:33.829499: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x55c71b5187e0 executing computations on platform Host. 
Devices:\n", + "2019-07-17 16:31:33.829554: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:31:34 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/training/saver.py:1266: checkpoint_exists (from tensorflow.python.training.checkpoint_management) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use standard file APIs to check for files with this prefix.\u001b[0m\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mtensorflow\u001b[0m - Restoring parameters from ../../bot/models/nlu/current/component_4_EmbeddingIntentClassifier.ckpt\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../bot/data/intents/aleatorio.md is md\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mtensorflow\u001b[0m - Restoring parameters from /models/nlu/current/component_4_EmbeddingIntentClassifier.ckpt\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/geral.md is md\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 85 (7 distinct intents)\n", + "\t- Found intents: 'cumprimentar', 'diga_mais', 'out_of_scope', 'despedir', 'tudo_bem', 'negar', 'elogios'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + "\t- found entities: \n", + "\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/aleatorio.md is md\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m 
\u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 197 (24 distinct intents)\n", - "\t- Found intents: 'de_onde_voce_eh', 'me', 'esporte', 'risada', 'cor', 'signo', 'hobby', 'star_wars', 'linguagens', 'triste', 'historia', 'religiao', 'time', 'filme', 'relationship', 'onde_voce_mora', 'genero', 'playlist', 'bff', 'piada', 'filhos', 'license', 'comida', 'como_estou'\n", + "\t- Found intents: 'relationship', 'me', 'time', 'bff', 'religiao', 'license', 'esporte', 'filhos', 'risada', 'historia', 'de_onde_voce_eh', 'piada', 'genero', 'linguagens', 'cor', 'signo', 'onde_voce_mora', 'playlist', 'filme', 'star_wars', 'triste', 'comida', 'como_estou', 'hobby'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- found entities: 'signo', 'triste', 'linguagens', 'live', 'filme', 'relationship', 'where', 'genero', 'playlist', 'bff', 'starwars', 'piada', 'filhos', 'license', 'comida', 'me', 'esporte', 'cor', 'hobby', 'religiao', 'how', 'historia'\n", + "\t- found entities: 'me', 'bff', 'religiao', 'license', 'piada', 'cor', 'filme', 'triste', 'comida', 'where', 'relationship', 'how', 'live', 'esporte', 'historia', 'filhos', 'genero', 'linguagens', 'signo', 'starwars', 'playlist', 'hobby'\n", "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../bot/data/intents/actions.md is md\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/actions.md is md\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 6 (1 distinct intents)\n", "\t- Found intents: 'action_test'\n", "\t- entity examples: 0 (0 
distinct entities)\n", "\t- found entities: \n", "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../bot/data/intents/geral.md is md\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", - "\t- intent examples: 85 (7 distinct intents)\n", - "\t- Found intents: 'elogios', 'cumprimentar', 'out_of_scope', 'despedir', 'negar', 'tudo_bem', 'diga_mais'\n", - "\t- entity examples: 0 (0 distinct entities)\n", - "\t- found entities: \n", - "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 288 (32 distinct intents)\n", - "\t- Found intents: 'action_test', 'elogios', 'out_of_scope', 'signo', 'star_wars', 'linguagens', 'triste', 'diga_mais', 'filme', 'relationship', 'onde_voce_mora', 'genero', 'playlist', 'cumprimentar', 'bff', 'piada', 'filhos', 'license', 'comida', 'como_estou', 'de_onde_voce_eh', 'me', 'esporte', 'risada', 'cor', 'despedir', 'hobby', 'tudo_bem', 'religiao', 'time', 'negar', 'historia'\n", + "\t- Found intents: 'me', 'cumprimentar', 'out_of_scope', 'bff', 'religiao', 'license', 'negar', 'elogios', 'risada', 'de_onde_voce_eh', 'piada', 'cor', 'filme', 'triste', 'comida', 'como_estou', 'relationship', 'action_test', 'despedir', 'hobby', 'esporte', 'filhos', 'historia', 'genero', 'linguagens', 'signo', 'diga_mais', 'playlist', 'tudo_bem', 'onde_voce_mora', 'time', 'star_wars'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- found entities: 'signo', 'triste', 'linguagens', 'live', 'filme', 'relationship', 'where', 'genero', 'playlist', 'bff', 'starwars', 'piada', 'filhos', 'license', 'comida', 'me', 'esporte', 'cor', 'hobby', 'religiao', 
'how', 'historia'\n", + "\t- found entities: 'me', 'bff', 'religiao', 'license', 'piada', 'cor', 'filme', 'triste', 'comida', 'where', 'relationship', 'how', 'live', 'esporte', 'historia', 'filhos', 'genero', 'linguagens', 'signo', 'starwars', 'playlist', 'hobby'\n", "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", - "100%|████████████████████████████████████████| 288/288 [00:00<00:00, 561.88it/s]\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent evaluation results:\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent Evaluation: Only considering those 288 examples that have a defined intent out of 288 examples\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 288/288 [00:00<00:00, 429.64it/s]\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent evaluation results:\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent Evaluation: Only considering those 288 examples that have a defined intent out of 288 examples\n", "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples.\n", " 'recall', 'true', average, warn_for)\n", "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no true samples.\n", " 'recall', 'true', average, warn_for)\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - F1-Score: 0.9914054566832343\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Precision: 0.9942129629629629\n", - "2019-05-03 21:20:47 
\u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Accuracy: 0.9895833333333334\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Classification report: \n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - F1-Score: 0.9914054566832343\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Precision: 0.9942129629629629\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Accuracy: 0.9895833333333334\n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Classification report: \n", " precision recall f1-score support\n", "\n", " 0.00 0.00 0.00 0\n", @@ -349,8 +335,10 @@ " macro avg 0.96 0.96 0.96 288\n", " weighted avg 0.99 0.99 0.99 288\n", "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Model prediction errors saved to errors.json.\n", - "2019-05-03 21:20:49 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Confusion matrix, without normalization: \n", + "2019-07-17 16:31:34 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Model prediction errors saved to errors.json.\n", + "2019-07-17 16:31:35 \u001b[1;30mINFO \u001b[0m \u001b[34mmatplotlib.font_manager\u001b[0m - font search path ['/usr/local/lib/python3.6/site-packages/matplotlib/mpl-data/fonts/ttf', '/usr/local/lib/python3.6/site-packages/matplotlib/mpl-data/fonts/afm', '/usr/local/lib/python3.6/site-packages/matplotlib/mpl-data/fonts/pdfcorefonts']\n", + "2019-07-17 16:31:36 \u001b[1;30mINFO \u001b[0m \u001b[34mmatplotlib.font_manager\u001b[0m - generated new fontManager\n", + "2019-07-17 16:31:38 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Confusion matrix, without normalization: \n", "[[ 0 0 0 ... 0 0 0]\n", " [ 0 6 0 ... 0 0 0]\n", " [ 0 0 11 ... 0 0 0]\n", @@ -360,56 +348,62 @@ " [ 0 0 0 ... 
0 0 10]]\n", "Figure(2000x2000)\n", "Figure(1000x1000)\n", - "2019-05-03 21:20:54 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity evaluation results:\n", - "2019-05-03 21:20:54 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Evaluation for entity extractor: CRFEntityExtractor \n", - "2019-05-03 21:20:54 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - F1-Score: 1.0\n", - "2019-05-03 21:20:54 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Precision: 1.0\n", - "2019-05-03 21:20:54 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Accuracy: 1.0\n", - "2019-05-03 21:20:54 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Classification report: \n", - " precision recall f1-score support\n", - "\n", - " bff 1.00 1.00 1.00 17\n", - " comida 1.00 1.00 1.00 17\n", - " cor 1.00 1.00 1.00 13\n", - " esporte 1.00 1.00 1.00 6\n", - " filhos 1.00 1.00 1.00 11\n", - " filme 1.00 1.00 1.00 4\n", - " genero 1.00 1.00 1.00 15\n", - " historia 1.00 1.00 1.00 6\n", - " hobby 1.00 1.00 1.00 11\n", - " how 1.00 1.00 1.00 24\n", - " license 1.00 1.00 1.00 14\n", - " linguagens 1.00 1.00 1.00 14\n", - " live 1.00 1.00 1.00 13\n", - " me 1.00 1.00 1.00 6\n", - " no_entity 1.00 1.00 1.00 613\n", - " piada 1.00 1.00 1.00 7\n", - " playlist 1.00 1.00 1.00 7\n", - "relationship 1.00 1.00 1.00 9\n", - " religiao 1.00 1.00 1.00 16\n", - " signo 1.00 1.00 1.00 3\n", - " starwars 1.00 1.00 1.00 13\n", - " triste 1.00 1.00 1.00 7\n", - " where 1.00 1.00 1.00 3\n", - "\n", - " micro avg 1.00 1.00 1.00 849\n", - " macro avg 1.00 1.00 1.00 849\n", - "weighted avg 1.00 1.00 1.00 849\n", - "\n", - "2019-05-03 21:20:54 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished evaluation\n" + "2019-07-17 16:31:43 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity evaluation results:\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Evaluation for entity extractor: CRFEntityExtractor \n" + ] + }, 
+ { + "name": "stdout", + "output_type": "stream", + "text": [ + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - F1-Score: 1.0\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Precision: 1.0\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Accuracy: 1.0\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Classification report: \r\n", + " precision recall f1-score support\r\n", + "\r\n", + " bff 1.00 1.00 1.00 17\r\n", + " comida 1.00 1.00 1.00 17\r\n", + " cor 1.00 1.00 1.00 13\r\n", + " esporte 1.00 1.00 1.00 6\r\n", + " filhos 1.00 1.00 1.00 11\r\n", + " filme 1.00 1.00 1.00 4\r\n", + " genero 1.00 1.00 1.00 15\r\n", + " historia 1.00 1.00 1.00 6\r\n", + " hobby 1.00 1.00 1.00 11\r\n", + " how 1.00 1.00 1.00 24\r\n", + " license 1.00 1.00 1.00 14\r\n", + " linguagens 1.00 1.00 1.00 14\r\n", + " live 1.00 1.00 1.00 13\r\n", + " me 1.00 1.00 1.00 6\r\n", + " no_entity 1.00 1.00 1.00 613\r\n", + " piada 1.00 1.00 1.00 7\r\n", + " playlist 1.00 1.00 1.00 7\r\n", + "relationship 1.00 1.00 1.00 9\r\n", + " religiao 1.00 1.00 1.00 16\r\n", + " signo 1.00 1.00 1.00 3\r\n", + " starwars 1.00 1.00 1.00 13\r\n", + " triste 1.00 1.00 1.00 7\r\n", + " where 1.00 1.00 1.00 3\r\n", + "\r\n", + " micro avg 1.00 1.00 1.00 849\r\n", + " macro avg 1.00 1.00 1.00 849\r\n", + "weighted avg 1.00 1.00 1.00 849\r\n", + "\r\n", + "2019-07-17 16:31:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished evaluation\r\n" ] } ], "source": [ - "!python -m rasa_nlu.test -d $BOT_INTENTS_PATH -m $BOT_MODELS_NLU_PATH --mode evaluation" + "!python -m rasa_nlu.test -d $COACH_INTENTS_PATH -m $COACH_MODELS_NLU_PATH --mode evaluation" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ - "#### Matriz de Confuzão\n", - "* A matriz de confuzão mostra a correlação entre as intents.\n", + "#### Matriz de Confusão\n", + "* A matriz de confusão mostra 
a correlação entre as intents.\n", "* A diagonal principal tem forte correlação pois mostra a relação de uma intent **com ela mesma**\n", "* O ideal é que não haja **nenhum valor** diferente de **0 fora da diagonal principal**." ] @@ -435,7 +429,7 @@ " " ], "text/plain": [ - "" + "" ] }, "execution_count": 5, @@ -452,7 +446,7 @@ "metadata": {}, "source": [ "#### Erros\n", - "* O arquivo `erros,json` mostra os erros encontrados. Este arquivo lista os mesmos erros mostrados na **matriz de confuzão**, então caso ela fique muito grande, não se preocupe, pois você pode apenas procurar os erros no arquivo gerado.\n", + "* O arquivo `erros,json` mostra os erros encontrados. Este arquivo lista os mesmos erros mostrados na **matriz de confusão**, então caso ela fique muito grande, não se preocupe, pois você pode apenas procurar os erros no arquivo gerado.\n", "* Os erros mostrados são textos repetidos nos exemplos de diferrentes `intents`.\n", "* Caso o arquivo não seja gerado significa que não foram encontrados erros." 
] @@ -470,19 +464,11 @@ "text": [ "[\r\n", " {\r\n", - " \"text\": \"e o c#\",\r\n", - " \"intent\": \"linguagens\",\r\n", - " \"intent_prediction\": {\r\n", - " \"name\": \"\",\r\n", - " \"confidence\": 0.0\r\n", - " }\r\n", - " },\r\n", - " {\r\n", " \"text\": \"como vai\",\r\n", " \"intent\": \"cumprimentar\",\r\n", " \"intent_prediction\": {\r\n", " \"name\": \"tudo_bem\",\r\n", - " \"confidence\": 0.835846483707428\r\n", + " \"confidence\": 0.7145657539367676\r\n", " }\r\n", " },\r\n", " {\r\n", @@ -490,7 +476,15 @@ " \"intent\": \"cumprimentar\",\r\n", " \"intent_prediction\": {\r\n", " \"name\": \"tudo_bem\",\r\n", - " \"confidence\": 0.8136337995529175\r\n", + " \"confidence\": 0.7155274152755737\r\n", + " }\r\n", + " },\r\n", + " {\r\n", + " \"text\": \"e o c#\",\r\n", + " \"intent\": \"linguagens\",\r\n", + " \"intent_prediction\": {\r\n", + " \"name\": \"\",\r\n", + " \"confidence\": 0.0\r\n", " }\r\n", " }\r\n", "]" @@ -531,7 +525,7 @@ " " ], "text/plain": [ - "" + "" ] }, "execution_count": 7, @@ -561,64 +555,62 @@ "name": "stdout", "output_type": "stream", "text": [ - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.test' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.test'; this may result in unpredictable behaviour\n", " warn(RuntimeWarning(msg))\n", - "2019-05-03 21:20:56 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../bot/data/intents/aleatorio.md is md\n", - "2019-05-03 21:20:56 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of 
../../coach/data/intents/geral.md is md\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 85 (7 distinct intents)\n", + "\t- Found intents: 'cumprimentar', 'tudo_bem', 'negar', 'elogios', 'despedir', 'out_of_scope', 'diga_mais'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + "\t- found entities: \n", + "\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/aleatorio.md is md\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 197 (24 distinct intents)\n", - "\t- Found intents: 'linguagens', 'triste', 'cor', 'hobby', 'risada', 'bff', 'genero', 'star_wars', 'religiao', 'filhos', 'como_estou', 'me', 'signo', 'historia', 'relationship', 'filme', 'playlist', 'time', 'license', 'piada', 'comida', 'onde_voce_mora', 'esporte', 'de_onde_voce_eh'\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'comida', 'cor', 'historia', 'triste', 'como_estou', 'filme', 'star_wars', 'relationship', 'esporte', 'signo', 'me', 'linguagens', 'de_onde_voce_eh', 'religiao', 'hobby', 'playlist', 'license', 'onde_voce_mora'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- found entities: 'linguagens', 'how', 'hobby', 'starwars', 'filhos', 'me', 'signo', 'relationship', 'where', 'playlist', 'filme', 'license', 'live', 'triste', 'cor', 'bff', 'genero', 'religiao', 'historia', 'piada', 'comida', 'esporte'\n", + "\t- found entities: 'live', 'filhos', 'genero', 'relationship', 'linguagens', 'me', 'hobby', 'starwars', 'playlist', 'license', 'bff', 'piada', 'comida', 'cor', 'historia', 'triste', 'where', 'filme', 'how', 'esporte', 'signo', 'religiao'\n", "\n", - "2019-05-03 21:20:56 \u001b[1;30mINFO \u001b[0m 
\u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../bot/data/intents/actions.md is md\n", - "2019-05-03 21:20:56 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../coach/data/intents/actions.md is md\n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 6 (1 distinct intents)\n", "\t- Found intents: 'action_test'\n", "\t- entity examples: 0 (0 distinct entities)\n", "\t- found entities: \n", "\n", - "2019-05-03 21:20:56 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of ../../bot/data/intents/geral.md is md\n", - "2019-05-03 21:20:56 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", - "\t- intent examples: 85 (7 distinct intents)\n", - "\t- Found intents: 'despedir', 'diga_mais', 'cumprimentar', 'negar', 'elogios', 'tudo_bem', 'out_of_scope'\n", - "\t- entity examples: 0 (0 distinct entities)\n", - "\t- found entities: \n", - "\n", - "2019-05-03 21:20:57 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 288 (32 distinct intents)\n", - "\t- Found intents: 'linguagens', 'hobby', 'star_wars', 'filhos', 'out_of_scope', 'me', 'signo', 'relationship', 'filme', 'playlist', 'license', 'elogios', 'tudo_bem', 'action_test', 'de_onde_voce_eh', 'despedir', 'triste', 'cor', 'risada', 'negar', 'bff', 'genero', 'religiao', 'como_estou', 'historia', 'time', 'diga_mais', 'piada', 'cumprimentar', 'comida', 'onde_voce_mora', 'esporte'\n", 
+ "\t- Found intents: 'filhos', 'genero', 'time', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'tudo_bem', 'linguagens', 'me', 'hobby', 'playlist', 'license', 'onde_voce_mora', 'bff', 'risada', 'piada', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'elogios', 'filme', 'action_test', 'esporte', 'signo', 'de_onde_voce_eh', 'despedir', 'religiao', 'diga_mais'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- found entities: 'linguagens', 'how', 'hobby', 'starwars', 'filhos', 'me', 'signo', 'relationship', 'where', 'playlist', 'filme', 'license', 'live', 'triste', 'cor', 'bff', 'genero', 'religiao', 'historia', 'piada', 'comida', 'esporte'\n", + "\t- found entities: 'live', 'filhos', 'genero', 'relationship', 'linguagens', 'me', 'hobby', 'starwars', 'playlist', 'license', 'bff', 'piada', 'comida', 'cor', 'historia', 'triste', 'where', 'filme', 'how', 'esporte', 'signo', 'religiao'\n", "\n", - "2019-05-03 21:20:57 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:32:19 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 273 (28 distinct intents)\n", - "\t- Found intents: 'linguagens', 'despedir', 'triste', 'cor', 'hobby', 'risada', 'negar', 'bff', 'genero', 'star_wars', 'religiao', 'filhos', 'out_of_scope', 'como_estou', 'me', 'historia', 'relationship', 'playlist', 'time', 'license', 'diga_mais', 'piada', 'cumprimentar', 'comida', 'tudo_bem', 'onde_voce_mora', 'esporte', 'action_test'\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", "\t- entity examples: 162 (19 distinct 
entities)\n", - "\t- found entities: 'triste', 'linguagens', 'live', 'license', 'me', 'cor', 'hobby', 'how', 'bff', 'comida', 'genero', 'piada', 'religiao', 'filhos', 'starwars', 'historia', 'esporte', 'relationship', 'playlist'\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", "\n", - "2019-05-03 21:20:58 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 131 (28 distinct intents)\n", - "\t- Found intents: 'linguagens', 'despedir', 'triste', 'cor', 'hobby', 'risada', 'negar', 'bff', 'genero', 'star_wars', 'religiao', 'filhos', 'out_of_scope', 'como_estou', 'me', 'historia', 'relationship', 'playlist', 'time', 'license', 'diga_mais', 'piada', 'cumprimentar', 'comida', 'tudo_bem', 'onde_voce_mora', 'esporte', 'action_test'\n", - "\t- entity examples: 76 (19 distinct entities)\n", - "\t- found entities: 'triste', 'linguagens', 'live', 'license', 'me', 'cor', 'hobby', 'how', 'bff', 'comida', 'genero', 'piada', 'religiao', 'filhos', 'starwars', 'historia', 'esporte', 'relationship', 'playlist'\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 79 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 
'playlist', 'license'\n", "\n", - "2019-05-03 21:20:58 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 142 (28 distinct intents)\n", - "\t- Found intents: 'linguagens', 'despedir', 'triste', 'cor', 'hobby', 'risada', 'negar', 'bff', 'genero', 'star_wars', 'religiao', 'filhos', 'out_of_scope', 'como_estou', 'me', 'historia', 'relationship', 'playlist', 'time', 'license', 'diga_mais', 'piada', 'cumprimentar', 'comida', 'tudo_bem', 'onde_voce_mora', 'esporte', 'action_test'\n", - "\t- entity examples: 86 (19 distinct entities)\n", - "\t- found entities: 'triste', 'linguagens', 'live', 'license', 'me', 'cor', 'hobby', 'how', 'bff', 'comida', 'genero', 'piada', 'religiao', 'filhos', 'starwars', 'historia', 'esporte', 'relationship', 'playlist'\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 83 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", "\n", - "2019-05-03 21:20:58 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", - "2019-05-03 21:20:58 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:58 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", - 
"2019-05-03 21:20:59 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:59 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", - "2019-05-03 21:20:59 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:59 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", - "2019-05-03 21:20:59 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:59 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:20 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", "\n", "WARNING: The TensorFlow contrib module 
will not be included in TensorFlow 2.0.\n", "For more information, please see:\n", @@ -626,22 +618,22 @@ " * https://github.com/tensorflow/addons\n", "If you depend on functionality not listed there, please file an issue.\n", "\n", - "2019-05-03 21:20:59 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use keras.layers.dense instead.\u001b[0m\n", - "2019-05-03 21:20:59 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Colocations handled automatically by placer.\u001b[0m\n", - "2019-05-03 21:20:59 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - 
\u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use keras.layers.dropout instead.\u001b[0m\n", - "2019-05-03 21:20:59 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", + "2019-07-17 16:32:21 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Please use `rate` instead of `keep_prob`. Rate should be set to `rate = 1 - keep_prob`.\u001b[0m\n", - "2019-05-03 21:21:00 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:32:22 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use tf.cast instead.\u001b[0m\n", - "2019-05-03 21:21:00 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:32:22 
\u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Deprecated in favor of operator or tf.math.divide.\u001b[0m\n" ] @@ -650,80 +642,90 @@ "name": "stdout", "output_type": "stream", "text": [ - "2019-05-03 21:21:00.706185: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", - "2019-05-03 21:21:00.726392: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2905000000 Hz\n", - "2019-05-03 21:21:00.726674: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x555b9ee46db0 executing computations on platform Host. Devices:\n", - "2019-05-03 21:21:00.726702: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", - "2019-05-03 21:21:00 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", - "Epochs: 100%|██████████| 300/300 [00:05<00:00, 59.85it/s, loss=0.186, acc=1.000]\n", - "2019-05-03 21:21:05 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.186, train accuracy=1.000\n", - "2019-05-03 21:21:05 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:21:05 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", - "100%|████████████████████████████████████████| 131/131 [00:00<00:00, 353.93it/s]\n", - "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples.\n", - " 'recall', 'true', 
average, warn_for)\n", - "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no true samples.\n", - " 'recall', 'true', average, warn_for)\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", - "100%|████████████████████████████████████████| 142/142 [00:00<00:00, 528.87it/s]\n", + "2019-07-17 16:32:22.678227: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:32:22.700933: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:32:22.701522: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x55be5a7c66c0 executing computations on platform Host. Devices:\n", + "2019-07-17 16:32:22.701579: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:32:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", + "Epochs: 100%|██████████| 300/300 [00:05<00:00, 53.69it/s, loss=0.194, acc=0.992]\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.194, train accuracy=0.992\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 131/131 [00:00<00:00, 435.20it/s]\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 142/142 [00:00<00:00, 
527.33it/s]\n", "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples.\n", " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples.\n", " 'precision', 'predicted', average, warn_for)\n", "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no predicted samples.\n", " 'precision', 'predicted', average, warn_for)\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 142 (28 distinct intents)\n", - "\t- Found intents: 'linguagens', 'despedir', 'triste', 'cor', 'hobby', 'risada', 'negar', 'bff', 'genero', 'star_wars', 'religiao', 'filhos', 'out_of_scope', 'como_estou', 'me', 'historia', 'relationship', 'playlist', 'time', 'license', 'diga_mais', 'piada', 'cumprimentar', 'comida', 'tudo_bem', 'onde_voce_mora', 'esporte', 'action_test'\n", - "\t- entity examples: 86 (19 distinct entities)\n", - "\t- found entities: 'triste', 'linguagens', 
'live', 'license', 'me', 'cor', 'hobby', 'how', 'bff', 'comida', 'genero', 'piada', 'religiao', 'filhos', 'starwars', 'historia', 'esporte', 'relationship', 'playlist'\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 83 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", "\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:32:28 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 131 (28 distinct intents)\n", - "\t- Found intents: 'linguagens', 'despedir', 'triste', 'cor', 'hobby', 'risada', 'negar', 'bff', 'genero', 'star_wars', 'religiao', 'filhos', 'out_of_scope', 'como_estou', 'me', 'historia', 'relationship', 'playlist', 'time', 'license', 'diga_mais', 'piada', 'cumprimentar', 'comida', 'tudo_bem', 'onde_voce_mora', 'esporte', 'action_test'\n", - "\t- entity examples: 76 (19 distinct entities)\n", - "\t- found entities: 'triste', 'linguagens', 'live', 'license', 'me', 'cor', 'hobby', 'how', 'bff', 'comida', 'genero', 'piada', 'religiao', 'filhos', 'starwars', 'historia', 'esporte', 'relationship', 'playlist'\n", + "\t- Found intents: 'bff', 'risada', 'filhos', 'genero', 'piada', 'time', 'negar', 'comida', 'cor', 'historia', 'out_of_scope', 'triste', 'como_estou', 'cumprimentar', 'star_wars', 'relationship', 'hobby', 'action_test', 'tudo_bem', 'esporte', 'linguagens', 
'despedir', 'religiao', 'me', 'playlist', 'license', 'onde_voce_mora', 'diga_mais'\n", + "\t- entity examples: 79 (19 distinct entities)\n", + "\t- found entities: 'bff', 'triste', 'live', 'filhos', 'genero', 'how', 'piada', 'relationship', 'esporte', 'comida', 'me', 'cor', 'historia', 'linguagens', 'religiao', 'hobby', 'starwars', 'playlist', 'license'\n", "\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", - "2019-05-03 21:21:07 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", - "Epochs: 100%|██████████| 300/300 [00:06<00:00, 47.98it/s, loss=0.186, acc=1.000]\n", - "2019-05-03 21:21:13 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.186, train accuracy=1.000\n", - "2019-05-03 
21:21:13 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:21:13 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", - "100%|████████████████████████████████████████| 142/142 [00:00<00:00, 520.96it/s]\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", - "100%|████████████████████████████████████████| 131/131 [00:00<00:00, 595.66it/s]\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - CV evaluation (n=2)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent evaluation results\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Accuracy: 0.996 (0.004)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train F1-score: 0.998 (0.002)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Precision: 1.000 (0.000)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Accuracy: 0.523 (0.012)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test F1-score: 0.545 (0.007)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Precision: 0.641 (0.014)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity evaluation results\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity extractor: CRFEntityExtractor\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Accuracy: 1.000 (0.000)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train F1-score: 1.000 (0.000)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Precision: 1.000 (0.000)\n", - "2019-05-03 
21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity extractor: CRFEntityExtractor\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Accuracy: 0.834 (0.015)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test F1-score: 0.788 (0.013)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Precision: 0.800 (0.015)\n", - "2019-05-03 21:21:14 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished evaluation\n" + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:29 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", + "2019-07-17 16:32:30 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", + "Epochs: 100%|██████████| 300/300 [00:06<00:00, 45.43it/s, loss=0.188, acc=1.000]\n", + "2019-07-17 16:32:36 
\u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.188, train accuracy=1.000\n", + "2019-07-17 16:32:36 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:32:36 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 142/142 [00:00<00:00, 433.04it/s]\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: Recall and F-score are ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1145: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no true samples.\n", + " 'recall', 'true', average, warn_for)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Running model for predictions:\n", + "100%|████████████████████████████████████████| 131/131 [00:00<00:00, 569.47it/s]\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision and F-score are ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: Precision is ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "/usr/local/lib/python3.6/site-packages/sklearn/metrics/classification.py:1143: UndefinedMetricWarning: F-score is ill-defined and being set to 0.0 in labels with no predicted samples.\n", + " 'precision', 'predicted', average, warn_for)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m 
- CV evaluation (n=2)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Intent evaluation results\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Accuracy: 0.993 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train F1-score: 0.994 (0.002)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Precision: 0.997 (0.003)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Accuracy: 0.536 (0.029)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test F1-score: 0.561 (0.031)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Precision: 0.681 (0.027)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity evaluation results\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity extractor: CRFEntityExtractor\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Accuracy: 1.000 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train F1-score: 1.000 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - train Precision: 1.000 (0.000)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Entity extractor: CRFEntityExtractor\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Accuracy: 0.826 (0.004)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test F1-score: 0.776 (0.001)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - test Precision: 0.810 (0.033)\n", + "2019-07-17 16:32:37 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished evaluation\n" ] } ], "source": [ - "!python -m 
rasa_nlu.test -d $BOT_INTENTS_PATH -c $BOT_NLU_CONFIG_PATH --mode crossvalidation --folds 2 --report" + "!python -m rasa_nlu.test -d $COACH_INTENTS_PATH -c $COACH_NLU_CONFIG_PATH --mode crossvalidation --folds 2 --report" ] }, { @@ -782,7 +784,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.8" + "version": "3.6.9" } }, "nbformat": 4, diff --git a/notebooks/stories/chat_graph.html b/notebooks/stories/chat_graph.html index 6b9897e9..ebffb162 100644 --- a/notebooks/stories/chat_graph.html +++ b/notebooks/stories/chat_graph.html @@ -137,72 +137,72 @@ graph = `digraph { 0 [class="start active", fillcolor=green, fontsize=12, label=START, style=filled]; "-1" [class=end, fillcolor=red, fontsize=12, label=END, style=filled]; -1 [class="", fontsize=12, label=utter_como_estou]; -2 [class="", fontsize=12, label=utter_playlist]; -3 [class="", fontsize=12, label=utter_comida]; -4 [class="", fontsize=12, label=utter_cor]; -5 [class="", fontsize=12, label=utter_de_onde_voce_eh]; -6 [class="", fontsize=12, label=utter_relationship]; -7 [class="", fontsize=12, label=utter_me]; -8 [class="", fontsize=12, label=utter_filhos]; -9 [class="", fontsize=12, label=utter_filme]; -10 [class="", fontsize=12, label=utter_signo]; -11 [class="", fontsize=12, label=utter_triste]; -12 [class="", fontsize=12, label=utter_religiao]; -13 [class="", fontsize=12, label=utter_hobby]; -14 [class="", fontsize=12, label=utter_bff]; -15 [class="", fontsize=12, label=utter_historia]; -16 [class="", fontsize=12, label=utter_risada]; -17 [class="", fontsize=12, label=utter_cumprimentar]; -18 [class="", fontsize=12, label=action_test]; -20 [class="", fontsize=12, label=utter_despedir]; -21 [class="", fontsize=12, label=utter_tudo_bem]; -24 [class="", fontsize=12, label=utter_diga_mais]; -25 [class="", fontsize=12, label=utter_esporte]; -26 [class="", fontsize=12, label=utter_default]; -28 [class="", fontsize=12, label=utter_elogios]; -32 [class="", 
fontsize=12, label=utter_time]; -33 [class="", fontsize=12, label=utter_linguagens]; -34 [class="", fontsize=12, label=utter_genero]; -35 [class="", fontsize=12, label=utter_star_wars]; -36 [class="", fontsize=12, label=utter_piada]; -37 [class="", fontsize=12, label=utter_license]; -38 [class="", fontsize=12, label=utter_onde_voce_mora]; -39 [class=intent, fillcolor=lightblue, label=como_estou, shape=rect, style=filled]; -40 [class=intent, fillcolor=lightblue, label=playlist, shape=rect, style=filled]; -41 [class=intent, fillcolor=lightblue, label=comida, shape=rect, style=filled]; -42 [class=intent, fillcolor=lightblue, label=cor, shape=rect, style=filled]; -43 [class=intent, fillcolor=lightblue, label=de_onde_voce_eh, shape=rect, style=filled]; -44 [class=intent, fillcolor=lightblue, label=me, shape=rect, style=filled]; -45 [class=intent, fillcolor=lightblue, label=filhos, shape=rect, style=filled]; -46 [class=intent, fillcolor=lightblue, label=filme, shape=rect, style=filled]; -47 [class=intent, fillcolor=lightblue, label=signo, shape=rect, style=filled]; -48 [class=intent, fillcolor=lightblue, label=triste, shape=rect, style=filled]; -49 [class=intent, fillcolor=lightblue, label=religiao, shape=rect, style=filled]; -50 [class=intent, fillcolor=lightblue, label=hobby, shape=rect, style=filled]; -51 [class=intent, fillcolor=lightblue, label=bff, shape=rect, style=filled]; -52 [class=intent, fillcolor=lightblue, label=historia, shape=rect, style=filled]; -53 [class=intent, fillcolor=lightblue, label=risada, shape=rect, style=filled]; -54 [class=intent, fillcolor=lightblue, label=cumprimentar, shape=rect, style=filled]; -55 [class=intent, fillcolor=lightblue, label=despedir, shape=rect, style=filled]; -56 [class=intent, fillcolor=lightblue, label=negar, shape=rect, style=filled]; -57 [class=intent, fillcolor=lightblue, label=tudo_bem, shape=rect, style=filled]; -58 [class=intent, fillcolor=lightblue, label=diga_mais, shape=rect, style=filled]; -59 [class=intent, 
fillcolor=lightblue, label=esporte, shape=rect, style=filled]; -60 [class=intent, fillcolor=lightblue, label=out_of_scope, shape=rect, style=filled]; -61 [class=intent, fillcolor=lightblue, label=elogios, shape=rect, style=filled]; -62 [class=intent, fillcolor=lightblue, label=time, shape=rect, style=filled]; -63 [class=intent, fillcolor=lightblue, label=linguagens, shape=rect, style=filled]; -64 [class=intent, fillcolor=lightblue, label=genero, shape=rect, style=filled]; -65 [class=intent, fillcolor=lightblue, label=star_wars, shape=rect, style=filled]; -66 [class=intent, fillcolor=lightblue, label=piada, shape=rect, style=filled]; -67 [class=intent, fillcolor=lightblue, label=license, shape=rect, style=filled]; -68 [class=intent, fillcolor=lightblue, label=onde_voce_mora, shape=rect, style=filled]; +1 [class="", fontsize=12, label=utter_religiao]; +2 [class="", fontsize=12, label=utter_esporte]; +3 [class="", fontsize=12, label=utter_time]; +4 [class="", fontsize=12, label=utter_linguagens]; +5 [class="", fontsize=12, label=utter_genero]; +6 [class="", fontsize=12, label=utter_star_wars]; +7 [class="", fontsize=12, label=utter_piada]; +8 [class="", fontsize=12, label=utter_license]; +9 [class="", fontsize=12, label=utter_onde_voce_mora]; +10 [class="", fontsize=12, label=utter_como_estou]; +11 [class="", fontsize=12, label=utter_despedir]; +12 [class="", fontsize=12, label=utter_playlist]; +13 [class="", fontsize=12, label=utter_comida]; +14 [class="", fontsize=12, label=utter_cor]; +15 [class="", fontsize=12, label=utter_de_onde_voce_eh]; +16 [class="", fontsize=12, label=utter_relationship]; +17 [class="", fontsize=12, label=utter_me]; +18 [class="", fontsize=12, label=utter_filhos]; +19 [class="", fontsize=12, label=utter_filme]; +20 [class="", fontsize=12, label=utter_signo]; +21 [class="", fontsize=12, label=utter_triste]; +22 [class="", fontsize=12, label=utter_hobby]; +23 [class="", fontsize=12, label=utter_tudo_bem]; +24 [class="", fontsize=12, 
label=utter_bff]; +25 [class="", fontsize=12, label=utter_historia]; +26 [class="", fontsize=12, label=utter_risada]; +27 [class="", fontsize=12, label=utter_cumprimentar]; +28 [class="", fontsize=12, label=action_test]; +32 [class="", fontsize=12, label=utter_diga_mais]; +33 [class="", fontsize=12, label=utter_default]; +35 [class="", fontsize=12, label=utter_elogios]; +39 [class=intent, fillcolor=lightblue, label=religiao, shape=rect, style=filled]; +40 [class=intent, fillcolor=lightblue, label=esporte, shape=rect, style=filled]; +41 [class=intent, fillcolor=lightblue, label=time, shape=rect, style=filled]; +42 [class=intent, fillcolor=lightblue, label=linguagens, shape=rect, style=filled]; +43 [class=intent, fillcolor=lightblue, label=genero, shape=rect, style=filled]; +44 [class=intent, fillcolor=lightblue, label=star_wars, shape=rect, style=filled]; +45 [class=intent, fillcolor=lightblue, label=piada, shape=rect, style=filled]; +46 [class=intent, fillcolor=lightblue, label=license, shape=rect, style=filled]; +47 [class=intent, fillcolor=lightblue, label=onde_voce_mora, shape=rect, style=filled]; +48 [class=intent, fillcolor=lightblue, label=como_estou, shape=rect, style=filled]; +49 [class=intent, fillcolor=lightblue, label=despedir, shape=rect, style=filled]; +50 [class=intent, fillcolor=lightblue, label=negar, shape=rect, style=filled]; +51 [class=intent, fillcolor=lightblue, label=playlist, shape=rect, style=filled]; +52 [class=intent, fillcolor=lightblue, label=comida, shape=rect, style=filled]; +53 [class=intent, fillcolor=lightblue, label=cor, shape=rect, style=filled]; +54 [class=intent, fillcolor=lightblue, label=de_onde_voce_eh, shape=rect, style=filled]; +55 [class=intent, fillcolor=lightblue, label=me, shape=rect, style=filled]; +56 [class=intent, fillcolor=lightblue, label=filhos, shape=rect, style=filled]; +57 [class=intent, fillcolor=lightblue, label=filme, shape=rect, style=filled]; +58 [class=intent, fillcolor=lightblue, label=signo, 
shape=rect, style=filled]; +59 [class=intent, fillcolor=lightblue, label=triste, shape=rect, style=filled]; +60 [class=intent, fillcolor=lightblue, label=hobby, shape=rect, style=filled]; +61 [class=intent, fillcolor=lightblue, label=tudo_bem, shape=rect, style=filled]; +62 [class=intent, fillcolor=lightblue, label=bff, shape=rect, style=filled]; +63 [class=intent, fillcolor=lightblue, label=historia, shape=rect, style=filled]; +64 [class=intent, fillcolor=lightblue, label=risada, shape=rect, style=filled]; +65 [class=intent, fillcolor=lightblue, label=cumprimentar, shape=rect, style=filled]; +66 [class=intent, fillcolor=lightblue, label=diga_mais, shape=rect, style=filled]; +67 [class=intent, fillcolor=lightblue, label=out_of_scope, shape=rect, style=filled]; +68 [class=intent, fillcolor=lightblue, label=elogios, shape=rect, style=filled]; 69 [class=intent, fillcolor=lightblue, label=action_test, shape=rect, style=filled]; 70 [class=intent, fillcolor=lightblue, label=relationship, shape=rect, style=filled]; 71 [class=intent, fillcolor=lightblue, label=action_test, shape=rect, style=filled]; -72 [class=intent, fillcolor=lightblue, label=despedir, shape=rect, style=filled]; -73 [class=intent, fillcolor=lightblue, label=tudo_bem, shape=rect, style=filled]; +72 [class=intent, fillcolor=lightblue, label=tudo_bem, shape=rect, style=filled]; +73 [class=intent, fillcolor=lightblue, label=despedir, shape=rect, style=filled]; 0 -> 39 [class="", key=0]; 0 -> 40 [class="", key=0]; 0 -> 41 [class="", key=0]; @@ -238,7 +238,7 @@ 2 -> "-1" [class="", key=NONE, label=""]; 3 -> "-1" [class="", key=NONE, label=""]; 4 -> "-1" [class="", key=NONE, label=""]; -5 -> 70 [class="", key=0]; +5 -> "-1" [class="", key=NONE, label=""]; 6 -> "-1" [class="", key=NONE, label=""]; 7 -> "-1" [class="", key=NONE, label=""]; 8 -> "-1" [class="", key=NONE, label=""]; @@ -248,61 +248,61 @@ 12 -> "-1" [class="", key=NONE, label=""]; 13 -> "-1" [class="", key=NONE, label=""]; 14 -> "-1" [class="", 
key=NONE, label=""]; -15 -> "-1" [class="", key=NONE, label=""]; +15 -> 70 [class="", key=0]; 16 -> "-1" [class="", key=NONE, label=""]; 17 -> "-1" [class="", key=NONE, label=""]; -17 -> 71 [class="", key=0]; -17 -> 72 [class="", key=0]; -17 -> 73 [class="", key=0]; 18 -> "-1" [class="", key=NONE, label=""]; +19 -> "-1" [class="", key=NONE, label=""]; 20 -> "-1" [class="", key=NONE, label=""]; 21 -> "-1" [class="", key=NONE, label=""]; +22 -> "-1" [class="", key=NONE, label=""]; +23 -> "-1" [class="", key=NONE, label=""]; 24 -> "-1" [class="", key=NONE, label=""]; 25 -> "-1" [class="", key=NONE, label=""]; 26 -> "-1" [class="", key=NONE, label=""]; +27 -> "-1" [class="", key=NONE, label=""]; +27 -> 71 [class="", key=0]; +27 -> 72 [class="", key=0]; +27 -> 73 [class="", key=0]; 28 -> "-1" [class="", key=NONE, label=""]; 32 -> "-1" [class="", key=NONE, label=""]; 33 -> "-1" [class="", key=NONE, label=""]; -34 -> "-1" [class="", key=NONE, label=""]; 35 -> "-1" [class="", key=NONE, label=""]; -36 -> "-1" [class="", key=NONE, label=""]; -37 -> "-1" [class="", key=NONE, label=""]; -38 -> "-1" [class="", key=NONE, label=""]; 39 -> 1 [class="", key=0]; 40 -> 2 [class="", key=0]; 41 -> 3 [class="", key=0]; 42 -> 4 [class="", key=0]; 43 -> 5 [class="", key=0]; -44 -> 7 [class="", key=0]; -45 -> 8 [class="", key=0]; -46 -> 9 [class="", key=0]; -47 -> 10 [class="", key=0]; -48 -> 11 [class="", key=0]; -49 -> 12 [class="", key=0]; -50 -> 13 [class="", key=0]; -51 -> 14 [class="", key=0]; -52 -> 15 [class="", key=0]; -53 -> 16 [class="", key=0]; -54 -> 17 [class="", key=0]; -55 -> 20 [class="", key=0]; -56 -> 20 [class="", key=0]; -57 -> 21 [class="", key=0]; -58 -> 24 [class="", key=0]; -59 -> 25 [class="", key=0]; -60 -> 26 [class="", key=0]; -61 -> 28 [class="", key=0]; -62 -> 32 [class="", key=0]; -63 -> 33 [class="", key=0]; -64 -> 34 [class="", key=0]; -65 -> 35 [class="", key=0]; -66 -> 36 [class="", key=0]; -67 -> 37 [class="", key=0]; -68 -> 38 [class="", key=0]; -69 -> 
18 [class="", key=0]; -70 -> 6 [class="", key=0]; -71 -> 18 [class="", key=0]; -72 -> 20 [class="", key=0]; -73 -> 21 [class="", key=0]; +44 -> 6 [class="", key=0]; +45 -> 7 [class="", key=0]; +46 -> 8 [class="", key=0]; +47 -> 9 [class="", key=0]; +48 -> 10 [class="", key=0]; +49 -> 11 [class="", key=0]; +50 -> 11 [class="", key=0]; +51 -> 12 [class="", key=0]; +52 -> 13 [class="", key=0]; +53 -> 14 [class="", key=0]; +54 -> 15 [class="", key=0]; +55 -> 17 [class="", key=0]; +56 -> 18 [class="", key=0]; +57 -> 19 [class="", key=0]; +58 -> 20 [class="", key=0]; +59 -> 21 [class="", key=0]; +60 -> 22 [class="", key=0]; +61 -> 23 [class="", key=0]; +62 -> 24 [class="", key=0]; +63 -> 25 [class="", key=0]; +64 -> 26 [class="", key=0]; +65 -> 27 [class="", key=0]; +66 -> 32 [class="", key=0]; +67 -> 33 [class="", key=0]; +68 -> 35 [class="", key=0]; +69 -> 28 [class="", key=0]; +70 -> 16 [class="", key=0]; +71 -> 28 [class="", key=0]; +72 -> 23 [class="", key=0]; +73 -> 11 [class="", key=0]; } `; drawGraph(graph); diff --git a/notebooks/stories/stories-analysis.ipynb b/notebooks/stories/stories-analysis.ipynb index 7a6b2388..c2ad4edf 100644 --- a/notebooks/stories/stories-analysis.ipynb +++ b/notebooks/stories/stories-analysis.ipynb @@ -24,14 +24,6 @@ "execution_count": 1, "metadata": {}, "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n" - ] - }, { "name": "stdout", "output_type": "stream", @@ -83,11 +75,9 @@ "name": "stdout", "output_type": "stream", "text": [ - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_core.visualize' found 
in sys.modules after import of package 'rasa_core', but prior to execution of 'rasa_core.visualize'; this may result in unpredictable behaviour\n", " warn(RuntimeWarning(msg))\n", - "2019-05-03 21:20:43 \u001b[1;30mINFO \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - Scheduler started\n", + "2019-07-17 16:33:49 \u001b[1;30mINFO \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - Scheduler started\n", "\n", "WARNING: The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", "For more information, please see:\n", @@ -95,14 +85,14 @@ " * https://github.com/tensorflow/addons\n", "If you depend on functionality not listed there, please file an issue.\n", "\n", - "2019-05-03 21:20:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Starting to visualize stories...\n", - "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 5308.85it/s, # trackers=1]\n", - "2019-05-03 21:20:44 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished graph creation. Saved into file:///work/notebooks/stories/chat_graph.html\n" + "2019-07-17 16:33:50 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Starting to visualize stories...\n", + "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 3467.21it/s, # trackers=1]\n", + "2019-07-17 16:33:51 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished graph creation. 
Saved into file:///work/notebooks/stories/chat_graph.html\n" ] } ], "source": [ - "!python -m rasa_core.visualize -d $BOT_DOMAIN_PATH -s $BOT_STORIES_PATH -o chat_graph.html" + "!python -m rasa_core.visualize -d $COACH_DOMAIN_PATH -s $COACH_STORIES_PATH -o chat_graph.html" ] }, { @@ -135,7 +125,7 @@ " " ], "text/plain": [ - "" + "" ] }, "execution_count": 3, @@ -172,49 +162,47 @@ "name": "stdout", "output_type": "stream", "text": [ - "make: Entering directory '/work/bot'\n", + "make: Entering directory '/work/coach'\n", "python3 -m rasa_nlu.train -c nlu_config.yml --fixed_model_name current \\\n", - " --data data/intents/ -o models --project nlu --verbose\n", - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", + "--data data/intents/ -o /src_models --project nlu --verbose\n", "/usr/local/lib/python3.6/runpy.py:125: RuntimeWarning: 'rasa_nlu.train' found in sys.modules after import of package 'rasa_nlu', but prior to execution of 'rasa_nlu.train'; this may result in unpredictable behaviour\n", " warn(RuntimeWarning(msg))\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/aleatorio.md is md\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/geral.md is md\n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "\t- intent examples: 85 (7 distinct intents)\n", + "\t- Found intents: 'diga_mais', 'elogios', 'cumprimentar', 'out_of_scope', 'despedir', 'tudo_bem', 'negar'\n", + "\t- entity examples: 0 (0 distinct entities)\n", + 
"\t- found entities: \n", + "\n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/aleatorio.md is md\n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 197 (24 distinct intents)\n", - "\t- Found intents: 'religiao', 'linguagens', 'license', 'como_estou', 'filme', 'hobby', 'de_onde_voce_eh', 'signo', 'filhos', 'relationship', 'star_wars', 'playlist', 'onde_voce_mora', 'triste', 'historia', 'piada', 'bff', 'esporte', 'me', 'cor', 'risada', 'time', 'genero', 'comida'\n", + "\t- Found intents: 'genero', 'filme', 'filhos', 'onde_voce_mora', 'piada', 'star_wars', 'historia', 'esporte', 'como_estou', 'risada', 'comida', 'bff', 'time', 'me', 'license', 'relationship', 'signo', 'cor', 'religiao', 'de_onde_voce_eh', 'linguagens', 'hobby', 'playlist', 'triste'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- found entities: 'license', 'triste', 'starwars', 'genero', 'linguagens', 'comida', 'religiao', 'live', 'filme', 'hobby', 'signo', 'relationship', 'playlist', 'piada', 'bff', 'how', 'esporte', 'where', 'me', 'cor', 'filhos', 'historia'\n", + "\t- found entities: 'filme', 'genero', 'filhos', 'live', 'me', 'cor', 'hobby', 'where', 'triste', 'starwars', 'piada', 'how', 'esporte', 'comida', 'bff', 'license', 'relationship', 'signo', 'religiao', 'linguagens', 'playlist', 'historia'\n", "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/actions.md is md\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/actions.md is md\n", + "2019-07-17 16:34:21 
\u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 6 (1 distinct intents)\n", "\t- Found intents: 'action_test'\n", "\t- entity examples: 0 (0 distinct entities)\n", "\t- found entities: \n", "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.loading\u001b[0m - Training data format of data/intents/geral.md is md\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", - "\t- intent examples: 85 (7 distinct intents)\n", - "\t- Found intents: 'despedir', 'diga_mais', 'out_of_scope', 'elogios', 'cumprimentar', 'negar', 'tudo_bem'\n", - "\t- entity examples: 0 (0 distinct entities)\n", - "\t- found entities: \n", - "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.training_data.training_data\u001b[0m - Training data stats: \n", "\t- intent examples: 288 (32 distinct intents)\n", - "\t- Found intents: 'license', 'como_estou', 'star_wars', 'negar', 'elogios', 'onde_voce_mora', 'triste', 'despedir', 'diga_mais', 'cumprimentar', 'genero', 'comida', 'linguagens', 'religiao', 'filme', 'hobby', 'de_onde_voce_eh', 'signo', 'relationship', 'out_of_scope', 'playlist', 'tudo_bem', 'piada', 'bff', 'risada', 'esporte', 'me', 'action_test', 'cor', 'filhos', 'time', 'historia'\n", + "\t- Found intents: 'genero', 'filme', 'filhos', 'elogios', 'out_of_scope', 'tudo_bem', 'me', 'despedir', 'cor', 'de_onde_voce_eh', 'hobby', 'triste', 'onde_voce_mora', 'piada', 'star_wars', 'esporte', 'como_estou', 'risada', 'comida', 'negar', 'bff', 'time', 'action_test', 'diga_mais', 'license', 'relationship', 'cumprimentar', 'signo', 'religiao', 'linguagens', 'playlist', 'historia'\n", "\t- entity examples: 172 (22 distinct entities)\n", - "\t- 
found entities: 'license', 'triste', 'starwars', 'genero', 'linguagens', 'comida', 'religiao', 'live', 'filme', 'hobby', 'signo', 'relationship', 'playlist', 'piada', 'bff', 'how', 'esporte', 'where', 'me', 'cor', 'filhos', 'historia'\n", + "\t- found entities: 'filme', 'genero', 'filhos', 'live', 'me', 'cor', 'hobby', 'where', 'triste', 'starwars', 'piada', 'how', 'esporte', 'comida', 'bff', 'license', 'relationship', 'signo', 'religiao', 'linguagens', 'playlist', 'historia'\n", "\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:47 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", - "2019-05-03 21:20:48 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:20:48 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component WhitespaceTokenizer\n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:34:21 \u001b[1;30mINFO \u001b[0m 
\u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CRFEntityExtractor\n", + "2019-07-17 16:34:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:34:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EntitySynonymMapper\n", + "2019-07-17 16:34:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:34:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component CountVectorsFeaturizer\n", + "2019-07-17 16:34:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:34:22 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Starting to train component EmbeddingIntentClassifier\n", "\n", "WARNING: The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", "For more information, please see:\n", @@ -222,50 +210,48 @@ " * https://github.com/tensorflow/addons\n", "If you depend on functionality not listed there, please file an issue.\n", "\n", - "2019-05-03 21:20:48 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:23 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:285: dense (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use keras.layers.dense instead.\u001b[0m\n", - "2019-05-03 21:20:48 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom 
/usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:23 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/framework/op_def_library.py:263: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Colocations handled automatically by placer.\u001b[0m\n", - "2019-05-03 21:20:48 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:23 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/rasa_nlu/classifiers/embedding_intent_classifier.py:286: dropout (from tensorflow.python.layers.core) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use keras.layers.dropout instead.\u001b[0m\n", - "2019-05-03 21:20:48 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:23 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/layers/core.py:143: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Please use `rate` instead of `keep_prob`. 
Rate should be set to `rate = 1 - keep_prob`.\u001b[0m\n", - "2019-05-03 21:20:48 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:23 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use tf.cast instead.\u001b[0m\n", - "2019-05-03 21:20:48 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:23 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Deprecated in favor of operator or tf.math.divide.\u001b[0m\n", - "2019-05-03 21:20:49.119991: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", - "2019-05-03 21:20:49.139740: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2905000000 Hz\n", - "2019-05-03 21:20:49.140045: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x555c5d1fc6c0 executing computations on platform Host. 
Devices:\n", - "2019-05-03 21:20:49.140072: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", - "2019-05-03 21:20:49 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", - "Epochs: 100%|██████████| 300/300 [00:11<00:00, 26.20it/s, loss=0.105, acc=0.993]\n", - "2019-05-03 21:21:00 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.105, train accuracy=0.993\n", - "2019-05-03 21:21:00 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", - "2019-05-03 21:21:00 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Successfully saved model into '/work/bot/models/nlu/current'\n", - "2019-05-03 21:21:00 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished training\n", + "2019-07-17 16:34:24.429290: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:34:24.452899: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:34:24.453405: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x56418a533710 executing computations on platform Host. 
Devices:\n", + "2019-07-17 16:34:24.453460: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:34:24 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Accuracy is updated every 10 epochs\n", + "Epochs: 100%|██████████| 300/300 [00:13<00:00, 22.67it/s, loss=0.100, acc=0.993]\n", + "2019-07-17 16:34:38 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.classifiers.embedding_intent_classifier\u001b[0m - Finished training embedding classifier, loss=0.100, train accuracy=0.993\n", + "2019-07-17 16:34:38 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Finished training component.\n", + "2019-07-17 16:34:38 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_nlu.model\u001b[0m - Successfully saved model into '/src_models/nlu/current'\n", + "2019-07-17 16:34:38 \u001b[1;30mINFO \u001b[0m \u001b[34m__main__\u001b[0m - Finished training\n", "python3 train.py\n", - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", - "/work/bot/validator.py:98: YAMLLoadWarning: calling yaml.load() without Loader=... is deprecated, as the default Loader is unsafe. Please read https://msg.pyyaml.org/load for full details.\n", - " validate(yaml.load(domain_file), yaml.load(schema))\n" + "/work/coach/validator.py:98: YAMLLoadWarning: calling yaml.load() without Loader=... is deprecated, as the default Loader is unsafe. 
Please read https://msg.pyyaml.org/load for full details.\n", + " validate(yaml.load(domain_file), yaml.load(schema))\n", + "2019-07-17 16:34:39 \u001b[1;30mINFO \u001b[0m \u001b[34mvalidator\u001b[0m - Domain verified\n", + "2019-07-17 16:34:39 \u001b[1;30mERROR \u001b[0m \u001b[34mvalidator\u001b[0m - \u001b[31mThe utter action_test is used in the stories story file data/stories/actions.md (line: 5) but it's not a valid utter.\u001b[0m\n", + "2019-07-17 16:34:41 \u001b[1;30mINFO \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - Scheduler started\n", + "2019-07-17 16:34:41 \u001b[1;30mDEBUG \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - Looking for jobs to run\n", + "2019-07-17 16:34:41 \u001b[1;30mDEBUG \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - No jobs; waiting until a job is added\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "2019-05-03 21:21:02 \u001b[1;30mINFO \u001b[0m \u001b[34mvalidator\u001b[0m - Domain verified\n", - "2019-05-03 21:21:02 \u001b[1;30mERROR \u001b[0m \u001b[34mvalidator\u001b[0m - \u001b[31mThe utter action_test is used in the stories story file data/stories/actions.md (line: 5) but it's not a valid utter.\u001b[0m\n", - "2019-05-03 21:21:04 \u001b[1;30mINFO \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - Scheduler started\n", - "2019-05-03 21:21:04 \u001b[1;30mDEBUG \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - Looking for jobs to run\n", - "2019-05-03 21:21:04 \u001b[1;30mDEBUG \u001b[0m \u001b[34mapscheduler.scheduler\u001b[0m - No jobs; waiting until a job is added\n", "\n", "WARNING: The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", "For more information, please see:\n", @@ -273,36 +259,36 @@ " * https://github.com/tensorflow/addons\n", "If you depend on functionality not listed there, please file an issue.\n", "\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Number of augmentation rounds is 3\n", - 
"2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting data generation round 0 ... (with 1 trackers)\n", - "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 5591.53it/s, # trackers=1]\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (34 training samples found).\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Data generation rounds finished.\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Found 0 unused checkpoints\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting augmentation round 0 ... (with 20 trackers)\n", - "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 426.94it/s, # trackers=20]\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (711 training samples found).\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting augmentation round 1 ... (with 20 trackers)\n", - "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 300.58it/s, # trackers=20]\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (1391 training samples found).\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting augmentation round 2 ... 
(with 20 trackers)\n", - "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 174.15it/s, # trackers=20]\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (2034 training samples found).\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Found 2034 training trackers.\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Subsampled to 200 augmented training trackers.\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - There are 34 original trackers.\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.agent\u001b[0m - Agent trainer got kwargs: {'validation_split': 0.2}\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - Creating states and action examples from collected trackers (by FullDialogueTrackerFeaturizer(LabelTokenizerSingleStateFeaturizer))...\n", - "Processed trackers: 100%|██████████████████| 234/234 [00:00<00:00, 19008.16it/s]\n", - "2019-05-03 21:21:05 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - The longest dialogue has 13 actions.\n", - "2019-05-03 21:21:05.665574: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", - "2019-05-03 21:21:05.686532: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2905000000 Hz\n", - "2019-05-03 21:21:05.688378: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x55cad90cbdc0 executing computations on platform Host. 
Devices:\n", - "2019-05-03 21:21:05.688446: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", - "2019-05-03 21:21:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/resource_variable_ops.py:435: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Number of augmentation rounds is 3\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting data generation round 0 ... (with 1 trackers)\n", + "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 4790.91it/s, # trackers=1]\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (34 training samples found).\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Data generation rounds finished.\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Found 0 unused checkpoints\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting augmentation round 0 ... (with 34 trackers)\n", + "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 204.51it/s, # trackers=34]\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (1187 training samples found).\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting augmentation round 1 ... 
(with 50 trackers)\n", + "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 111.16it/s, # trackers=50]\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (2819 training samples found).\n", + "2019-07-17 16:34:42 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Starting augmentation round 2 ... (with 50 trackers)\n", + "Processed Story Blocks: 100%|████| 34/34 [00:00<00:00, 94.44it/s, # trackers=50]\n", + "2019-07-17 16:34:43 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Finished phase (4439 training samples found).\n", + "2019-07-17 16:34:43 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Found 4439 training trackers.\n", + "2019-07-17 16:34:43 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - Subsampled to 500 augmented training trackers.\n", + "2019-07-17 16:34:43 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.training.generator\u001b[0m - There are 34 original trackers.\n", + "2019-07-17 16:34:43 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.agent\u001b[0m - Agent trainer got kwargs: {'validation_split': 0.2}\n", + "2019-07-17 16:34:43 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - Creating states and action examples from collected trackers (by FullDialogueTrackerFeaturizer(LabelTokenizerSingleStateFeaturizer))...\n", + "Processed trackers: 100%|██████████████████| 534/534 [00:00<00:00, 29542.81it/s]\n", + "2019-07-17 16:34:43 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - The longest dialogue has 11 actions.\n", + "2019-07-17 16:34:43.394363: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:34:43.420891: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 
16:34:43.421344: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x55f4cd084a60 executing computations on platform Host. Devices:\n", + "2019-07-17 16:34:43.421423: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:34:43 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/resource_variable_ops.py:435: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Colocations handled automatically by placer.\u001b[0m\n", - "2019-05-03 21:21:05 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/backend.py:4010: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:43 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/keras/backend.py:4010: calling dropout (from tensorflow.python.ops.nn_ops) with keep_prob is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Please use `rate` instead of `keep_prob`. 
Rate should be set to `rate = 1 - keep_prob`.\u001b[0m\n", "_________________________________________________________________\n", @@ -320,51 +306,74 @@ "Trainable params: 18,183\n", "Non-trainable params: 0\n", "_________________________________________________________________\n", - "2019-05-03 21:21:06 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.policies.keras_policy\u001b[0m - None\n", - "2019-05-03 21:21:06 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_core.policies.keras_policy\u001b[0m - Fitting model with 234 total samples and a validation split of 0.1\n", - "2019-05-03 21:21:06 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.policies.policy\u001b[0m - Parameters ignored by `model.fit(...)`: {}\n", - "2019-05-03 21:21:06 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:44 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.policies.keras_policy\u001b[0m - None\n", + "2019-07-17 16:34:44 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_core.policies.keras_policy\u001b[0m - Fitting model with 534 total samples and a validation split of 0.1\n", + "2019-07-17 16:34:44 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.policies.policy\u001b[0m - Parameters ignored by `model.fit(...)`: {}\n", + "2019-07-17 16:34:44 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_ops.py:3066: to_int32 (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Use tf.cast instead.\u001b[0m\n", - "2019-05-03 21:21:06 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from 
tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", + "2019-07-17 16:34:44 \u001b[1;30mWARNING \u001b[0m \u001b[34mtensorflow\u001b[0m - \u001b[33mFrom /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Deprecated in favor of operator or tf.math.divide.\u001b[0m\n", - "Epoch 1/8\n", - "234/234 [==============================] - 2s 7ms/sample - loss: 3.4823 - acc: 0.4455\n", - "Epoch 2/8\n", - "234/234 [==============================] - 0s 2ms/sample - loss: 2.9316 - acc: 0.5708\n", - "Epoch 3/8\n", - "234/234 [==============================] - 0s 2ms/sample - loss: 2.6178 - acc: 0.5708\n", - "Epoch 4/8\n", - "234/234 [==============================] - 1s 2ms/sample - loss: 2.4668 - acc: 0.5708\n", - "Epoch 5/8\n", - "234/234 [==============================] - 1s 2ms/sample - loss: 2.3236 - acc: 0.5708\n", - "Epoch 6/8\n", - "234/234 [==============================] - 1s 2ms/sample - loss: 2.1960 - acc: 0.5708\n", - "Epoch 7/8\n", - "234/234 [==============================] - 1s 2ms/sample - loss: 2.0711 - acc: 0.5708\n", - "Epoch 8/8\n", - "234/234 [==============================] - 1s 2ms/sample - loss: 1.9513 - acc: 0.5708\n", - "2019-05-03 21:21:13 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_core.policies.keras_policy\u001b[0m - Done fitting keras policy model\n", - "2019-05-03 21:21:13 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - Creating states and action examples from collected trackers (by MaxHistoryTrackerFeaturizer(SingleStateFeaturizer))...\n", - "Processed trackers: 100%|███████| 34/34 [00:00<00:00, 4771.84it/s, # actions=68]\n", - "2019-05-03 21:21:13 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - Created 68 action examples.\n", - "Processed actions: 68it [00:00, 6188.17it/s, # examples=68]\n", - "2019-05-03 
21:21:13 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.policies.memoization\u001b[0m - Memorized 68 unique examples.\n", - "2019-05-03 21:21:13 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_core.agent\u001b[0m - Model directory models/dialogue exists and contains old model files. All files will be overwritten.\n" + "Epoch 1/20\n", + "534/534 [==============================] - 2s 3ms/sample - loss: 3.1508 - acc: 0.5214\n", + "Epoch 2/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 2.5611 - acc: 0.5706\n", + "Epoch 3/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 2.2887 - acc: 0.5706\n", + "Epoch 4/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 2.0275 - acc: 0.5706\n", + "Epoch 5/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 1.8310 - acc: 0.5915\n", + "Epoch 6/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 1.7020 - acc: 0.6172\n", + "Epoch 7/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 1.5782 - acc: 0.6386\n", + "Epoch 8/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 1.4444 - acc: 0.6706\n", + "Epoch 9/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 1.2862 - acc: 0.7177\n", + "Epoch 10/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 1.1180 - acc: 0.7656\n", + "Epoch 11/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 0.9341 - acc: 0.8222\n", + "Epoch 12/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 0.7627 - acc: 0.8746\n", + "Epoch 13/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 0.6112 - acc: 0.9196\n", + "Epoch 14/20\n", + "534/534 [==============================] - 1s 2ms/sample - loss: 0.4943 - acc: 0.9331\n", + "Epoch 15/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 0.4015 - acc: 0.9474\n", + "Epoch 
16/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 0.3283 - acc: 0.9558\n", + "Epoch 17/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 0.2693 - acc: 0.9640\n", + "Epoch 18/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 0.2484 - acc: 0.9622\n", + "Epoch 19/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 0.2007 - acc: 0.9680\n", + "Epoch 20/20\n", + "534/534 [==============================] - 1s 1ms/sample - loss: 0.1921 - acc: 0.9698\n", + "2019-07-17 16:35:03 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_core.policies.keras_policy\u001b[0m - Done fitting keras policy model\n", + "2019-07-17 16:35:03 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - Creating states and action examples from collected trackers (by MaxHistoryTrackerFeaturizer(SingleStateFeaturizer))...\n", + "Processed trackers: 100%|███████| 34/34 [00:00<00:00, 4103.78it/s, # actions=68]\n", + "2019-07-17 16:35:03 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.featurizers\u001b[0m - Created 68 action examples.\n", + "Processed actions: 68it [00:00, 9631.33it/s, # examples=68]\n", + "2019-07-17 16:35:03 \u001b[1;30mDEBUG \u001b[0m \u001b[34mrasa_core.policies.memoization\u001b[0m - Memorized 68 unique examples.\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ - "2019-05-03 21:21:13 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_core.agent\u001b[0m - Persisted model to '/work/bot/models/dialogue'\n", - "make: Leaving directory '/work/bot'\n" + "2019-07-17 16:35:04 \u001b[1;30mINFO \u001b[0m \u001b[34mrasa_core.agent\u001b[0m - Persisted model to '/src_models/dialogue'\n", + "make: Leaving directory '/work/coach'\n" ] } ], "source": [ - "!make train -C $BOT_DIR_PATH" + "!make train -C $COACH_DIR_PATH" ] }, { @@ -385,8 +394,6 @@ "name": "stdout", "output_type": "stream", "text": [ - "/usr/local/lib/python3.6/site-packages/requests/__init__.py:91: 
RequestsDependencyWarning: urllib3 (1.25.2) or chardet (3.0.4) doesn't match a supported version!\n", - " RequestsDependencyWarning)\n", "Calling `rasa_core.evaluate` is deprecated. Please use `rasa_core.test` instead.\n", "\n", "WARNING: The TensorFlow contrib module will not be included in TensorFlow 2.0.\n", @@ -395,10 +402,10 @@ " * https://github.com/tensorflow/addons\n", "If you depend on functionality not listed there, please file an issue.\n", "\n", - "2019-05-03 21:21:17.252292: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", - "2019-05-03 21:21:17.270392: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2905000000 Hz\n", - "2019-05-03 21:21:17.271557: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x55efe976d490 executing computations on platform Host. Devices:\n", - "2019-05-03 21:21:17.271656: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", + "2019-07-17 16:35:22.074432: I tensorflow/core/platform/cpu_feature_guard.cc:141] Your CPU supports instructions that this TensorFlow binary was not compiled to use: AVX2 FMA\n", + "2019-07-17 16:35:22.096944: I tensorflow/core/platform/profile_utils/cpu_utils.cc:94] CPU Frequency: 2194805000 Hz\n", + "2019-07-17 16:35:22.098072: I tensorflow/compiler/xla/service/service.cc:150] XLA service 0x5576fe7115f0 executing computations on platform Host. 
Devices:\n", + "2019-07-17 16:35:22.098197: I tensorflow/compiler/xla/service/service.cc:158] StreamExecutor device (0): , \n", "WARNING:tensorflow:From /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/resource_variable_ops.py:435: colocate_with (from tensorflow.python.framework.ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Colocations handled automatically by placer.\n", @@ -423,10 +430,10 @@ "WARNING:tensorflow:From /usr/local/lib/python3.6/site-packages/tensorflow/python/ops/math_grad.py:102: div (from tensorflow.python.ops.math_ops) is deprecated and will be removed in a future version.\n", "Instructions for updating:\n", "Deprecated in favor of operator or tf.math.divide.\n", - "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 6296.36it/s, # trackers=1]\n", + "Processed Story Blocks: 100%|███| 34/34 [00:00<00:00, 4384.65it/s, # trackers=1]\n", "INFO:rasa_core.test:Evaluating 34 stories\n", "Progress:\n", - "100%|███████████████████████████████████████████| 34/34 [00:00<00:00, 68.13it/s]\n", + "100%|███████████████████████████████████████████| 34/34 [00:00<00:00, 55.92it/s]\n", "INFO:rasa_core.test:Finished collecting predictions.\n", "INFO:rasa_core.test:Evaluation Results on CONVERSATION level:\n", "INFO:rasa_core.test:\tCorrect: 34 / 34\n", @@ -493,7 +500,7 @@ } ], "source": [ - "!python -m rasa_core.evaluate --core $BOT_MODELS_DIALOGUE_PATH -s $BOT_STORIES_PATH -o results" + "!python -m rasa_core.evaluate --core $COACH_MODELS_DIALOGUE_PATH -s $COACH_STORIES_PATH -o results" ] }, { @@ -538,7 +545,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 11, "metadata": {}, "outputs": [ { @@ -555,10 +562,10 @@ " " ], "text/plain": [ - "" + "" ] }, - "execution_count": 7, + "execution_count": 11, "metadata": {}, "output_type": "execute_result" } @@ -623,7 +630,7 @@ "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", - "version": "3.6.8" + 
"version": "3.6.9" } }, "nbformat": 4,