fix: ranking and intent based response selector

deeppavlov · Aug 9, 2023 · 8a492bb · 8a492bb
1 parent f99a312
commit 8a492bb
Show file tree

Hide file tree

Showing 15 changed files with 1,074 additions and 3 deletions.
diff --git a/...elector/force_intents_intent_catcher.json → ...intents/force_intents_intent_catcher.json b/...elector/force_intents_intent_catcher.json → ...intents/force_intents_intent_catcher.json
diff --git a/...ed_selector/lets_chat_about_triggers.json → common/intents/lets_chat_about_triggers.json b/...ed_selector/lets_chat_about_triggers.json → common/intents/lets_chat_about_triggers.json
diff --git a/...ased_selector/require_action_intents.json → common/intents/require_action_intents.json b/...ased_selector/require_action_intents.json → common/intents/require_action_intents.json
diff --git a/response_selectors/convers_evaluation_based_selector/tag_based_selection.py b/response_selectors/convers_evaluation_based_selector/tag_based_selection.py
@@ -63,13 +63,13 @@
 LANGUAGE = getenv("LANGUAGE", "EN")
 MAX_TURNS_WITHOUT_SCRIPTS = int(getenv("MAX_TURNS_WITHOUT_SCRIPTS", 5))
 
-force_intents_fname = "force_intents_intent_catcher.json"
+force_intents_fname = "common/intents/force_intents_intent_catcher.json"
 FORCE_INTENTS_IC = json.load(open(force_intents_fname))
 
-lets_chat_about_triggers_fname = "lets_chat_about_triggers.json"
+lets_chat_about_triggers_fname = "common/intents/lets_chat_about_triggers.json"
 LETS_CHAT_ABOUT_PARTICULAR_TOPICS = json.load(open(lets_chat_about_triggers_fname))
 
-require_action_intents_fname = "require_action_intents.json"
+require_action_intents_fname = "common/intents/require_action_intents.json"
 REQUIRE_ACTION_INTENTS = json.load(open(require_action_intents_fname))
 
 LINK_TO_PHRASES = sum([list(list_el) for list_el in skills_phrases_map.values()], [])

diff --git a/response_selectors/ranking_and_intent_based_response_selector/Dockerfile b/response_selectors/ranking_and_intent_based_response_selector/Dockerfile
@@ -0,0 +1,26 @@
+FROM python:3.10
+
+RUN mkdir /src
+
+# Install dependencies before copying the sources so that this layer can be reused when only code changes.
+COPY ./response_selectors/ranking_and_intent_based_response_selector/requirements.txt /src/requirements.txt
+RUN pip install -r /src/requirements.txt
+
+# Build arguments are re-exported as environment variables: SERVICE_PORT is used by CMD below,
+# the remaining ones are read by server.py via getenv at import time.
+ARG SERVICE_PORT
+ENV SERVICE_PORT=${SERVICE_PORT}
+ARG SENTENCE_RANKER_ANNOTATION_NAME
+ENV SENTENCE_RANKER_ANNOTATION_NAME=${SENTENCE_RANKER_ANNOTATION_NAME}
+ARG SENTENCE_RANKER_SERVICE_URL
+ENV SENTENCE_RANKER_SERVICE_URL=${SENTENCE_RANKER_SERVICE_URL}
+ARG SENTENCE_RANKER_TIMEOUT
+ENV SENTENCE_RANKER_TIMEOUT=${SENTENCE_RANKER_TIMEOUT}
+ARG N_UTTERANCES_CONTEXT=5
+ENV N_UTTERANCES_CONTEXT=${N_UTTERANCES_CONTEXT}
+ARG FILTER_TOXIC_OR_BADLISTED=1
+ENV FILTER_TOXIC_OR_BADLISTED=${FILTER_TOXIC_OR_BADLISTED}
+
+COPY ./response_selectors/ranking_and_intent_based_response_selector/ /src/
+WORKDIR /src
+# server.py imports `common.*` and opens `common/intents/*.json` relative to the working directory.
+COPY ./common/ ./common/
+
+
+# Shell form is required here so that ${SERVICE_PORT} is expanded when the container starts.
+CMD gunicorn --workers=1 server:app -b 0.0.0.0:${SERVICE_PORT} --timeout=1200
diff --git a/response_selectors/ranking_and_intent_based_response_selector/README.md b/response_selectors/ranking_and_intent_based_response_selector/README.md
@@ -0,0 +1,18 @@
+# Ranking- and Intent-based Response Selector
+
+## Description
+
+Response Selector is a component that selects the final response among the hypotheses produced by different skills.
+The Ranking- and Intent-based Response Selector uses floating-point scores from a candidate-ranking annotator
+(e.g., Sentence Ranker) to rank the hypotheses, rescales these scores according to the intents and entities
+detected in the last user utterance, and selects the best-ranked hypothesis.
+
+### Parameters
+
+Uses the annotations produced by the candidate annotator named `SENTENCE_RANKER_ANNOTATION_NAME`.
+If any hypothesis lacks these annotations, the selector calls the service at `SENTENCE_RANKER_SERVICE_URL`
+to score the hypotheses against the last `N_UTTERANCES_CONTEXT` utterances.
+The `FILTER_TOXIC_OR_BADLISTED` parameter defines whether toxic hypotheses are filtered out.
+
+## Dependencies
+
+- either candidate annotations by `SENTENCE_RANKER_ANNOTATION_NAME` or service `SENTENCE_RANKER_SERVICE_URL`.
diff --git a/response_selectors/ranking_and_intent_based_response_selector/requirements.txt b/response_selectors/ranking_and_intent_based_response_selector/requirements.txt
@@ -0,0 +1,8 @@
+flask==1.1.1
+itsdangerous==2.0.1
+gunicorn==19.9.0
+requests==2.22.0
+numpy==1.25.0
+sentry-sdk==0.12.3
+jinja2<=3.0.3
+Werkzeug<=2.0.3
diff --git a/response_selectors/ranking_and_intent_based_response_selector/server.py b/response_selectors/ranking_and_intent_based_response_selector/server.py
@@ -0,0 +1,241 @@
+#!/usr/bin/env python
+import json
+import logging
+import numpy as np
+import requests
+import time
+from copy import deepcopy
+from os import getenv
+from typing import List
+
+import sentry_sdk
+from flask import Flask, request, jsonify
+from common.universal_templates import is_any_question_sentence_in_utterance, if_chat_about_particular_topic, \
+    if_not_want_to_chat_about_particular_topic, if_choose_topic, is_switch_topic
+from common.utils import is_toxic_or_badlisted_utterance, get_intents, get_entities, \
+    get_common_tokens_in_lists_of_strings
+
+
+sentry_sdk.init(getenv("SENTRY_DSN"))
+
+logging.basicConfig(format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+app = Flask(__name__)
+
+# Service configuration, read once at import time from environment variables.
+# Key of the hypothesis annotation that holds a precomputed ranking score.
+SENTENCE_RANKER_ANNOTATION_NAME = getenv("SENTENCE_RANKER_ANNOTATION_NAME")
+# URL of the ranking service queried when some hypothesis lacks that annotation.
+SENTENCE_RANKER_SERVICE_URL = getenv("SENTENCE_RANKER_SERVICE_URL")
+SENTENCE_RANKER_TIMEOUT = int(getenv("SENTENCE_RANKER_TIMEOUT"))
+FILTER_TOXIC_OR_BADLISTED = int(getenv("FILTER_TOXIC_OR_BADLISTED"))
+N_UTTERANCES_CONTEXT = int(getenv("N_UTTERANCES_CONTEXT"))
+if not (SENTENCE_RANKER_ANNOTATION_NAME or SENTENCE_RANKER_SERVICE_URL):
+    # An explicit check is used instead of `assert`: assertions are removed under `python -O`,
+    # and the failure now carries a readable message.
+    logger.error("Ranker service URL or annotator name should be given")
+    raise ValueError("Ranker service URL or annotator name should be given")
+
+# Intent configuration shared with other response selectors; files are closed right after loading.
+force_intents_fname = "common/intents/force_intents_intent_catcher.json"
+with open(force_intents_fname, encoding="utf-8") as _f:
+    FORCE_INTENTS_IC = json.load(_f)
+
+lets_chat_about_triggers_fname = "common/intents/lets_chat_about_triggers.json"
+with open(lets_chat_about_triggers_fname, encoding="utf-8") as _f:
+    LETS_CHAT_ABOUT_PARTICULAR_TOPICS = json.load(_f)
+
+require_action_intents_fname = "common/intents/require_action_intents.json"
+with open(require_action_intents_fname, encoding="utf-8") as _f:
+    REQUIRE_ACTION_INTENTS = json.load(_f)
+
+
+
+def filter_out_badlisted_or_toxic(hypotheses):
+    """Return deep copies of the hypotheses that are not flagged as toxic or badlisted.
+
+    Every hypothesis is checked with `is_toxic_or_badlisted_utterance`; flagged ones are
+    dropped and their text is logged. The input list itself is not modified.
+    """
+    kept = []
+    for candidate in hypotheses:
+        if is_toxic_or_badlisted_utterance(candidate):
+            logger.info(f"Filter out toxic candidate: {candidate['text']}")
+            continue
+        kept.append(deepcopy(candidate))
+    return kept
+
+
+def select_response_by_scores(hypotheses, scores):
+    """Pick the hypothesis with the highest score.
+
+    Returns a `(hypothesis, index)` pair where the index is `np.argmax(scores)`,
+    i.e. the first maximum when several scores are tied.
+    """
+    top_index = np.argmax(scores)
+    return hypotheses[top_index], top_index
+
+
+def get_scores(dialog_context, hypotheses):
+    """Compute one ranking score per hypothesis.
+
+    Sources, in order of preference:
+      1. the `SENTENCE_RANKER_ANNOTATION_NAME` annotation, when every hypothesis has it;
+      2. the ranking service at `SENTENCE_RANKER_SERVICE_URL`, queried with
+         (joined dialog context, hypothesis text) pairs;
+      3. the hypotheses' own `confidence` values, when the service call fails for any reason.
+
+    Returns a list of scores (a numpy array when the service answered).
+    """
+    has_ranker_annotation = [
+        SENTENCE_RANKER_ANNOTATION_NAME in hyp.get("annotations", {}) for hyp in hypotheses
+    ]
+    if all(has_ranker_annotation):
+        scores = [hyp.get("annotations", {}).get(SENTENCE_RANKER_ANNOTATION_NAME, 0.0) for hyp in hypotheses]
+        logger.info("Selected a response via Sentence Ranker Annotator.")
+        return scores
+
+    try:
+        context_text = "\n".join(dialog_context)
+        payload = {"sentence_pairs": [[context_text, hyp["text"]] for hyp in hypotheses]}
+        response = requests.post(
+            SENTENCE_RANKER_SERVICE_URL,
+            json=payload,
+            timeout=SENTENCE_RANKER_TIMEOUT,
+        )
+        scores = np.array(response.json()[0]["batch"])
+        logger.info("Selected a response via Sentence Ranker Service.")
+    except Exception as e:
+        # best-effort fallback: any failure of the ranking service degrades to skill confidences
+        sentry_sdk.capture_exception(e)
+        scores = [hyp["confidence"] for hyp in hypotheses]
+        logger.exception(e)
+        logger.info("Selected a response via Confidence.")
+    return scores
+
+
+def select_response(dialog_context: List[str], hypotheses: List[dict], last_human_ann_uttr: dict, prev_bot_uttr: dict):
+    """Select the best hypothesis using ranking scores rescaled by user intents and entities.
+
+    Base scores come from `get_scores`; hypotheses of `dummy_skill` are penalized by 1.
+    Each score is then adjusted by the first rule that applies:
+      1. the hypothesis' skill is listed in `FORCE_INTENTS_IC` for a detected user intent: +1.0;
+      2. the user wants to switch topic (switch request, refusal to chat about a topic, or asks the bot
+         to choose a topic): hypotheses repeating the user's entities are divided by 1.5, hypotheses with
+         other entities are multiplied by 1.5; if the user named no entities, hypotheses offering
+         a topic are multiplied by 1.5;
+      3. the user wants to chat about a topic: hypotheses sharing entities with the user are multiplied by 1.5;
+      4. the user asks a question with an intent from `REQUIRE_ACTION_INTENTS`: hypotheses having one of
+         the required intents are multiplied by 1.5.
+
+    Args:
+        dialog_context: texts of the last utterances, passed to `get_scores`.
+        hypotheses: annotated candidate responses; each needs at least `skill_name` and `text`.
+        last_human_ann_uttr: annotated last user utterance.
+        prev_bot_uttr: previous bot utterance, passed to `if_choose_topic`.
+
+    Returns:
+        The hypothesis (an element of `hypotheses`) with the highest adjusted score.
+    """
+    scores = get_scores(dialog_context, hypotheses)
+    scores = [score if hyp["skill_name"] != "dummy_skill" else score - 1 for score, hyp in zip(scores, hypotheses)]
+
+    # --------------------------------------------------------------------------------------------------------------
+    # intent-based scaling
+    human_intents = get_intents(last_human_ann_uttr, which="all")
+    human_named_entities = get_entities(last_human_ann_uttr, only_named=True, with_labels=False)
+    human_entities = get_entities(last_human_ann_uttr, only_named=False, with_labels=False)
+    _human_names_entities = len(human_named_entities) > 0 or len(human_entities) > 0
+
+    _human_is_switch_topic_request = is_switch_topic(last_human_ann_uttr)
+    _human_is_any_question = is_any_question_sentence_in_utterance(last_human_ann_uttr)
+    _human_wants_to_chat_about_topic = (
+        if_chat_about_particular_topic(last_human_ann_uttr) and "about it" not in last_human_ann_uttr["text"].lower()
+    )
+    _human_does_not_want_to_chat_about_topic = if_not_want_to_chat_about_particular_topic(last_human_ann_uttr)
+    _human_wants_bot_to_choose_topic = if_choose_topic(last_human_ann_uttr, prev_bot_uttr)
+    # the three signals below are treated alike: the user wants to leave the current topic
+    _human_wants_to_switch_topic = (
+        _human_is_switch_topic_request or _human_does_not_want_to_chat_about_topic or _human_wants_bot_to_choose_topic
+    )
+
+    # force intents: detected user intents that must be answered by particular skills
+    _human_force_intents_detected = [_intent for _intent in FORCE_INTENTS_IC if _intent in human_intents]
+    _human_is_force_intent = len(_human_force_intents_detected) > 0
+    _human_force_intents_skills = sum(
+        [FORCE_INTENTS_IC.get(_intent, []) for _intent in _human_force_intents_detected], []
+    )
+
+    # require-action intents: detected user intents that expect particular intents in the response
+    _human_require_action_intents_detected = [
+        _intent for _intent in REQUIRE_ACTION_INTENTS if _intent in human_intents
+    ]
+    # if user utterance contains any question AND requires some intent by socialbot
+    _human_is_require_action_intent = _human_is_any_question and len(_human_require_action_intents_detected) > 0
+    _human_required_actions = sum(
+        [REQUIRE_ACTION_INTENTS.get(_intent, []) for _intent in _human_require_action_intents_detected], []
+    )
+
+    # NOTE(review): multiplying/dividing by 1.5 moves a negative score in the opposite direction
+    # (dummy_skill scores are shifted by -1 above) - confirm that this is intended.
+    for hyp_id, hyp in enumerate(hypotheses):
+        hyp_intents = get_intents(hyp, which="all")
+        hyp_named_entities = get_entities(hyp, only_named=True, with_labels=False)
+        hyp_entities = get_entities(hyp, only_named=False, with_labels=False)
+        # identifies if candidate shares tokens of named entities with the last human utterance
+        _same_named_entities = (
+            len(get_common_tokens_in_lists_of_strings(hyp_named_entities, human_named_entities)) > 0
+        )
+        # identifies if candidate shares tokens of any (not only named) entities with the last human utterance
+        _same_entities = len(get_common_tokens_in_lists_of_strings(hyp_entities, human_entities)) > 0
+        _same_topic_entity = _same_named_entities or _same_entities
+        _is_force_intent_skill = hyp["skill_name"] in _human_force_intents_skills and _human_is_force_intent
+        _hyp_wants_to_chat_about_topic = if_chat_about_particular_topic(hyp) and "about it" not in hyp["text"].lower()
+
+        if _is_force_intent_skill:
+            scores[hyp_id] += 1.0
+        elif _human_wants_to_switch_topic:
+            # human wants to switch topic
+            if _human_names_entities:
+                # user names the entities they do not want to talk about
+                if _same_topic_entity:
+                    # if hyp contains the same entities, decrease score
+                    scores[hyp_id] /= 1.5
+                elif len(hyp_named_entities) > 0 or len(hyp_entities) > 0:
+                    # if hyp contains other entities, increase score
+                    scores[hyp_id] *= 1.5
+            else:
+                # user does not name the entities they do not want to talk about
+                if _hyp_wants_to_chat_about_topic:
+                    # if hyp contains offer on chat about some entities, increase score
+                    scores[hyp_id] *= 1.5
+        elif _human_wants_to_chat_about_topic:
+            # user asks to talk about a particular topic
+            if _same_topic_entity:
+                # if hyp contains requested entities, increase score
+                scores[hyp_id] *= 1.5
+        elif _human_is_require_action_intent:
+            # human intents require some action from hyp
+            if set(hyp_intents).intersection(set(_human_required_actions)):
+                # if hyp contains intents required by human intent
+                scores[hyp_id] *= 1.5
+
+    # --------------------------------------------------------------------------------------------------------------
+
+    logger.info(f"Scores for selection:\n`{scores}`")
+    result = select_response_by_scores(hypotheses, scores)[0]
+    logger.info(f"ranking_and_intent_based_response_selector selected:\n`{result}`")
+
+    return result
+
+
+@app.route("/respond", methods=["POST"])
+def respond():
+    """Select one response for every dialog of the request batch.
+
+    Expects a JSON body with a `dialogs` list. For each dialog the hypotheses of the last human
+    utterance are (optionally) filtered for toxicity, scored by `select_response`, and the winner
+    is split into the fields returned to the caller.
+
+    Returns:
+        JSON list with one `[skill_name, text, confidence, human_attributes, bot_attributes, attributes]`
+        entry per dialog, where `attributes` is what is left of the selected hypothesis after
+        the other fields and its `annotations` are removed.
+    """
+    st_time = time.time()
+
+    dialogs = request.json["dialogs"]
+
+    selected_skill_names = []
+    selected_responses = []
+    selected_confidences = []
+    selected_human_attributes = []
+    selected_bot_attributes = []
+    selected_attributes = []
+
+    for dialog in dialogs:
+        hypotheses = list(dialog["human_utterances"][-1]["hypotheses"])
+        if FILTER_TOXIC_OR_BADLISTED:
+            hypotheses = filter_out_badlisted_or_toxic(hypotheses)
+        # NOTE(review): if every hypothesis is filtered out, selection below fails on an empty list -
+        # confirm that upstream always provides at least one non-toxic hypothesis.
+        hypotheses_texts = "\n".join([f'{h["skill_name"]} (conf={h["confidence"]}): {h["text"]}' for h in hypotheses])
+        logger.info(f"Hypotheses: {hypotheses_texts}")
+        dialog_context = [uttr["text"] for uttr in dialog["utterances"][-N_UTTERANCES_CONTEXT:]]
+        # a dialog may have no bot utterances yet; avoid IndexError on an empty list
+        # (presumably `if_choose_topic` accepts an empty dict - verify against common.universal_templates)
+        prev_bot_uttr = dialog["bot_utterances"][-1] if dialog["bot_utterances"] else {}
+        selected_resp = select_response(
+            dialog_context,
+            hypotheses,
+            dialog["human_utterances"][-1],
+            prev_bot_uttr,
+        )
+        try:
+            best_id = hypotheses.index(selected_resp)
+        except Exception as e:
+            sentry_sdk.capture_exception(e)
+            logger.exception(e)
+            logger.info(
+                "Exception in finding selected response in hypotheses. "
+                "Selected a response with the highest confidence."
+            )
+            selected_resp, best_id = select_response_by_scores(hypotheses, [hyp["confidence"] for hyp in hypotheses])
+
+        # Split the winner into output fields exactly once, outside the try block, so that a failure
+        # here can never leave the parallel result lists with different lengths.
+        best_hyp = hypotheses[best_id]
+        selected_responses.append(best_hyp.pop("text"))
+        selected_skill_names.append(best_hyp.pop("skill_name"))
+        selected_confidences.append(best_hyp.pop("confidence"))
+        selected_human_attributes.append(best_hyp.pop("human_attributes", {}))
+        selected_bot_attributes.append(best_hyp.pop("bot_attributes", {}))
+        best_hyp.pop("annotations", {})
+        selected_attributes.append(best_hyp)
+
+    total_time = time.time() - st_time
+    logger.info(f"ranking_and_intent_based_response_selector exec time = {total_time:.3f}s")
+    return jsonify(
+        list(
+            zip(
+                selected_skill_names,
+                selected_responses,
+                selected_confidences,
+                selected_human_attributes,
+                selected_bot_attributes,
+                selected_attributes,
+            )
+        )
+    )
+
+
+# Direct execution starts Flask's built-in server on port 3000; the Dockerfile CMD (gunicorn) and the
+# service.yml `command` (flask run) import `server` as a module and do not go through this branch.
+if __name__ == "__main__":
+    app.run(debug=False, host="0.0.0.0", port=3000)
diff --git a/...se_selector/service_configs/ranking-and-intent-based-response-selector-ru/environment.yml b/...se_selector/service_configs/ranking-and-intent-based-response-selector-ru/environment.yml
@@ -0,0 +1,8 @@
+SERVICE_PORT: 8002
+SERVICE_NAME: response_selector
+SENTENCE_RANKER_ANNOTATION_NAME: dialogrpt
+SENTENCE_RANKER_SERVICE_URL: http://dialogrpt-ru:8122/rank_sentences
+SENTENCE_RANKER_TIMEOUT: 3
+N_UTTERANCES_CONTEXT: 5
+FILTER_TOXIC_OR_BADLISTED: 1
+FLASK_APP: server
diff --git a/...sponse_selector/service_configs/ranking-and-intent-based-response-selector-ru/service.yml b/...sponse_selector/service_configs/ranking-and-intent-based-response-selector-ru/service.yml
@@ -0,0 +1,29 @@
+name: ranking-and-intent-based-response-selector-ru
+endpoints:
+- respond
+compose:
+  env_file: [ .env ]
+  build:
+    args:
+      SERVICE_PORT: 8002
+      SERVICE_NAME: response_selector
+      SENTENCE_RANKER_ANNOTATION_NAME: dialogrpt
+      SENTENCE_RANKER_SERVICE_URL: http://dialogrpt-ru:8122/rank_sentences
+      SENTENCE_RANKER_TIMEOUT: 3
+      N_UTTERANCES_CONTEXT: 5
+      FILTER_TOXIC_OR_BADLISTED: 1
+      FLASK_APP: server
+    context: .
+    dockerfile: ./response_selectors/ranking_and_intent_based_response_selector/Dockerfile
+  command: flask run -h 0.0.0.0 -p 8002
+  environment:
+    - FLASK_APP=server
+  deploy:
+    resources:
+      limits:
+        memory: 100M
+      reservations:
+        memory: 100M
+  ports:
+  - 8002:8002
+proxy: null
diff --git a/...ponse_selector/service_configs/ranking-and-intent-based-response-selector/environment.yml b/...ponse_selector/service_configs/ranking-and-intent-based-response-selector/environment.yml
@@ -0,0 +1,8 @@
+SERVICE_PORT: 8002
+SERVICE_NAME: response_selector
+SENTENCE_RANKER_ANNOTATION_NAME: sentence_ranker
+SENTENCE_RANKER_SERVICE_URL: http://sentence-ranker:8128/respond
+SENTENCE_RANKER_TIMEOUT: 3
+N_UTTERANCES_CONTEXT: 5
+FILTER_TOXIC_OR_BADLISTED: 1
+FLASK_APP: server
diff --git a/..._response_selector/service_configs/ranking-and-intent-based-response-selector/service.yml b/..._response_selector/service_configs/ranking-and-intent-based-response-selector/service.yml
@@ -0,0 +1,30 @@
+name: ranking-and-intent-based-response-selector
+endpoints:
+- respond
+compose:
+  env_file: [ .env ]
+  build:
+    args:
+      SERVICE_PORT: 8002
+      SERVICE_NAME: response_selector
+      LANGUAGE: EN
+      SENTENCE_RANKER_ANNOTATION_NAME: sentence_ranker
+      SENTENCE_RANKER_SERVICE_URL: http://sentence-ranker:8128/respond
+      SENTENCE_RANKER_TIMEOUT: 3
+      N_UTTERANCES_CONTEXT: 5
+      FILTER_TOXIC_OR_BADLISTED: 1
+      FLASK_APP: server
+    context: .
+    dockerfile: ./response_selectors/ranking_and_intent_based_response_selector/Dockerfile
+  command: flask run -h 0.0.0.0 -p 8002
+  environment:
+    - FLASK_APP=server
+  deploy:
+    resources:
+      limits:
+        memory: 100M
+      reservations:
+        memory: 100M
+  ports:
+  - 8002:8002
+proxy: null