Success Markers CLI (RasaHQ#9824)

* Create stubs to start filling out Aciel's snippet

  Co-authored-by: Aciel Eshky <a.eshky@rasa.com>
* Sketch out basics of CLI arguments
* Start changing over args to new format
* Make CLI match description from design pass
* Add tests
* Switch over timestamps to event IDs
* Fix tests now event IDs are supported
* Start work on doc comments
* Switch over event_id fix

  Also removes otherwise-unused import to stop circularity
* Address PR comments
* Fix incorrect file extension
* Codeclimate
* Update rasa/core/evaluation/marker_base.py

  Co-authored-by: Kathrin Bujna <kathrin.bujna@gmail.com>
* Address PR comments
* Move test to marker
* Rename dialogue to session

Co-authored-by: Aciel Eshky <a.eshky@rasa.com>
Co-authored-by: Kathrin Bujna <kathrin.bujna@gmail.com>
kode-git · Nov 1, 2021 · 18ca40c · 18ca40c
1 parent 52ad480
commit 18ca40c
Show file tree

Hide file tree

Showing 10 changed files with 527 additions and 24 deletions.
diff --git a/rasa/__main__.py b/rasa/__main__.py
@@ -23,6 +23,7 @@
     train,
     visualize,
     x,
+    evaluate,
 )
 from rasa.cli.arguments.default_arguments import add_logging_options
 from rasa.cli.utils import parse_last_positional_argument_as_model_path
@@ -69,6 +70,7 @@ def create_argument_parser() -> argparse.ArgumentParser:
     data.add_subparser(subparsers, parents=parent_parsers)
     export.add_subparser(subparsers, parents=parent_parsers)
     x.add_subparser(subparsers, parents=parent_parsers)
+    evaluate.add_subparser(subparsers, parents=parent_parsers)
 
     return parser
 

diff --git a/rasa/cli/arguments/evaluate.py b/rasa/cli/arguments/evaluate.py
@@ -0,0 +1,61 @@
+import argparse
+from rasa.cli.arguments.default_arguments import add_endpoint_param, add_domain_param
+
+
+def set_markers_arguments(parser: argparse.ArgumentParser) -> None:
+    """Specifies arguments for `rasa evaluate markers`.
+
+    Registers the positional output filename, the `--config` path, the
+    mutually exclusive `--no-stats` / `--stats-file` options, and the endpoint
+    and domain parameters provided by the default-argument helpers.
+
+    Args:
+        parser: The parser to add the arguments to.
+    """
+    parser.add_argument(
+        "output_filename",
+        type=str,
+        help="The filename to write the extracted markers to (CSV format).",
+    )
+
+    parser.add_argument(
+        "--config",
+        default="markers.yml",
+        type=str,
+        help="The config file(s) containing marker definitions. This can be a single "
+        "YAML file, or a directory that contains several files with marker "
+        "definitions in it. The content of these files will be read and merged "
+        "together.",
+    )
+
+    stats = parser.add_mutually_exclusive_group()
+
+    # `stats` is the "compute statistics" switch: it must be True by default
+    # and `--no-stats` must turn it off. Storing True on `--no-stats` (with a
+    # False default) inverted the flag, so statistics were only produced when
+    # the user explicitly asked for none.
+    stats.add_argument(
+        "--no-stats",
+        default=True,
+        action="store_false",
+        dest="stats",
+        help="Do not compute summary statistics.",
+    )
+
+    stats.add_argument(
+        "--stats-file",
+        default="stats.csv",
+        type=str,
+        help="The filename to write out computed summary statistics.",
+    )
+
+    add_endpoint_param(
+        parser, help_text="Configuration file for the tracker store as a yml file.",
+    )
+
+    add_domain_param(parser)
+
+
+def set_markers_first_n_arguments(parser: argparse.ArgumentParser) -> None:
+    """Adds the arguments of the `first_n` sub-command of `rasa evaluate markers`.
+
+    Args:
+        parser: The parser to add the positional `count` argument to.
+    """
+    count_help = "The number of trackers to extract markers from"
+    parser.add_argument("count", type=int, help=count_help)
+
+
+def set_markers_sample_arguments(parser: argparse.ArgumentParser) -> None:
+    """Adds the arguments of the `sample` sub-command of `rasa evaluate markers`.
+
+    Args:
+        parser: The parser to add the optional `--seed` and the positional
+            `count` arguments to.
+    """
+    seed_help = "Seed to use if selecting trackers by 'sample'"
+    count_help = "The number of trackers to extract markers from"
+
+    parser.add_argument("--seed", type=int, help=seed_help)
+    parser.add_argument("count", type=int, help=count_help)
diff --git a/rasa/cli/evaluate.py b/rasa/cli/evaluate.py
@@ -0,0 +1,156 @@
+import argparse
+from typing import List, Text, Optional
+
+from rasa.core.utils import AvailableEndpoints
+from rasa.core.tracker_store import TrackerStore
+from rasa.core.evaluation.marker_tracker_loader import MarkerTrackerLoader
+from rasa.core.evaluation.marker_base import Marker
+
+from rasa.cli import SubParsersAction
+import rasa.cli.arguments.evaluate as arguments
+import rasa.shared.utils.cli
+import os.path
+
+
+def add_subparser(
+    subparsers: SubParsersAction, parents: List[argparse.ArgumentParser]
+) -> None:
+    """Register the `evaluate` command together with its `markers` sub-commands.
+
+    The resulting tree is `evaluate` -> `markers` -> one of `first_n`,
+    `sample` or `all`.
+
+    Args:
+        subparsers: The sub-parser action the `evaluate` parser is attached to.
+        parents: Parent parsers, handed on to every parser created here.
+    """
+    # All parsers below share these settings; only name and help text differ.
+    shared_options = {
+        "parents": parents,
+        "conflict_handler": "resolve",
+        "formatter_class": argparse.ArgumentDefaultsHelpFormatter,
+    }
+
+    evaluate_parser = subparsers.add_parser(
+        "evaluate", help="Tools for evaluating models.", **shared_options
+    )
+
+    marker_parser = evaluate_parser.add_subparsers().add_parser(
+        "markers",
+        help="Applies marker conditions to existing trackers.",
+        **shared_options,
+    )
+    arguments.set_markers_arguments(marker_parser)
+
+    # The name of the selected sub-command is stored as `strategy`.
+    strategy_parsers = marker_parser.add_subparsers(dest="strategy")
+
+    first_n_parser = strategy_parsers.add_parser(
+        "first_n",
+        help="Select trackers sequentially until N are taken.",
+        **shared_options,
+    )
+    arguments.set_markers_first_n_arguments(first_n_parser)
+
+    sample_parser = strategy_parsers.add_parser(
+        "sample", help="Select trackers by sampling N.", **shared_options
+    )
+    arguments.set_markers_sample_arguments(sample_parser)
+
+    # `all` takes no arguments of its own.
+    strategy_parsers.add_parser("all", help="Select all trackers.", **shared_options)
+
+    marker_parser.set_defaults(func=_run_markers_cli)
+
+
+def _run_markers_cli(args: argparse.Namespace) -> None:
+    """Translate the parsed CLI namespace into a call to `_run_markers`.
+
+    `seed` and `count` are only present on the namespace when it carries
+    them, so both fall back to `None` otherwise. The statistics file is only
+    forwarded when the namespace has a `stats_file` and `args.stats` is truthy.
+
+    Args:
+        args: The arguments passed in from the CLI.
+    """
+    seed = getattr(args, "seed", None)
+    count = getattr(args, "count", None)
+
+    if "stats_file" in args and args.stats:
+        stats_file = args.stats_file
+    else:
+        stats_file = None
+
+    _run_markers(
+        seed,
+        count,
+        args.endpoints,
+        args.strategy,
+        args.config,
+        args.output_filename,
+        stats_file,
+    )
+
+
+def _run_markers(
+    seed: Optional[int],
+    count: Optional[int],
+    endpoint_config: Text,
+    strategy: Text,
+    config: Text,
+    output_filename: Text,
+    stats_file: Optional[Text] = None,
+) -> None:
+    """Extract markers from the trackers of the configured tracker store.
+
+    Reports an error through `print_error_and_exit` when either output path
+    already exists; otherwise loads the markers from `config` and exports
+    them for the trackers selected by `strategy`.
+
+    Args:
+        seed: (Optional) The seed to initialise the random number generator for
+              use with the 'sample' strategy.
+        count: (Optional) Number of trackers to extract from (for any strategy
+               except 'all').
+        endpoint_config: Path to the endpoint configuration defining the tracker
+                         store to use.
+        strategy: Strategy to use when selecting trackers to extract from.
+        config: Path to the markers definition file to use.
+        output_filename: Path to write out the extracted markers.
+        stats_file: (Optional) Path to write out statistics about the extracted
+                    markers.
+    """
+    output_exists = os.path.exists(output_filename)
+    if output_exists:
+        rasa.shared.utils.cli.print_error_and_exit(
+            "A file with the output filename already exists"
+        )
+
+    # The stats path is only checked when statistics were requested at all.
+    if stats_file:
+        if os.path.exists(stats_file):
+            rasa.shared.utils.cli.print_error_and_exit(
+                "A file with the stats filename already exists"
+            )
+
+    loader = _create_tracker_loader(endpoint_config, strategy, count, seed)
+    Marker.from_path(config).export_markers(
+        loader.load(), output_filename, stats_file
+    )
+
+
+def _create_tracker_loader(
+    endpoint_config: Text, strategy: Text, count: Optional[int], seed: Optional[int]
+) -> MarkerTrackerLoader:
+    """Build a `MarkerTrackerLoader` for the tracker store in the endpoint config.
+
+    Args:
+        endpoint_config: Path to the endpoint configuration defining the tracker
+                         store to use.
+        strategy: Strategy to use when selecting trackers to extract from.
+        count: (Optional) Number of trackers to extract from (for any strategy
+               except 'all').
+        seed: (Optional) The seed to initialise the random number generator for
+              use with the 'sample' strategy.
+
+    Returns:
+        A MarkerTrackerLoader object configured with the specified strategy against
+        the configured tracker store.
+    """
+    store_config = AvailableEndpoints.read_endpoints(endpoint_config).tracker_store
+    store = TrackerStore.create(store_config)
+    return MarkerTrackerLoader(store, strategy, count, seed)
diff --git a/rasa/core/evaluation/marker_base.py b/rasa/core/evaluation/marker_base.py
@@ -1,6 +1,8 @@
 from __future__ import annotations
 import os
 from abc import ABC, abstractmethod
+from rasa.shared.core.trackers import DialogueStateTracker
+from rasa.utils.io import WriteRow
 from typing import (
     Dict,
     Iterator,
@@ -27,6 +29,8 @@
 from rasa.shared.core.events import ActionExecuted, UserUttered, Event
 
 import logging
+import csv
+import os.path
 
 logger = logging.getLogger(__name__)
 
@@ -378,7 +382,7 @@ def from_path(path: Union[Path, Text]) -> Marker:
             config = {}
         if not config:
             raise InvalidMarkerConfig(f"Could not load any markers from '{path}'.")
-        return Marker.from_config(config)
+        return Marker.from_config_dict(config)
 
     @staticmethod
     def _load_and_combine_config_files_under(root_dir: Text) -> MarkerConfig:
@@ -485,6 +489,87 @@ def from_config(config: MarkerConfig, name: Optional[Text] = None) -> Marker:
             marker.name = name
         return marker
 
+    def export_markers(
+        self,
+        tracker_loader: Iterator[Optional[DialogueStateTracker]],
+        output_file: Text,
+        stats_file: Optional[Text] = None,
+    ) -> None:
+        """Evaluate this marker on every loaded tracker and write out the results.
+
+        Falsy entries yielded by `tracker_loader` are skipped. Results are
+        keyed by the tracker's sender ID, so a later tracker with the same
+        sender ID replaces an earlier one.
+
+        Args:
+            tracker_loader: The tracker loader to use to select trackers for marker
+                            extraction.
+            output_file: Path to write out the extracted markers.
+            stats_file: (Optional) Path to write out statistics about the extracted
+                        markers.
+        """
+        results_by_sender = {}
+
+        for tracker in tracker_loader:
+            if not tracker:
+                continue
+            extracted = self.evaluate_events(tracker.events)
+            results_by_sender[tracker.sender_id] = extracted
+
+        Marker._save_results(output_file, results_by_sender)
+
+        # Statistics are optional and only computed when a target path is given.
+        if stats_file:
+            Marker._compute_stats(stats_file, results_by_sender)
+
+    @staticmethod
+    def _save_results(
+        path: Text, results: Dict[Text, List[Dict[Text, EventMetaData]]]
+    ) -> None:
+        """Save extracted marker results as CSV to specified path.
+
+        Writes a header row, then delegates to `_write_relevant_events` once
+        per sender and session; the session index is the position of the
+        session in that sender's list.
+
+        Args:
+            path: Path to write out the extracted markers.
+            results: Extracted markers from a selection of trackers, keyed by
+                sender ID with one entry per session.
+        """
+        # The csv module expects files opened with `newline=""`; otherwise the
+        # writer's own line endings are translated again and blank rows appear
+        # on platforms that use "\r\n". The encoding is pinned so the output
+        # does not depend on the platform default.
+        with open(path, "w", newline="", encoding="utf-8") as f:
+            table_writer = csv.writer(f)
+            table_writer.writerow(
+                [
+                    "sender_id",
+                    "session_idx",
+                    "marker_name",
+                    "event_id",
+                    "num_preceding_user_turns",
+                ]
+            )
+            for sender_id, dialogues in results.items():
+                for session_idx, session in enumerate(dialogues):
+                    Marker._write_relevant_events(
+                        table_writer, sender_id, session_idx, session
+                    )
+
+    @staticmethod
+    def _write_relevant_events(
+        writer: WriteRow,
+        sender_id: Text,
+        session_idx: int,
+        session: Dict[Text, EventMetaData],
+    ) -> None:
+        """Write one row per marker occurrence found in a single session.
+
+        Each row holds the sender ID, the session index (as a string), the
+        marker name, and the occurrence's `idx` and `preceding_user_turns`.
+
+        NOTE(review): every value of `session` is iterated, so it looks like
+        a collection of `EventMetaData` rather than a single one as the
+        annotation states - confirm and adjust the annotation.
+
+        Args:
+            writer: The object whose `writerow` receives each row.
+            sender_id: The sender ID written in the first column.
+            session_idx: The index of the session within the sender's sessions.
+            session: The extracted marker metadata, keyed by marker name.
+        """
+        session_label = str(session_idx)
+        for marker_name, occurrences in session.items():
+            for occurrence in occurrences:
+                row = [
+                    sender_id,
+                    session_label,
+                    marker_name,
+                    occurrence.idx,
+                    occurrence.preceding_user_turns,
+                ]
+                writer.writerow(row)
+
+    @staticmethod
+    def _compute_stats(
+        out_file: Text, results: List[Union[Text, Dict[Text, EventMetaData]]]
+    ) -> None:
+        """Compute stats over extracted marker data.
+
+        Not implemented yet: the call currently does nothing and writes no file.
+
+        NOTE(review): `export_markers` passes a dict keyed by sender ID here,
+        which does not match the `results` annotation - confirm the intended
+        shape when implementing this.
+
+        Args:
+            out_file: Path the statistics are meant to be written to.
+            results: The extracted marker data to summarise.
+        """
+        # TODO: Figure out how this is done
+
 
 class CompoundMarker(Marker, ABC):
     """Combines several markers into one."""