# watcher.py
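"""Watch Riffyn for run status changes.

Polls the Riffyn API for runs that have started or stopped, aggregates
plate-based runs into complete sets, and queues triggers for publishing.
"""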
import re

import requests
import riffyn_nexus_sdk_v1 as api

from lib import riffyn, utils
from plugins import registry
from plugins.riffyn.config import PluginConfig
from src.triggers import trigger

cfg = PluginConfig()


class Watcher(registry.Watcher):
    def __init__(self, logger, cache, queue, done):
        super().__init__(logger, cache, queue, done)
        self.logger = logger
        self.cache = cache
        self.queue = queue
        self.done = done
        self.cache_key = cfg.CACHE_KEY
        self.poll_interval = cfg.POLL_INTERVAL

        client = riffyn.Client.default(cfg.API_KEY)
        self.activity_api = api.ProcessActivityApi(client)
        self.experiment_api = api.ExperimentApi(client)
        self.run_api = api.RunApi(client)

        self.partials = {}
    def run(self):
        # Keep polling until a done signal is received
        while not self.done.is_set():
            self.logger.info("runs.poll.started")

            try:
                # Fetch the statuses of all runs in Riffyn
                statuses = self.__fetch_run_statuses()
                for experiment_id, runs in statuses.items():
                    for run in runs["started"]:
                        self.logger.info(
                            "run.started",
                            experiment_id=experiment_id,
                            run_id=run.id,
                            run_name=run.name,
                        )

                        # Try to aggregate across multiple runs for plate-based protocols
                        complete, plate = self.__aggregate(run)

                        # Once we have a complete set of runs to execute
                        # (plate is None for non-plate protocols)
                        if complete:
                            triggers = self.__build_triggers(
                                experiment_id, complete, plate
                            )

                            # Add the triggers to the queue to be published
                            for trg in triggers:
                                self.queue.put(trg)

                        # Add started runs to the cache for tracking
                        self.cache.hset(self.cache_key, run.id, "")

                    for run in runs["stopped"]:
                        self.logger.info(
                            "run.stopped",
                            experiment_id=experiment_id,
                            run_id=run.id,
                            run_name=run.name,
                        )

                        # Check if the run is part of an aggregated set
                        partial = self.__is_partial(run)
                        if partial:
                            key, rows, cols, idx = partial
                            if key in self.partials and idx < len(self.partials[key]):
                                self.partials[key][idx] = None

                        # Remove the stopped run from the cache
                        self.cache.hdel(self.cache_key, run.id)

                self.logger.info("runs.poll.finished")
            except api.rest.ApiException as err:
                self.logger.error(
                    "runs.poll.failed", status=err.status, error=err.reason
                )
            except Exception as err:
                self.logger.error("runs.poll.failed", error=err)

            self.done.wait(self.poll_interval)
    def __fetch_run_statuses(self):
        experiments = self.__fetch_experiments()
        active_runs = self.cache.hgetall(self.cache_key)

        # Select runs that have been started or stopped since we last polled
        runs = {}
        for experiment in experiments:
            status = {"started": [], "stopped": []}
            for run in self.__fetch_runs(experiment.id):
                if run.status == "running" and run.id not in active_runs:
                    status["started"].append(run)
                elif run.status in ("stopped", "new") and run.id in active_runs:
                    status["stopped"].append(run)

            runs[experiment.id] = status

        return runs
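    # The returned mapping has the shape:
    #   {<experiment id>: {"started": [run, ...], "stopped": [run, ...]}}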
    def __fetch_experiments(self):
        experiments = self.experiment_api.list_experiments()
        return experiments.data

    def __fetch_runs(self, experiment_id):
        groups = self.run_api.list_run_groups(experiment_id)
        runs = [
            self.run_api.list_runs(experiment_id, group.id).data
            for group in groups.data
        ]
        return utils.flatten(runs)
    def __aggregate(self, run):
        # Check if the run is part of a plate-based protocol
        partial = self.__is_partial(run)
        if not partial:
            return [run], None

        key, rows, cols, idx = partial
        if key not in self.partials:
            # Pre-fill an array equal to the number of expected partials
            self.partials[key] = [None] * (rows * cols)

        if idx < len(self.partials[key]):
            # Add the run to the aggregated set
            self.partials[key][idx] = run

        # Check that all partial runs in the aggregated set have been populated
        if all(slot is not None for slot in self.partials[key]):
            return self.partials[key], (rows, cols)

        return [], None
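    # For example, with hypothetical run names "Prep [2x3] 1" through
    # "Prep [2x3] 6", the first five calls return ([], None); the call that
    # fills the final well returns all six runs plus the (2, 3) plate shape.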
    def __is_partial(self, run):
        # Check the run name to see if it is part of a plate-based protocol,
        # using the format: <name of run> [<rows>x<columns>] <well index>.
        # Dimensions and indices may be multi-digit (e.g. an 8x12 plate).
        partial = re.search(r"(.*) \[([1-9]\d*)x([1-9]\d*)\] ([1-9]\d*)$", run.name)
        if not partial:
            return False

        # Return the dimensions of the plate and the zero-based well index
        name, rows, cols, num = partial.group(1, 2, 3, 4)
        key = f"{self.cache_key}/{run.activity_id}/{name}"
        return (key, int(rows), int(cols), int(num) - 1)
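    # For example, a hypothetical run named "Growth assay [8x12] 5" parses to
    # rows=8, cols=12 and zero-based well index 4, keyed under
    # "<cache key>/<activity id>/Growth assay".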
    def __build_triggers(self, experiment_id, runs, plate=None):
        # Fetch the experiment's activity and raw data from Riffyn
        activity = self.activity_api.get_activity(experiment_id, runs[0].activity_id)
        data = self.__get_experiment_data_raw(experiment_id, activity.id, runs)

        # Initialise the triggers to be populated
        triggers = self.__init_triggers(experiment_id, activity, runs, plate)

        # Populate each trigger's spec using raw data from the runs
        for trg, resources in triggers.values():
            properties = {}
            for inp in activity.inputs:
                # If the resource is associated with this trigger's API version
                if inp.id in resources:
                    # Add the property header to the trigger
                    for prop in inp.properties:
                        header = f"{activity.id} | input | {inp.id} | {prop.id} | value"
                        properties[utils.str_to_camelcase(prop.name)] = header

            for idx, run in enumerate(runs):
                spec = {}

                # Add each property and its value to the spec object
                for prop, header in properties.items():
                    datatable = data["datatables"][run.id]["datatable"][0]
                    value = datatable[header]
                    if value is not None:
                        spec[prop] = value

                # For plate-based protocols, assign the spec to the corresponding well index
                if isinstance(trg.spec, list):
                    trg.spec[idx] = spec
                else:
                    trg.spec = spec

        return [trg for trg, _ in triggers.values()]
    def __get_experiment_data_raw(self, experiment_id, activity_id, runs):
        resp = requests.get(
            f"https://api.app.riffyn.com/v1/experiment/{experiment_id}/step/{activity_id}/data/raw",
            headers={"api-key": cfg.API_KEY},
            params={
                "rgid": [run.group_id for run in runs],
                "rid": [run.id for run in runs],
                "rnum": [run.num for run in runs],
            },
        )
        resp.raise_for_status()
        return resp.json()
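    # __build_triggers reads this payload as
    # data["datatables"][<run id>]["datatable"][0]: a mapping of column
    # headers ("<activity> | input | <input> | <property> | value") to values.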
    def __init_triggers(self, experiment_id, activity, runs, plate=None):
        # Create a mapping of API version -> (trigger, resource IDs)
        triggers = {}
        protocol = activity.name.title().replace(" ", "")

        for inp in runs[0].inputs:
            try:
                api_version = inp.resource_name

                # If we have not seen this API version before, create a new trigger
                if api_version not in triggers:
                    trg = trigger.Trigger(api_version, protocol)

                    # Initialise the trigger for plate-based protocols
                    if plate:
                        trg.plate(*plate)

                        # Pre-fill the spec with an array equal to the number of runs
                        trg.spec = [None] * len(runs)
                        trg.metadata(
                            "riffyn",
                            [
                                {
                                    "experimentId": experiment_id,
                                    "activityId": activity.id,
                                    "runId": run.id,
                                }
                                for run in runs
                            ],
                        )
                    else:
                        trg.metadata(
                            "riffyn",
                            {
                                "experimentId": experiment_id,
                                "activityId": activity.id,
                                "runId": runs[0].id,
                            },
                        )

                    triggers[api_version] = (trg, [])

                # Add the resource ID to its associated API version
                triggers[api_version][1].append(inp.resource_def_id)
            except trigger.InvalidAPIVersion:
                continue

        return triggers
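
# A minimal wiring sketch (hypothetical, not part of the plugin): the watcher
# expects a structlog-style logger, a Redis-like cache exposing
# hset/hdel/hgetall, a queue with put(), and a threading.Event as the
# shutdown signal. Something along these lines:
#
#   import queue
#   import threading
#
#   import redis
#   import structlog
#
#   done = threading.Event()
#   watcher = Watcher(
#       logger=structlog.get_logger(),
#       cache=redis.Redis(decode_responses=True),
#       queue=queue.Queue(),
#       done=done,
#   )
#   threading.Thread(target=watcher.run, daemon=True).start()
#   ...
#   done.set()  # stop polling after the current poll cycle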