# Source code for blumycelium.mycelium

from . import utils as ut
from . import custom_types
from . import models as mod
from .the_exceptions import *


import pyArango.theExceptions as a_exc

from icecream import ic
ic.configureOutput(includeContext=True)

import logging
logger = logging.getLogger("BLUMYCELIUM")

class ArangoMycelium:
    """A mycelium over ArangoDB.

    Wraps a pyArango connection and stores all job/elf bookkeeping in a
    dedicated database named ``"BLUMYC_" + name``.
    """

    def __init__(self, connection, name):
        """
        connection: pyArango connection object.
        name: unique name for the mycelium; the backing database is
              named "BLUMYC_" + name.
        """
        self.connection = connection
        self.name = name
        self.db_name = "BLUMYC_" + name
        # collection / graph declarations come from the models module
        self.collections = mod.COLLECTIONS
        self.graphs = mod.GRAPHS

        self.db = None
        if not self.connection.hasDatabase(self.db_name):
            logger.warning("Warning: Database %s does not exist. To create it run self.init with init_db=True" % self.db_name)
        else:
            self.db = self.connection[self.db_name]

    def _init_db(self):
        """Create the mycelium database and return it.

        If creation fails (typically because it already exists), fall back to
        fetching the database; re-raise the original CreationError when the
        fetch also fails.
        """
        from pyArango.theExceptions import CreationError

        # use the module logger instead of print, consistent with the rest
        # of the class
        logger.info("Creating database %s", self.db_name)
        try:
            return self.connection.createDatabase(self.db_name)
        except CreationError as e:
            logger.info("Database Creation error %s: => %s", self.db_name, e.message)
            try:
                return self.connection[self.db_name]
            except Exception:
                # could neither create nor fetch: surface the creation failure
                raise e
[docs] def init(self, init_db=False, users_to_create=None) : """ init_db: initialise the database users_to_create: list of dicts {username, password} """ if init_db: self.db = self._init_db() if self.db is None: raise DatabaseNotFoundError("Cannot continue with the initialisation because database does not exist. Try runing init with init_db=True") logger.info("Initializing %s..." % self.db_name) logger.info("-- init collections") self._init_collections(self.db) logger.info("-- init graphs") self._init_graphs(self.db) logger.info("-- init indexes") self._init_indexes(self.db) logger.info("-- init users") if users_to_create: for user in self.users_to_create : self._init_user(self.connection, self.db_name, user["username"], user["password"])
[docs] def drop_jobs(self): """delete all information related to jobs""" for collection in ["Jobs", "Failures", "Parameters", "JobFailures", "JobParameters", "Results", "JobToJob"]: self.db[collection].truncate()
[docs] def drop(self): """delete all documents in the mycelium""" for collection in self.collections: self.db[collection].truncate()
def _init_collections(self, db) : """initialize all collections""" for collection in self.collections : if collection.lower() not in ("collection", "edges", "field") : logger.info("Creating collection", collection) try : db.createCollection(collection, allowUserKeys=True) except Exception as exp : logger.info("Collection Creation error: =>", exp) def _init_graphs(self, db) : """initialize all graphs""" for graph in self.graphs : # ic(graph) if graph.lower() != "graph": logger.info("Creating graph", graph) try : db.createGraph(graph) except Exception as exp : logger.info("Graph Creation error (%s): =>" %graph, exp) def _init_user(self, connection, dbName, username, password) : """initialize all users""" logger.info("creating user: %s" % username) user = connection.users.createUser(username, password) user["extra"] = "Created on: %s, by automatic setup" % ut.gettime() try : user.save() except Exception as e1 : logger.info("Can't create user: '%s' -> " % username, e1) try : user = connection.users.fetchUser(username) except Exception as e2 : raise UserCreationError("Unable to get user: '%s' -> " % username, e2) u.setPermissions(dbName, True) def _init_indexes(self, *args, **kwargs): """initialize all indexes""" logger.info("No indexes defined")
    def register_machine_elf(self, machine_elf, store_source):
        """Register an elf in the mycelium.

        machine_elf: the elf to register (uses .uid, .revision, .source_code,
                     .documentation).
        store_source: if True, also store the elf's source code in
                      MachineElvesRevisions when the revision is new.
        """
        now = ut.gettime()
        first_register = False
        try:
            # elf already known: append this registration to its revision
            # history
            elf_doc = self.db["MachineElves"][machine_elf.uid]
            elf_doc["revisions"]["dates"].append(now)
            # NOTE(review): the self-assignment looks redundant but is
            # presumably needed so pyArango notices the nested mutation —
            # TODO confirm before removing
            elf_doc["revisions"]["dates"] = elf_doc["revisions"]["dates"]
            elf_doc["revisions"]["hashes"].append(machine_elf.revision)
            elf_doc["revisions"]["hashes"] = elf_doc["revisions"]["hashes"]
        except a_exc.DocumentNotFoundError:
            # first registration: create the elf document from scratch
            elf_doc = self.db["MachineElves"].createDocument()
            elf_doc["_key"] = machine_elf.uid
            elf_doc["creation_date"] = now
            elf_doc["revisions"]["dates"] = [elf_doc["creation_date"]]
            elf_doc["revisions"]["hashes"] = [machine_elf.revision]
            first_register = True

        revision_key = ut.legalize_key(machine_elf.revision)
        # store the source only when asked, when the revision changed (or on
        # first registration), and when the revisions collection is available
        if store_source and (elf_doc["last_revision"] != machine_elf.revision or first_register) and (self.db["MachineElvesRevisions"]):
            revision_doc = self.db["MachineElvesRevisions"].createDocument()
            revision_doc["_key"] = revision_key
            revision_doc["source_code"] = machine_elf.source_code
            revision_doc["creation_date"] = now
            revision_doc.save()

        elf_doc["documentation"] = machine_elf.documentation
        elf_doc["last_revision"] = machine_elf.revision
        elf_doc.save()
[docs] def get_job(self, job_id): """get a job""" return self.db["Jobs"][job_id]
def _save_job(self, job, now_date): """save job to the mycelium""" job_key = ut.legalize_key(job.run_job_id) job_doc = self.db["Jobs"].createDocument() job_doc.set( { "_key": job_key, "task" : { "name": job.task.name, "signature": str(job.task.signature), "source_code": job.task.source_code, "documentation": job.task.documentation, "revision": job.task.revision, }, "machine_elf" : { "id": job.worker_elf.uid, "revision": job.worker_elf.revision, }, # "static_parameters": job.parameters.get_static_parameters(), "submit_date" : now_date, "start_date": None, "end_date": None, "status": custom_types.STATUS["PENDING"], } ) job_doc.save() return job_doc def _save_parameters(self, job_doc, params, now): """save a parameters""" # from rich import print def _get_param_doc(node, date): doc = self.db["Parameters"].createDocument() dct = {"creation_date": date} dct.update(node) doc.set(dct) return doc graph = self.db.graphs["JobParameters_graph"] for name, traversal in params.items(): param_doc = _get_param_doc(traversal, now) data = {"creation_date": now, "name": name} graph.link("JobParameters", job_doc, param_doc, data)
[docs] def push_job(self, job): """push a job to the mycelium""" # from rich import print now = ut.gettime() job_doc = self._save_job(job, now) params = job.parameters.get_parameter_dict() self._save_parameters(job_doc, params, now) graph = self.db.graphs["Jobs_graph"] if job.dependencies: for dep in job.dependencies: graph.link("JobToJob", "Jobs/" + dep, job_doc, {"creation_date": now})
[docs] def get_job_parameters(self, job_id): """return the parameters for a job""" aql = """ FOR jparam IN JobParameters FILTER jparam._from == @id FOR node IN Parameters FILTER node._id == jparam._to RETURN { name: jparam.name, node: node } """ bind_vars = {"id": "Jobs/"+ job_id} res_aql = self.db.AQLQuery(aql, bindVars=bind_vars, batchSize=100, rawResults=True) ret = {} for res in res_aql: ret[res["name"]] = res["node"] return ret
[docs] def get_jobs(self, elf_uid:str, all_jobs=False, status_restriction=[custom_types.STATUS["PENDING"]]): """return all jobs for an elf""" bind_vars = {"uid": elf_uid} if all_jobs: status_restriction = list(custom_types.STATUS.values()) str_status_filter = [] for status in status_restriction: pending = "job.status == @%s" % status str_status_filter.append(pending) bind_vars[status] = status if len(str_status_filter) > 0: str_status_filter = "FILTER " + " OR ".join(str_status_filter) else: str_status_filter = "" aql = """ FOR job IN Jobs FILTER job.machine_elf.id == @uid {str_status_filter} SORT job.creation_date DESC RETURN job """.format(str_status_filter=str_status_filter) ret_q = self.db.AQLQuery(aql, bindVars=bind_vars, batchSize=100, rawResults=True) ret = [] for job in ret_q: job["id"] = job["_key"] ret.append(job) return ret
[docs] def is_job_ready(self, job_id): """return True if the job is ready to run""" job_doc = self.get_job(job_id) if job_doc["status"] not in [ custom_types.STATUS["PENDING"], custom_types.STATUS["READY"] ]: return False aql = """ FOR job IN Jobs FILTER job._id == @id FOR jtj in JobToJob FILTER jtj._to == job._id FOR job2 IN Jobs FILTER job2._id == jtj._from RETURN job2 """ ready = 0 count = 0 ret_q = self.db.AQLQuery(aql, bindVars={"id": job_doc["_id"]}, batchSize=100, rawResults=True) for job in ret_q: count += 1 if job["status"] == custom_types.STATUS["DONE"]: ready += 1 self_ready = count == ready return self_ready
[docs] def update_job_status(self, job_id, status): """update the status of a job""" job_doc = self.get_job(job_id) job_doc["status"] = status job_doc.save()
[docs] def start_job(self, job_id): """mark a job as running""" job_doc = self.get_job(job_id) job_doc["status"] = custom_types.STATUS["RUNING"] job_doc["start_date"] = ut.gettime() job_doc.save()
[docs] def complete_job(self, job_id): """mark a job as successful""" job_doc = self.get_job(job_id) job_doc["status"] = custom_types.STATUS["DONE"] job_doc["end_date"] = ut.gettime() job_doc.save()
[docs] def register_job_failure(self, exc_type, exc_value, exc_traceback, job_id): """register a job failure""" import traceback import hashlib e = traceback.extract_tb(exc_traceback) now = ut.gettime() self.update_job_status(job_id, custom_types.STATUS["FAILED"]) trace = traceback.extract_tb(exc_traceback).format() trace_str = "".join(trace).encode("utf-8") trace_key = ut.legalize_key( str( hashlib.sha256(trace_str).hexdigest() ) ) try: failure_doc = self.db["Failures"][trace_key] except a_exc.DocumentNotFoundError: failure_doc = self.db["Failures"].createDocument() failure_doc.set( { "_key": trace_key, "type": str(exc_type), "value": str(exc_value), "traceback": trace, "creation_date": now } ) failure_doc.save() job_doc = self.get_job(job_id) graph = self.db.graphs["JobFailures_graph"] graph.link("JobFailures", job_doc, failure_doc, {"creation_date": now}) job_doc["status"] = custom_types.STATUS["FAILED"] job_doc["end_date"] = ut.gettime() job_doc.save()
[docs] def store_results(self, job_id, results:dict): """store the results of a job""" if results is None: return if not type(results) is dict: raise ResultTypeError("Results must be None or a dictionary") now = ut.gettime() for name, value in results.items(): result_key = value["result_id"] try: result_doc = self.db["Results"][result_key] except a_exc.DocumentNotFoundError: result_doc = self.db["Results"].createDocument() result_doc.set( { "_key": value["result_id"], "name": name, "value": value["value"], "creation_date": now, } ) result_doc.save()
[docs] def get_result(self, result_id): """return the result of a job""" try: result_doc = self.db["Results"][result_id] except a_exc.DocumentNotFoundError: raise ResultNotFound("Unable to retrieve result: %s" % result_id) return result_doc.getStore()["value"]
[docs] def get_job_status(self, job_id): """return the status of a job""" job_doc = self.db["Jobs"][job_id] return job_doc.getStore()["status"]
def get_dependencies_status(self, job_id): aql = """ FOR jj IN JobToJob FILTER jj._to == @id FOR job IN Jobs FILTER jj._from == job._id RETURN { "job_id": job._key, "status": job.status } """ bind_vars = {"id": "Jobs/"+ job_id} res_q = self.db.AQLQuery(aql, bindVars=bind_vars, batchSize=100, rawResults=True) ret = [res for res in res_q] return ret