Source code for aepsych.database.db

#!/usr/bin/env python3
# Copyright (c) Facebook, Inc. and its affiliates.
# All rights reserved.

# This source code is licensed under the license found in the
# LICENSE file in the root directory of this source tree.

import datetime
import logging
import os
import uuid
from contextlib import contextmanager
from pathlib import Path
from typing import Dict

import aepsych.database.tables as tables
from sqlalchemy import create_engine
from sqlalchemy.orm import sessionmaker
from sqlalchemy.orm.session import close_all_sessions

# getLogger() without a name returns the root logger, so this module logs
# through the root logger rather than a module-specific one.
logger = logging.getLogger()


class Database:
    """SQLite-backed store for experiment records, built on SQLAlchemy.

    Constructing an instance creates an engine for the given path, creates
    the tables declared in ``aepsych.database.tables`` and opens a long-lived
    session (``self._session``).  The ``get_*`` and ``record_*`` methods all
    go through that session; ``session_scope`` and ``execute_sql_query`` use
    a short-lived session of their own instead.
    """

    def __init__(self, db_path=None):
        """Open (or create) the database file at ``db_path``.

        Args:
            db_path: Path of the SQLite file.  When None,
                ``./databases/default.db`` is used.
        """
        if db_path is None:
            db_path = "./databases/default.db"

        db_dir, db_name = os.path.split(db_path)
        self._db_name = db_name
        self._db_dir = db_dir

        if os.path.exists(db_path):
            logger.info(f"Found DB at {db_path}, appending!")
        else:
            logger.info(f"No DB found at {db_path}, creating a new DB!")

        self._engine = self.get_engine()

    def get_engine(self):
        """Return the engine, building it (plus tables and session) if needed.

        The engine is built on first use and again after ``delete_db`` has
        reset ``_engine`` to None.  Building it also creates the parent
        directory, the table schema and a fresh ``self._session``.
        """
        if getattr(self, "_engine", None) is None:
            db_dir = Path(self._db_dir)
            db_dir.mkdir(parents=True, exist_ok=True)
            self._full_db_path = db_dir.joinpath(self._db_name)

            self._engine = create_engine(f"sqlite:///{self._full_db_path.as_posix()}")

            # create the table metadata and tables
            tables.Base.metadata.create_all(self._engine)

            # create an ongoing session to be used. Provides a conduit
            # to the db so the instantiated objects work properly.
            # Bind to the engine directly; calling get_engine() here would
            # just re-enter this method.
            Session = sessionmaker(bind=self._engine)
            self._session = Session()

        return self._engine

    def delete_db(self):
        """Close all sessions and delete the database file, if it exists.

        Afterwards ``_engine`` is None, so the next ``get_engine`` call
        builds a new engine for the same path.
        """
        if self._engine is not None and self._full_db_path.exists():
            close_all_sessions()
            # Also release the engine's pooled connections so no handle to
            # the file is left open when it is removed.
            self._engine.dispose()
            self._full_db_path.unlink()
            self._engine = None

    def is_update_required(self):
        """Return a truthy value if any known table reports it needs an update."""
        return (
            tables.DBMasterTable.requires_update(self._engine)
            or tables.DbReplayTable.requires_update(self._engine)
            or tables.DbStratTable.requires_update(self._engine)
            or tables.DbConfigTable.requires_update(self._engine)
            or tables.DbRawTable.requires_update(self._engine)
            or tables.DbParamTable.requires_update(self._engine)
            or tables.DbOutcomeTable.requires_update(self._engine)
        )

    def perform_updates(self):
        """Perform updates on known tables. SQLAlchemy doesn't do alters so they're done the old fashioned way."""
        tables.DBMasterTable.update(self._engine)
        tables.DbReplayTable.update(self._engine)
        tables.DbStratTable.update(self._engine)
        tables.DbConfigTable.update(self._engine)
        # NOTE(review): unlike the other tables, DbRawTable.update is given
        # this Database as well as the engine -- presumably it reads existing
        # records through it; confirm against tables.py.
        tables.DbRawTable.update(self, self._engine)
        tables.DbParamTable.update(self._engine)
        tables.DbOutcomeTable.update(self._engine)

    @contextmanager
    def session_scope(self):
        """Provide a transactional scope around a series of operations.

        Yields a new session, commits when the ``with`` body finishes, and
        rolls back and re-raises if the body (or the commit) fails.  The
        session is always closed on exit.
        """
        Session = sessionmaker(bind=self.get_engine())
        session = Session()
        try:
            yield session
            session.commit()
        except Exception as err:
            logger.error(f"db session use failed: {err}")
            session.rollback()
            raise
        finally:
            session.close()

    # @retry(stop_max_attempt_number=8, wait_exponential_multiplier=1.8)
    def execute_sql_query(self, query: str, vals: Dict[str, str]):
        """Execute an arbitrary query written in sql.

        Args:
            query: SQL text; bound parameters are written as ``:name``.
            vals: Values for the bound parameters, keyed by name.

        Returns:
            All rows of the result, as returned by ``fetchall()``.
        """
        # Function-scope import so the module's import block is untouched.
        from sqlalchemy import text

        # SQLAlchemy 2.x refuses bare strings in Session.execute(); wrapping
        # them in text() is accepted by older releases as well.
        if isinstance(query, str):
            query = text(query)

        with self.session_scope() as session:
            return session.execute(query, vals).fetchall()

    def get_master_records(self):
        """Grab the list of master records."""
        return self._session.query(tables.DBMasterTable).all()

    def get_master_record(self, experiment_id):
        """Return the master record with this experiment id, or None if absent."""
        return (
            self._session.query(tables.DBMasterTable)
            .filter(tables.DBMasterTable.experiment_id == experiment_id)
            .first()
        )

    def get_replay_for(self, master_id):
        """Get the replay records for a specific master row (None if no such row)."""
        master_record = self.get_master_record(master_id)
        if master_record is None:
            return None
        return master_record.children_replay

    def get_strats_for(self, master_id=0):
        """Get every strat stored for a master row.

        Returns None when the row does not exist or has no strat records.
        """
        master_record = self.get_master_record(master_id)
        if master_record is None or len(master_record.children_strat) == 0:
            return None
        return [child.strat for child in master_record.children_strat]

    def get_strat_for(self, master_id, strat_id=-1):
        """Get one strat of a master row, by position (default: the last one).

        Returns None when the row does not exist or has no strat records.
        """
        master_record = self.get_master_record(master_id)
        if master_record is None or len(master_record.children_strat) == 0:
            return None
        return master_record.children_strat[strat_id].strat

    def get_config_for(self, master_id):
        """Get the first config stored for a specific master row.

        Returns None when the row does not exist or has no config records,
        matching how the strat getters treat a missing record.
        """
        master_record = self.get_master_record(master_id)
        if master_record is None or len(master_record.children_config) == 0:
            return None
        return master_record.children_config[0].config

    def get_raw_for(self, master_id):
        """Get the raw data records for a specific master row (None if no such row)."""
        master_record = self.get_master_record(master_id)
        if master_record is None:
            return None
        return master_record.children_raw

    def _find_raw(self, master_id, iteration_id):
        """Return the raw record of an experiment whose unique_id matches, or None."""
        raw_records = self.get_raw_for(master_id)
        if raw_records is None:
            return None
        for raw in raw_records:
            if raw.unique_id == iteration_id:
                return raw
        return None

    def get_all_params_for(self, master_id):
        """Get the parameters for all the iterations of a specific experiment.

        Returns a flat list across all raw records, or None if the
        experiment does not exist.
        """
        raw_records = self.get_raw_for(master_id)
        if raw_records is None:
            return None
        return [param for raw in raw_records for param in raw.children_param]

    def get_param_for(self, master_id, iteration_id):
        """Get the parameters for a specific iteration of a specific experiment.

        Returns None when the experiment or the iteration is not found.
        """
        raw = self._find_raw(master_id, iteration_id)
        return None if raw is None else raw.children_param

    def get_all_outcomes_for(self, master_id):
        """Get the outcomes for all the iterations of a specific experiment.

        Returns a flat list across all raw records, or None if the
        experiment does not exist.
        """
        raw_records = self.get_raw_for(master_id)
        if raw_records is None:
            return None
        return [outcome for raw in raw_records for outcome in raw.children_outcome]

    def get_outcome_for(self, master_id, iteration_id):
        """Get the outcomes for a specific iteration of a specific experiment.

        Returns None when the experiment or the iteration is not found.
        """
        raw = self._find_raw(master_id, iteration_id)
        return None if raw is None else raw.children_outcome

    def _add_and_commit(self, entry):
        """Add ``entry`` to the long-lived session and commit, rolling back on failure."""
        self._session.add(entry)
        try:
            self._session.commit()
        except Exception:
            # Roll back so the shared session stays usable for later calls,
            # then let the caller see the original error.
            self._session.rollback()
            raise

    def _new_replay_record(self, message_type, request, parent):
        """Build (without saving) a replay row for ``request`` linked to ``parent``."""
        record = tables.DbReplayTable()
        record.message_type = message_type
        record.message_contents = request

        # request may be None (record_setup's default), so guard the lookup.
        if request is not None and "extra_info" in request:
            record.extra_info = request["extra_info"]

        record.timestamp = datetime.datetime.now()
        record.parent = parent
        return record

    def record_setup(
        self,
        description,
        name,
        extra_metadata=None,
        id=None,
        request=None,
        participant_id=None,
    ) -> "tables.DBMasterTable":
        """Record a setup message, creating the master row when ``id`` is None.

        Args:
            description: Experiment description stored on a new master row.
            name: Experiment name stored on a new master row.
            extra_metadata: Stored as-is on a new master row.
            id: Experiment id of an existing master row to attach to; when
                None a new master row with a generated experiment id is made.
            request: The setup message; stored as the replay row's contents.
                Its ``"extra_info"`` entry, if any, is stored separately.
            participant_id: Participant id for a new master row; a UUID is
                generated when None.

        Returns:
            The master row, which must be passed to the other ``record_*``
            calls so their rows are linked to it.

        Raises:
            RuntimeError: If ``id`` is given but no such experiment exists.
        """
        self.get_engine()

        if id is None:
            master_table = tables.DBMasterTable()
            master_table.experiment_description = description
            master_table.experiment_name = name
            master_table.experiment_id = str(uuid.uuid4())
            # no p_id specified will result in a generated UUID
            master_table.participant_id = (
                participant_id if participant_id is not None else str(uuid.uuid4())
            )
            master_table.extra_metadata = extra_metadata

            self._session.add(master_table)

            logger.debug(f"record_setup = [{master_table}]")
        else:
            master_table = self.get_master_record(id)
            if master_table is None:
                raise RuntimeError(f"experiment id {id} doesn't exist in the db.")

        record = self._new_replay_record("setup", request, master_table)
        logger.debug(f"record_setup = [{record}]")

        self._add_and_commit(record)

        # return the master table if it has a link to the list of child rows
        # this needs to be passed into all future calls to link properly
        return master_table

    def record_message(self, master_table, type, request) -> None:
        """Store ``request`` as a replay row of the given message type.

        Args:
            master_table: Master row the new replay row is linked to.
            type: Message type label stored on the row.
            request: The message; its ``"extra_info"`` entry, if any, is
                stored separately.
        """
        self._add_and_commit(self._new_replay_record(type, request, master_table))

    def record_raw(self, master_table, model_data, timestamp=None):
        """Store a raw data row linked to ``master_table`` and return it.

        Args:
            master_table: Master row the new raw row is linked to.
            model_data: Stored as-is on the row.
            timestamp: Timestamp for the row; the current time when None.

        Returns:
            The new raw row, used as the parent for ``record_param`` and
            ``record_outcome``.
        """
        raw_entry = tables.DbRawTable()
        raw_entry.model_data = model_data
        raw_entry.timestamp = (
            datetime.datetime.now() if timestamp is None else timestamp
        )
        raw_entry.parent = master_table

        self._add_and_commit(raw_entry)
        return raw_entry

    def record_param(self, raw_table, param_name, param_value) -> None:
        """Store one named parameter value linked to the raw row ``raw_table``."""
        param_entry = tables.DbParamTable()
        param_entry.param_name = param_name
        param_entry.param_value = param_value
        param_entry.parent = raw_table

        self._add_and_commit(param_entry)

    def record_outcome(self, raw_table, outcome_name, outcome_value) -> None:
        """Store one named outcome value linked to the raw row ``raw_table``."""
        outcome_entry = tables.DbOutcomeTable()
        outcome_entry.outcome_name = outcome_name
        outcome_entry.outcome_value = outcome_value
        outcome_entry.parent = raw_table

        self._add_and_commit(outcome_entry)

    def record_strat(self, master_table, strat):
        """Store ``strat`` with the current time, linked to ``master_table``."""
        strat_entry = tables.DbStratTable()
        strat_entry.strat = strat
        strat_entry.timestamp = datetime.datetime.now()
        strat_entry.parent = master_table

        self._add_and_commit(strat_entry)

    def record_config(self, master_table, config):
        """Store ``config`` with the current time, linked to ``master_table``."""
        config_entry = tables.DbConfigTable()
        config_entry.config = config
        config_entry.timestamp = datetime.datetime.now()
        config_entry.parent = master_table

        self._add_and_commit(config_entry)

    def list_master_records(self):
        """Print one line per master record (unique id, name, experiment id)."""
        master_records = self.get_master_records()

        print("Listing master records:")
        for record in master_records:
            print(
                f'\t{record.unique_id} - name: "{record.experiment_name}" experiment id: {record.experiment_id}'
            )
AEPsych

Source code for aepsych.database.db

AEPsych

Navigation

Related Topics