Source code for volttron.platform.dbutils.basedb

# -*- coding: utf-8 -*- {{{
# vim: set fenc=utf-8 ft=python sw=4 ts=4 sts=4 et:
#
# Copyright 2019, Battelle Memorial Institute.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
# This material was prepared as an account of work sponsored by an agency of
# the United States Government. Neither the United States Government nor the
# United States Department of Energy, nor Battelle, nor any of their
# employees, nor any jurisdiction or organization that has cooperated in the
# development of these materials, makes any warranty, express or
# implied, or assumes any legal liability or responsibility for the accuracy,
# completeness, or usefulness or any information, apparatus, product,
# software, or process disclosed, or represents that its use would not infringe
# privately owned rights. Reference herein to any specific commercial product,
# process, or service by trade name, trademark, manufacturer, or otherwise
# does not necessarily constitute or imply its endorsement, recommendation, or
# favoring by the United States Government or any agency thereof, or
# Battelle Memorial Institute. The views and opinions of authors expressed
# herein do not necessarily state or reflect those of the
# United States Government or any agency thereof.
#
# PACIFIC NORTHWEST NATIONAL LABORATORY operated by
# BATTELLE for the UNITED STATES DEPARTMENT OF ENERGY
# under Contract DE-AC05-76RL01830
# }}}


import contextlib
import importlib
import logging
import threading
from gevent.local import local

import sys
from abc import abstractmethod
from volttron.platform.agent import utils
from volttron.platform import jsonapi
import sqlite3

utils.setup_logging()
_log = logging.getLogger(__name__)


[docs]class ConnectionError(Exception):
    """Custom class for connection errors"""
    pass


[docs]@contextlib.contextmanager
def closing(obj):
    try:
        yield obj
    finally:
        try:
            obj.close()
        except BaseException as exc:
            # if exc.__class__.__module__ == 'exceptions':
            if exc.__class__.__module__ == 'builtins':
                # Don't ignore built-in exceptions because they likely indicate
                # a bug that should stop execution. psycopg2.Error subclasses
                # Exception, so the module must also be checked. :-(
                raise
            _log.exception('An exception was raised while closing '
                           'the cursor and is being ignored.')


[docs]class DbDriver(object):
    """
    Parent class used by :py:class:`sqlhistorian.historian.SQLHistorian` to
    do the database operations. This class is inherited by

    - :py:class:`volttron.platform.dbutils.mysqlfuncts.MySqlFuncts`
    - :py:class:`volttron.platform.dbutils.sqlitefuncts.SqlLiteFuncts`

    """
    def __init__(self, dbapimodule, **kwargs):
        thread_name = threading.currentThread().getName()
        if callable(dbapimodule):
            _log.debug("Constructing Driver for %s in thread: %s",
                       dbapimodule.__name__, thread_name)
            connect = dbapimodule
        else:
            _log.debug("Constructing Driver for %s in thread: %s",
                       dbapimodule, thread_name)
            _log.debug("kwargs for connect is %r", kwargs)
            dbapimodule = importlib.import_module(dbapimodule)
            connect = lambda: dbapimodule.connect(**kwargs)
        self.__connect = connect
        self.__connection = None
        self.stash = local()

[docs]    @contextlib.contextmanager
    def bulk_insert(self):
        """
        Function to meet bulk insert requirements. This function can be overridden by historian drivers to yield the
        required method for data insertion during bulk inserts in the respective historians. In this generic case it
        will yield the single insert method

        :yields: insert method
        """
        yield self.insert_data

[docs]    def cursor(self):

        self.stash.cursor = None
        if self.__connection is not None and not getattr(self.__connection, "closed", False):
            try:
                self.stash.cursor = self.__connection.cursor()
                return self.stash.cursor
            except Exception:
                _log.warn("An exception occurred while creating "
                          "a cursor. Will try establishing connection again")
        self.__connection = None
        try:
            self.__connection = self.__connect()
        except Exception as e:
            _log.error("Could not connect to database. Raise ConnectionError")
            raise ConnectionError(e).with_traceback(sys.exc_info()[2])
        if self.__connection is None:
            raise ConnectionError(
                "Unknown error. Could not connect to database")

        # if any exception happens here have it go to the caller.
        self.stash.cursor = self.__connection.cursor()

        return self.stash.cursor

[docs]    def read_tablenames_from_db(self, meta_table_name):
        """
        Reads names of the tables used by this historian to store data,
        topics, metadata, aggregate topics and aggregate metadata

        :param meta_table_name: The volttron metadata table in which table
                                definitions are stored
        :return: table names
        .. code-block:: python

            {
             'data_table': name of table that store data,
             'topics_table':name of table that store list of topics,
             'meta_table':name of table that store metadata,
             'agg_topics_table':name of table that stores aggregate topics,
             'agg_meta_table':name of table that store aggregate metadata
             }
        """
        rows = self.select("SELECT table_id, table_name, table_prefix from " +
                           meta_table_name, None)
        table_names = dict()
        table_prefix = ""
        table_map = {}

        for row in rows:
            table_map[row[0].lower()] = row[1]
            table_prefix = row[2] + "_" if row[2] else ""
            table_names[row[0]] = table_prefix + row[1]

        table_names['agg_topics_table'] = table_prefix + \
            'aggregate_' + table_map['topics_table']
        table_names['agg_meta_table'] = table_prefix + 'aggregate_' + \
            table_map['meta_table']
        return table_names

[docs]    @abstractmethod
    def setup_historian_tables(self):
        """
        Create historian tables if necessary
        """
        pass

[docs]    @abstractmethod
    def get_topic_map(self):
        """
        Returns details of topics in database

        :return: two dictionaries.
        - First one maps topic_name.lower() to topic id  and
        - Second one maps topic_name.lower() to topic name
        """
        pass

[docs]    @abstractmethod
    def get_agg_topics(self):
        """
        Get the list of aggregate topics available

        :return: list of tuples containing
        (agg_topic_name, agg_type, agg_time_period, configured topics/topic
        name pattern)
        """
        pass

[docs]    @abstractmethod
    def get_agg_topic_map(self):
        """
        Get a map of aggregate_topics to aggregate_topic_id

        :return: dict of format
        {(agg_topic_name, agg_type, agg_time_period):agg_topic_id}
        """
        pass

[docs]    @abstractmethod
    def query_topics_by_pattern(self, topic_pattern):
        """
        Return a map of {topi_name.lower():topic_id} that matches the given
        pattern
        :param topic_pattern: pattern to match against topic_name
        :return:
        """
        pass

[docs]    @abstractmethod
    def insert_data_query(self):
        """
        :return: query string to insert data into database
        """
        pass

[docs]    @abstractmethod
    def insert_topic_query(self):
        """
        :return: query string to insert a topic into database
        """
        pass

[docs]    @abstractmethod
    def update_topic_query(self):
        """
        :return: query string to update a topic in database
        """
        pass

[docs]    @abstractmethod
    def insert_meta_query(self):
        """
        :return: query string to insert metadata for a topic into database
        """
        pass

[docs]    @abstractmethod
    def get_aggregation_list(self):
        """
        Return list of aggregation supported by the specific data store

        :return: list of aggregations
        """
        pass

[docs]    @abstractmethod
    def insert_agg_topic_stmt(self):
        """
        :return: query string to insert an aggregate topic into database
        """
        pass

[docs]    @abstractmethod
    def update_agg_topic_stmt(self):
        """
        :return: query string to update an aggregate topic in database
        """
        pass

[docs]    @abstractmethod
    def replace_agg_meta_stmt(self):
        """
        :return: query string to insert metadata for an aggregate topic into
        database
        """
        pass

[docs]    def manage_db_size(self, history_limit_timestamp, storage_limit_gb):
        """
        Optional function to manage database size.

        :param history_limit_timestamp: remove all data older than this timestamp
        :param storage_limit_gb: remove oldest data until database is smaller than this value.
        """
        pass

[docs]    def insert_meta(self, topic_id, metadata):
        """
        Inserts metadata for topic

        :param topic_id: topic id for which metadata is inserted
        :param metadata: metadata
        :return: True if execution completes. Raises exception if unable to
        connect to database
        """
        self.execute_stmt(self.insert_meta_query(),
                          (topic_id, jsonapi.dumps(metadata)), commit=False)
        return True

[docs]    def insert_data(self, ts, topic_id, data):
        """
        Inserts data for topic

        :param ts: timestamp
        :param topic_id: topic id for which data is inserted
        :param data: data value
        :return: True if execution completes. raises Exception if unable to
        connect to database
        """
        self.execute_stmt(self.insert_data_query(),
                          (ts, topic_id, jsonapi.dumps(data)), commit=False)
        return True

[docs]    def insert_topic(self, topic):
        """
        Insert a new topic

        :param topic: topic to insert
        :return: id of the topic inserted if insert was successful.
                 Raises exception if unable to connect to database
        """
        with closing(self.cursor()) as cursor:
            cursor.execute(self.insert_topic_query(), (topic,))
            return cursor.lastrowid

[docs]    def update_topic(self, topic, topic_id):
        """
        Update a topic name

        :param topic: new topic name
        :param topic_id: topic id for which update is done
        :return: True if execution is complete. Raises exception if unable to
        connect to database
        """
        self.execute_stmt(self.update_topic_query(), (topic, topic_id),
                          commit=False)
        return True

[docs]    def insert_agg_meta(self, topic_id, metadata):
        """
        Inserts metadata for aggregate topic

        :param topic_id: aggregate topic id for which metadata is inserted
        :param metadata: metadata
        :return: True if execution completes. Raises exception if connection to
        database fails
        """
        self.execute_stmt(self.replace_agg_meta_stmt(),
                          (topic_id, jsonapi.dumps(metadata)), commit=False)
        return True

[docs]    def insert_agg_topic(self, topic, agg_type, agg_time_period):
        """
        Insert a new aggregate topic

        :param topic: topic name to insert
        :param agg_type: type of aggregation
        :param agg_time_period: time period of aggregation
        :return: id of the topic inserted if insert was successful.
                 Raises exception if unable to connect to database
        """
        with closing(self.cursor()) as cursor:
            cursor.execute(self.insert_agg_topic_stmt(),
                           (topic, agg_type, agg_time_period))
            return cursor.lastrowid

[docs]    def update_agg_topic(self, agg_id, agg_topic_name):
        """
        Update a aggregate topic name

        :param agg_id: topic id for which update is done
        :param agg_topic_name: new aggregate topic name
        :return: True if execution is complete. Raises exception if unable to
        connect to database
        """
        self.execute_stmt(self.update_agg_topic_stmt(),
                          (agg_topic_name, agg_id),commit=False)
        return True

[docs]    def commit(self):
        """
        Commit a transaction

        :return: True if successful, False otherwise
        """
        if self.__connection is not None:
            try:
                self.__connection.commit()
                return True
            except sqlite3.OperationalError as e:
                if "database is locked" in str(e):
                    _log.error("EXCEPTION: SQLITE3 Database is locked. This "
                               "error could occur when there are multiple "
                               "simultaneous read and write requests, making "
                               "individual request to wait more than the "
                               "default timeout period. If you are using "
                               "sqlite for frequent reads and write, please "
                               "configure a higher timeout in agent "
                               "configuration under \n"
                               "config[\"connection\"][\"params\"]["
                               "\"timeout\"]  "
                               "Default value is 10. Timeout units is seconds")
                raise
        _log.warning('connection was null during commit phase.')
        return False

[docs]    def rollback(self):
        """
        Rollback a transaction

        :return: True if successful, False otherwise
        """
        if self.__connection is not None:
            self.__connection.rollback()
            return True
        _log.warning('connection was null during rollback phase.')
        return False

[docs]    def close(self):
        """
        Close connection to database
        :return:
        """
        if self.__connection is not None:
            self.__connection.close()

[docs]    def select(self, query, args=None, fetch_all=True):
        """
        Execute a select statement

        :param query: select statement
        :param args: arguments for the where clause
        :param fetch_all: Set to True if function should return retrieve all
        the records from cursors and return it. Set to False to return cursor.
        :return: resultant rows if fetch_all is True else returns the cursor
        It is up to calling method to close the cursor
        """
        if not args:
            args = ()
        cursor = self.cursor()
        try:
            cursor.execute(query, args)
        except Exception:
            cursor.close()
            raise
        if fetch_all:
            with closing(cursor):
                return cursor.fetchall()
        return cursor

[docs]    def execute_stmt(self, stmt, args=None, commit=False):
        """
        Execute a sql statement

        :param stmt: the statement to execute
        :param args: optional arguments
        :param commit: True if transaction should be committed. Defaults to
        False
        :return: count of the number of affected rows
        """
        if args is None:
            args = ()
        with closing(self.cursor()) as cursor:
            cursor.execute(stmt, args)
            if commit:
                self.commit()
            return cursor.rowcount

[docs]    def execute_many(self, stmt, args, commit=False):
        """
        Execute a sql statement with multiple args

        :param stmt: the statement to execute
        :param args: optional arguments
        :param commit: True if transaction should be committed. Defaults to
        False
        :return: count of the number of affected rows
        """
        with closing(self.cursor()) as cursor:
            cursor.executemany(stmt, args)
            if commit:
                self.commit()
            return cursor.rowcount

[docs]    @abstractmethod
    def query(self, topic_ids, id_name_map, start=None, end=None,
              agg_type=None,
              agg_period=None, skip=0, count=None, order="FIRST_TO_LAST"):
        """
        Queries the raw historian data or aggregate data and returns the
        results of the query

        :param topic_ids: list of topic ids to query for.
        :param id_name_map: dictionary that maps topic id to topic name
        :param start: Start of query timestamp as a datetime.
        :param end: End of query timestamp as a datetime.
        :param agg_type: If this is a query for aggregate data, the type of
                         aggregation ( for example, sum, avg)
        :param agg_period: If this is a query for aggregate data, the time
                           period of aggregation
        :param skip: Skip this number of results.
        :param count: Limit results to this value. When the query is for
                      multiple topics, count applies to individual topics. For
                      example, a query on 2 topics with count=5 will return 5
                      records for each topic
        :param order: How to order the results, either "FIRST_TO_LAST" or
                      "LAST_TO_FIRST"
        :type topic: str or list
        :type start: datetime
        :type end: datetime
        :type skip: int
        :type count: int
        :type order: str
        :return: result of the query in the format:
        .. code-block:: python

            {
            topic_name:[(timestamp1, value1),
                        (timestamp2:,value2),
                        ...],
            topic_name:[(timestamp1, value1),
                        (timestamp2:,value2),
                        ...],
            ...}
        """
        pass

[docs]    @abstractmethod
    def create_aggregate_store(self, agg_type, period):
        """
        Create the data structure (table or collection) that is going to store
        the aggregate data for the give aggregation type and aggregation
        time period. Table name should be constructed as <agg_type>_<period>

        :param agg_type: The type of aggregation. (avg, sum etc.)
        :param agg_time_period: The time period of aggregation
        :return - True if successful, False otherwise
        """
        pass

[docs]    @abstractmethod
    def insert_aggregate_stmt(self, table_name):
        """
        The sql statement to insert collected aggregate for a given time
        period into database

        :param table_name: name of the table into which the aggregate data
                           needs to be inserted
        :return: sql insert/replace statement to insert aggregate data for a
                 specific time slice
        :rtype: str
        """
        pass

[docs]    def insert_aggregate(self, agg_topic_id, agg_type, period, ts,
                         data, topic_ids):
        """
        Insert aggregate data collected for a specific  time period into
        database. Data is inserted into <agg_type>_<period> table

        :param agg_topic_id: topic id
        :param agg_type: type of aggregation
        :param period: time period of aggregation
        :param ts: end time of aggregation period (not inclusive)
        :param data: computed aggregate
        :param topic_ids: topic ids or topic ids for which aggregate was
                          computed
        :return: True if execution was successful, raises exception
        in case of connection failures
        """
        table_name = agg_type + '_' + period
        _log.debug("Inserting aggregate: {} {} {} {} into table {}".format(
            ts, agg_topic_id, jsonapi.dumps(data), str(topic_ids), table_name))
        self.execute_stmt(
            self.insert_aggregate_stmt(table_name),
            (ts, agg_topic_id, jsonapi.dumps(data), str(topic_ids)),
            commit=True)
        return True

[docs]    @abstractmethod
    def collect_aggregate(self, topic_ids, agg_type, start=None, end=None):
        """
        Collect the aggregate data by querying the historian's data store

        :param topic_ids: list of topic ids for which aggregation should be
                          performed.
        :param agg_type: type of aggregation
        :param start_time: start time for query (inclusive)
        :param end_time:  end time for query (exclusive)
        :return: a tuple of (aggregated value, count of records over which
                 this aggregation was computed)
        """
        pass