Skip to content

Commit

Permalink
erdl#119 create orm_lonoa.py to replace other orm files
Browse files Browse the repository at this point in the history
  • Loading branch information
matthew-schultz committed Dec 22, 2019
1 parent 65609c5 commit 7c08604
Showing 1 changed file with 212 additions and 0 deletions.
212 changes: 212 additions & 0 deletions orm_lonoa.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,212 @@
#!./env/bin/python3
"""
This module defines classes for the postgresql tables that store database insertion success and readings
and functions relating to those tables
"""
from pathlib import Path #used to read config.txt in parent directory
from sqlalchemy import create_engine
from sqlalchemy import BigInteger, Boolean, Column, Integer, String
from sqlalchemy.dialects.postgresql import DOUBLE_PRECISION, TIMESTAMP
from sqlalchemy.ext.declarative import declarative_base
from sqlalchemy.sql import func
from sqlalchemy.schema import ForeignKey
from sqlalchemy.types import Enum

import configparser
# import csv
import enum
import os


# needs to be in the same scope as all ORM table classes because they are subclasses of declarative_base class
BASE = declarative_base()


class Project(BASE):
    """
    This class represents the project table

    Each row identifies one project by the folder that holds its files.

    Columns:
        project_folder_path: the full path of the folder where a project's files and folders are stored;
            doubles as the primary key, so each folder path maps to at most one project row
    """
    __tablename__ = 'project'

    # natural primary key: the project's root folder path
    project_folder_path = Column(String, primary_key=True)


class Reading(BASE):
    """
    This class represents the readings table

    The table contains data read by the sensor for given units of time (usually minutes).
    Rows are keyed by (datetime, purpose_id), so one reading per purpose per timestamp.

    Columns:
        datetime: the reading's datetime (part of the composite primary key)
        purpose_id: unique id representing a purpose; foreign key into sensor_info
        units: unit string for the reading value
        reading: the numerical value of a reading
        upload_timestamp: when the row was inserted; defaults to the database's now()
        log_id: optional link to the error_log row recorded for the insertion run
    """
    __tablename__ = 'reading'

    datetime = Column(TIMESTAMP, primary_key=True)
    purpose_id = Column(BigInteger, ForeignKey('sensor_info.purpose_id'), primary_key=True)
    units = Column(String(length=255), nullable=False)
    reading = Column(DOUBLE_PRECISION, nullable=False)
    # func.now() makes the database fill the timestamp at insert time
    upload_timestamp = Column(TIMESTAMP, default=func.now(), nullable=False)
    log_id = Column(Integer, ForeignKey('error_log.log_id'))


class SensorInfo(BASE):
    """
    Sources of readings

    One row per "purpose" (a single measured quantity from a sensor).

    Columns:
        purpose_id: uniquely identifies a purpose
        query_string: string used in egauge and webctrl API requests; hobo sensor serial number; one query_string may have multiple purposes (egauge)
        data_sensor_info_mapping: matches full column name in raw data (egauge api data, hobo csv's, etc)
        type: string that represents one column name in data from a sensor if one row of data has multiple readings
        script_folder: string representing source of readings; e.g. egauge, webctrl, hobo
        is_active: boolean representing if script can request data from a sensor
        last_updated_datetime: used to keep track of datetime of last successfully inserted reading
        unit: unit of readings
    """
    __tablename__ = 'sensor_info'

    class ScriptFolderEnum(enum.Enum):
        """
        This class defines strings that could be inserted into sensor_info.script_folder

        Each member names one acquisition-script source of readings.
        """
        egauge = "egauge"
        hobo = "hobo"
        webctrl = "webctrl"

    purpose_id = Column(Integer, primary_key=True)
    # descriptive/location metadata about the sensor
    building = Column(String(length=50))
    variable_name = Column(String(length=50))
    unit = Column(String(length=20))
    type = Column(String(length=50))
    appliance = Column(String(length=30))
    room = Column(String(length=30))
    surface = Column(String(length=50))
    sample_resolution = Column(String(length=20))
    # acquisition details (see class docstring for semantics)
    query_string = Column(String(length=255))
    note = Column(String(length=255))
    data_sensor_info_mapping = Column(String)
    script_folder = Column(Enum(ScriptFolderEnum))
    is_active = Column(Boolean)
    # high-water mark: datetime of the last successfully inserted reading
    last_updated_datetime = Column(TIMESTAMP)


class ErrorLog(BASE):
    """
    This class represents the error_log table

    This table is the "historian" of the database and should help the entire team troubleshoot problems.
    While it is not an oracle of all errors, it should help narrow down the problem space.
    2 new rows will be added to this table every time the script runs
    (one per pipeline stage — see PipelineStageEnum).

    Columns:
        log_id: uniquely identifies a row
        purpose_id: unique id representing a purpose
        datetime: when an api request or a reading insertion was attempted
        was_success: boolean representing if api script ran successfully or not
        error_type: name of python exception caught; should remain empty if no exception was caught
        pipeline_stage: the stage of the api script execution when an error_log row was inserted
    """
    __tablename__ = 'error_log'

    class PipelineStageEnum(enum.Enum):
        """
        This class defines strings that could be inserted into error_log.pipeline_stage

        Each string represents at what stage of the api script execution an error_log row was inserted:
        data_acquisition: obtaining readings from source
        database_insertion: inserting new rows into readings table
        """
        data_acquisition = "data_acquisition"
        database_insertion = "database_insertion"

    # the sqlalchemy orm requires a primary key in each table
    log_id = Column(Integer, primary_key=True)
    # NOTE(review): purpose_id is a plain Integer here, not a ForeignKey into
    # sensor_info like reading.purpose_id — confirm whether that is intentional
    purpose_id = Column(Integer)
    datetime = Column(TIMESTAMP)
    was_success = Column(Boolean)
    error_type = Column(String)
    pipeline_stage = Column(Enum(PipelineStageEnum))


class ErrorLogDetails(BASE):
    """
    This class represents the error_log_details table that houses any extra info needed to troubleshoot script problems.

    error_log_details is a long-form (key/value) table: each row attaches one named
    piece of information to an error_log entry.
    It is currently used with hobo scripts to store fields like filename, first and last reading timestamps,
    as one hobo has multiple files, with potentially repeated names.

    Columns:
        log_id: the error_log row this detail belongs to (part of composite primary key)
        information_type: name of the stored field, e.g. "filename" (part of composite primary key)
        information_value: the stored value, always as a string
    """
    __tablename__ = 'error_log_details'

    # composite primary key: one value per (log entry, field name) pair
    log_id = Column(Integer, primary_key=True)
    information_type = Column(String, primary_key=True)
    information_value = Column(String)


class ApiAuthentication(BASE):
    """
    User info for authentication

    Used when connecting to api's like webctrl.

    Columns:
        user_id: uniquely identifies a credential row
        script_folder: which acquisition script (egauge/hobo/webctrl) the credentials belong to
        username: account name used for the api
        password: account password used for the api
    """
    __tablename__ = 'api_authentication'

    user_id = Column(Integer, primary_key=True)
    # reuses SensorInfo's enum so credential rows share the same source vocabulary
    script_folder = Column(Enum(SensorInfo.ScriptFolderEnum))
    username = Column(String)
    # NOTE(review): password appears to be stored in plaintext — confirm whether
    # database-level access control is considered sufficient protection here
    password = Column(String)


def setup(config_path=None):
    """
    Use defined classes to create tables in the database named in config file

    The config file is a headerless key=value file that must contain a 'db'
    entry naming the local postgresql database.

    :param config_path: optional path to the config file. Defaults to
        'config.txt' in the current working directory.
        NOTE(review): teardown() defaults to config.txt two directories above
        this file (the same path is commented out below) — confirm which
        location is intended and unify the two defaults.
    :raises FileNotFoundError: if the config file does not exist
    :raises KeyError: if the config file has no 'db' entry
    """
    if config_path is None:
        # config_path = str(Path(os.path.dirname(os.path.realpath(__file__))).parent.parent) + "/config.txt"
        config_path = "config.txt"
    with open(config_path, "r") as file:
        # prepend '[DEFAULT]\n' since ConfigParser requires section headers in config files
        config_string = '[DEFAULT]\n' + file.read()
    config = configparser.ConfigParser()
    config.read_string(config_string)
    # connect over the local unix socket to the named database
    db_url = "postgresql:///" + config['DEFAULT']['db']
    db = create_engine(db_url)
    # create_all is idempotent: existing tables are left untouched
    BASE.metadata.create_all(db)


def teardown(config_path=None):
    """
    Drop all tables in the database named in config file

    The config file is a headerless key=value file that must contain a 'db'
    entry naming the local postgresql database.

    :param config_path: optional path to the config file. Defaults to
        'config.txt' two directories above this module's file.
        NOTE(review): setup() defaults to './config.txt' instead — confirm
        which location is intended and unify the two defaults.
    :raises FileNotFoundError: if the config file does not exist
    :raises KeyError: if the config file has no 'db' entry
    """
    if config_path is None:
        config_path = str(Path(os.path.dirname(os.path.realpath(__file__))).parent.parent) + "/config.txt"
    with open(config_path, "r") as file:
        # prepend '[DEFAULT]\n' since ConfigParser requires section headers in config files
        config_string = '[DEFAULT]\n' + file.read()
    config = configparser.ConfigParser()
    config.read_string(config_string)
    # connect over the local unix socket to the named database
    db_url = "postgresql:///" + config['DEFAULT']['db']
    db = create_engine(db_url)
    BASE.metadata.drop_all(db)
    # to drop a single table instead: Reading.__table__.drop(db)

# def export_reading_to_csv(db_url=DB_URL, output_filename='reading_dump.csv'):
# db = create_engine(db_url)
# Session = sessionmaker(db)
# session = Session()
#
# with open(output_filename, 'w') as outfile:
# outcsv = csv.writer(outfile)
# rows = session.query(Reading)
# for row in rows:
# outcsv.writerow([row.reading_id, row.query_string, row.timestamp, row.units, row.reading])
# session.close()

0 comments on commit 7c08604

Please sign in to comment.