data-jupyter-notebooks/utils/dwh_utils.py

import pathlib
import yaml
import pandas as pd
from sqlalchemy import create_engine

# Path to credentials YAML file
CREDS_FILEPATH = pathlib.Path.home() / ".superhog-dwh" / "credentials.yml"

def read_credentials(yaml_path=CREDS_FILEPATH, env="prd"):
    with open(yaml_path, "r") as file:
        credentials = yaml.safe_load(file)
    return credentials["envs"][env]

def create_postgres_engine(creds: dict):
    user = creds["user"]
    password = creds["password"]
    host = creds["host"]
    port = creds["port"]
    database = creds["database"]
    connection_string = f"postgresql://{user}:{password}@{host}:{port}/{database}"
    return create_engine(connection_string)

def query_to_dataframe(engine, query: str):
    with engine.connect() as connection:
        df = pd.read_sql(query, connection)
    return df

# Optional test function to validate setup
def test_connection():
    print(f"🔌 Testing connection using credentials at: {CREDS_FILEPATH}")
    try:
        creds = read_credentials()
        engine = create_postgres_engine(creds)
        df = query_to_dataframe(engine, "SELECT 1;")
        print("✅ Connection successful.")

    except Exception as e:
        print("❌ Connection failed:")
        print(e)

# Only run the test if this script is executed directly
if __name__ == "__main__":
    test_connection()