aboutsummaryrefslogblamecommitdiffstats
path: root/entsoe2pgsql.py
blob: ef99fca8514cd8caf8c1cc1810d8cf27b6feb46e (plain) (tree)






































































































                                                                                                                                                                         
#!/bin/python3

import os
import sys
import json
import psycopg2
import requests
import xmltodict

from datetime import datetime
from datetime import timedelta
from tzlocal import get_localzone
from dateutil import tz


# variables
apiKey = os.environ['entsoe_token']
apiUrl = "https://transparency.entsoe.eu/api?securityToken=" + apiKey

pg_db = os.environ['pg_db']
pg_host = os.environ['pg_host']
pg_table = "entsoe"

startTime = datetime.now(get_localzone()) - timedelta(days = 7)
startTime = startTime.strftime('%Y%m%d')

endTime = datetime.now(get_localzone()).strftime('%Y%m%d')

areas = [ {"name": "NO-0", "code": "10YNO-0--------C"},
          {"name": "NO-1", "code": "10YNO-1--------2"},
          {"name": "NO-2", "code": "10YNO-2--------T"},
          {"name": "NO-3", "code": "10YNO-3--------J"},
          {"name": "NO-4", "code": "10YNO-4--------9"} ]
    
UTC = tz.gettz('UTC')
CET = tz.gettz('Europe/Oslo')


# Get the data
values=[]
for area in areas:
    try:
        url = apiUrl + "&documentType=A44&in_Domain=" + area["code"] + "&out_Domain=" + area["code"] + "&periodStart=" + startTime + "0000&periodEnd=" + endTime + "0000"
    
        print("Getting data for " + area["code"])
        response = requests.get(url)
        if response.status_code != 200:
            print(response.status_code)
            print("Oh shit")
            response.raise_for_status()
    
    except Exception as e:
        print("oh lol")
        sys.exit(e)
    
    data_dict = xmltodict.parse(response.content)
    
    items = 0
    if "Publication_MarketDocument" in data_dict:
        for lista in data_dict["Publication_MarketDocument"]["TimeSeries"]:
            utctime = datetime.strptime(lista["Period"]["timeInterval"]["start"], "%Y-%m-%dT%H:%MZ")
            utctime = utctime.replace(tzinfo = UTC)
            cettime = utctime.astimezone(CET)
            items += len(lista["Period"]["Point"])

            for item in lista["Period"]["Point"]:
                # the response contains timerange, but not timestamp for every price, so we must calculate it
                time = str(cettime + timedelta(hours = int(item["position"]) - 1))

                # append values
                values.append((time, area["name"], item["price.amount"]))
    print("Got " + str(items) + " records")
    

# connect to db
conn = psycopg2.connect(database=pg_db, host=pg_host)
cur = conn.cursor()

# count rows before we start
cur.execute("SELECT COUNT(*) FROM " + pg_table)
before = cur.fetchone()

# insert data
print("Inserting into database")
try:
    cur.executemany("INSERT INTO " + pg_table + " VALUES(%s,%s,%s) ON CONFLICT (starttime, zone) DO NOTHING", values)
    conn.commit()
except Exception as e:
    conn.rollback()
    raise e

# count rows after we finnish
cur.execute("SELECT COUNT(*) FROM " + pg_table)
after = cur.fetchone()

# count *new* rows
newRows = after[0] - before[0]

# close connection
conn.close()


print("Successfully inserted " + str(newRows) + " records into the database")