diff options
author | Dennis Eriksen <d@ennis.no> | 2022-09-14 12:35:43 +0200 |
---|---|---|
committer | Dennis Eriksen <d@ennis.no> | 2022-09-14 12:35:43 +0200 |
commit | e58dc713bef769c55efb42a76b6e058c28122bf4 (patch) | |
tree | 9f8bf9710cdfba33dd8b04eff630e15610c40a8d /entsoe2pgsql.py | |
parent | Sometimes there's a delay before new data is available. Increase the (diff) | |
download | energyscripts-e58dc713bef769c55efb42a76b6e058c28122bf4.tar.gz |
Adding Entsoe as a data source. Also adding Norges Bank, since Entsoes
prices are in Euros, and I need an exchange-rate.
Diffstat (limited to 'entsoe2pgsql.py')
-rwxr-xr-x | entsoe2pgsql.py | 103 |
1 files changed, 103 insertions, 0 deletions
diff --git a/entsoe2pgsql.py b/entsoe2pgsql.py new file mode 100755 index 0000000..ef99fca --- /dev/null +++ b/entsoe2pgsql.py @@ -0,0 +1,103 @@ +#!/bin/python3 + +import os +import sys +import json +import psycopg2 +import requests +import xmltodict + +from datetime import datetime +from datetime import timedelta +from tzlocal import get_localzone +from dateutil import tz + + +# variables +apiKey = os.environ['entsoe_token'] +apiUrl = "https://transparency.entsoe.eu/api?securityToken=" + apiKey + +pg_db = os.environ['pg_db'] +pg_host = os.environ['pg_host'] +pg_table = "entsoe" + +startTime = datetime.now(get_localzone()) - timedelta(days = 7) +startTime = startTime.strftime('%Y%m%d') + +endTime = datetime.now(get_localzone()).strftime('%Y%m%d') + +areas = [ {"name": "NO-0", "code": "10YNO-0--------C"}, + {"name": "NO-1", "code": "10YNO-1--------2"}, + {"name": "NO-2", "code": "10YNO-2--------T"}, + {"name": "NO-3", "code": "10YNO-3--------J"}, + {"name": "NO-4", "code": "10YNO-4--------9"} ] + +UTC = tz.gettz('UTC') +CET = tz.gettz('Europe/Oslo') + + +# Get the data +values=[] +for area in areas: + try: + url = apiUrl + "&documentType=A44&in_Domain=" + area["code"] + "&out_Domain=" + area["code"] + "&periodStart=" + startTime + "0000&periodEnd=" + endTime + "0000" + + print("Getting data for " + area["code"]) + response = requests.get(url) + if response.status_code != 200: + print(response.status_code) + print("Oh shit") + response.raise_for_status() + + except Exception as e: + print("oh lol") + sys.exit(e) + + data_dict = xmltodict.parse(response.content) + + items = 0 + if "Publication_MarketDocument" in data_dict: + for lista in data_dict["Publication_MarketDocument"]["TimeSeries"]: + utctime = datetime.strptime(lista["Period"]["timeInterval"]["start"], "%Y-%m-%dT%H:%MZ") + utctime = utctime.replace(tzinfo = UTC) + cettime = utctime.astimezone(CET) + items += len(lista["Period"]["Point"]) + + for item in lista["Period"]["Point"]: + # the response contains timerange, but not timestamp for every price, so we must calculate it + time = str(cettime + timedelta(hours = int(item["position"]) - 1)) + + # append values + values.append((time, area["name"], item["price.amount"])) + print("Got " + str(items) + " records") + + +# connect to db +conn = psycopg2.connect(database=pg_db, host=pg_host) +cur = conn.cursor() + +# count rows before we start +cur.execute("SELECT COUNT(*) FROM " + pg_table) +before = cur.fetchone() + +# insert data +print("Inserting into database") +try: + cur.executemany("INSERT INTO " + pg_table + " VALUES(%s,%s,%s) ON CONFLICT (starttime, zone) DO NOTHING", values) + conn.commit() +except Exception as e: + conn.rollback() + raise e + +# count rows after we finnish +cur.execute("SELECT COUNT(*) FROM " + pg_table) +after = cur.fetchone() + +# count *new* rows +newRows = after[0] - before[0] + +# close connection +conn.close() + + +print("Successfully inserted " + str(newRows) + " records into the database") |