aboutsummaryrefslogtreecommitdiffstats
path: root/entsoe2pgsql.py
diff options
context:
space:
mode:
authorDennis Eriksen <d@ennis.no>2022-09-14 12:35:43 +0200
committerDennis Eriksen <d@ennis.no>2022-09-14 12:35:43 +0200
commite58dc713bef769c55efb42a76b6e058c28122bf4 (patch)
tree9f8bf9710cdfba33dd8b04eff630e15610c40a8d /entsoe2pgsql.py
parentSometimes there's a delay before new data is available. Increase the (diff)
downloadenergyscripts-e58dc713bef769c55efb42a76b6e058c28122bf4.tar.gz
Adding Entsoe as a data source. Also adding Norges Bank, since Entsoes
prices are in Euros, and I need an exchange-rate.
Diffstat (limited to 'entsoe2pgsql.py')
-rwxr-xr-xentsoe2pgsql.py103
1 files changed, 103 insertions, 0 deletions
diff --git a/entsoe2pgsql.py b/entsoe2pgsql.py
new file mode 100755
index 0000000..ef99fca
--- /dev/null
+++ b/entsoe2pgsql.py
@@ -0,0 +1,103 @@
+#!/bin/python3
+
+import os
+import sys
+import json
+import psycopg2
+import requests
+import xmltodict
+
+from datetime import datetime
+from datetime import timedelta
+from tzlocal import get_localzone
+from dateutil import tz
+
+
+# variables
+apiKey = os.environ['entsoe_token']
+apiUrl = "https://transparency.entsoe.eu/api?securityToken=" + apiKey
+
+pg_db = os.environ['pg_db']
+pg_host = os.environ['pg_host']
+pg_table = "entsoe"
+
+startTime = datetime.now(get_localzone()) - timedelta(days = 7)
+startTime = startTime.strftime('%Y%m%d')
+
+endTime = datetime.now(get_localzone()).strftime('%Y%m%d')
+
+areas = [ {"name": "NO-0", "code": "10YNO-0--------C"},
+ {"name": "NO-1", "code": "10YNO-1--------2"},
+ {"name": "NO-2", "code": "10YNO-2--------T"},
+ {"name": "NO-3", "code": "10YNO-3--------J"},
+ {"name": "NO-4", "code": "10YNO-4--------9"} ]
+
+UTC = tz.gettz('UTC')
+CET = tz.gettz('Europe/Oslo')
+
+
+# Get the data
+values=[]
+for area in areas:
+ try:
+ url = apiUrl + "&documentType=A44&in_Domain=" + area["code"] + "&out_Domain=" + area["code"] + "&periodStart=" + startTime + "0000&periodEnd=" + endTime + "0000"
+
+ print("Getting data for " + area["code"])
+ response = requests.get(url)
+ if response.status_code != 200:
+ print(response.status_code)
+ print("Oh shit")
+ response.raise_for_status()
+
+ except Exception as e:
+ print("oh lol")
+ sys.exit(e)
+
+ data_dict = xmltodict.parse(response.content)
+
+ items = 0
+ if "Publication_MarketDocument" in data_dict:
+ for lista in data_dict["Publication_MarketDocument"]["TimeSeries"]:
+ utctime = datetime.strptime(lista["Period"]["timeInterval"]["start"], "%Y-%m-%dT%H:%MZ")
+ utctime = utctime.replace(tzinfo = UTC)
+ cettime = utctime.astimezone(CET)
+ items += len(lista["Period"]["Point"])
+
+ for item in lista["Period"]["Point"]:
+ # the response contains timerange, but not timestamp for every price, so we must calculate it
+ time = str(cettime + timedelta(hours = int(item["position"]) - 1))
+
+ # append values
+ values.append((time, area["name"], item["price.amount"]))
+ print("Got " + str(items) + " records")
+
+
+# connect to db
+conn = psycopg2.connect(database=pg_db, host=pg_host)
+cur = conn.cursor()
+
+# count rows before we start
+cur.execute("SELECT COUNT(*) FROM " + pg_table)
+before = cur.fetchone()
+
+# insert data
+print("Inserting into database")
+try:
+ cur.executemany("INSERT INTO " + pg_table + " VALUES(%s,%s,%s) ON CONFLICT (starttime, zone) DO NOTHING", values)
+ conn.commit()
+except Exception as e:
+ conn.rollback()
+ raise e
+
+# count rows after we finnish
+cur.execute("SELECT COUNT(*) FROM " + pg_table)
+after = cur.fetchone()
+
+# count *new* rows
+newRows = after[0] - before[0]
+
+# close connection
+conn.close()
+
+
+print("Successfully inserted " + str(newRows) + " records into the database")