-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdata_loader.py
183 lines (149 loc) · 6.69 KB
/
data_loader.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
import os
import time
import json
import geopandas as gpd
import requests
from geopandas import GeoSeries
from shapely.geometry import Point
import pandas as pd
from string_decode import decode_string
TEMP_DIR = "temp"
class ZueriData:
def __init__(self):
self.end_url = "https://www.zuerich.com/en/api/v2/data"
self.api_url = self.end_url + "?id="
self.temp_dir = TEMP_DIR
def get_endpoint_list(self):
print('Retrieving Zürich Tourism API endpoints...')
try:
api_endpoints_raw = requests.get(self.end_url)
api_ids_names = {item.get('id'): item.get('name').get('de') for item in api_endpoints_raw.json() if
not item.get('name').get('de') is None}
except Exception as e:
print(f'Error: {e}')
api_ids_names = {101: 'Error Retrieving data...'}
return api_ids_names
def get_api_data(self, api_id=101):
print(f'Checking for cached version of API endpoint with id {api_id}')
# Check if the data is already cached and not older than 24h
if os.path.exists(f'{self.temp_dir}/{api_id}.json') and os.path.getctime(
f'{self.temp_dir}/{api_id}.json') > time.time() - (60 * 60 * 24):
print('Loading cached data...')
with open(f'{self.temp_dir}/{api_id}.json', 'r') as f:
data = json.load(f)
return data
else:
print('No cached data found, retrieving fresh API data...')
try:
response = requests.get(self.api_url + str(api_id))
data = response.json()
with open(f'{self.temp_dir}/{api_id}.json', 'w') as f:
json.dump(data, f)
except Exception as e:
print(f'Error: {e}')
data = {}
return data
def load_transform_save_antenna_data():
# Prepare antenna data
filepath = 'static/antennenstandorte-5g_de.json'
ant_gdf = gpd.read_file(filepath)
# Use WGS 84 (epsg:4326) as the geographic coordinate system
ant_gdf = ant_gdf.to_crs(epsg=4326)
# Convert powercode_de to integer value
# dictionary to convert antenna power data
powercodes = {"Sehr Klein": 2, "Klein": 3, "Mittel": 5, "Gross": 10}
# convert powercode_de to integer value
ant_gdf["power_int"] = ant_gdf["powercode_de"].apply(lambda x: powercodes.get(x))
# create lat and lon columns in ant_gdf
ant_gdf['lat'] = ant_gdf.geometry.y
ant_gdf['lon'] = ant_gdf.geometry.x
# Assuming `gdf` is your GeoPandas DataFrame
ant_gdf.to_file("static/ant_gdf.json", driver='GeoJSON')
def load_transform_save_political_shape_geo_data():
# Set the file path to the shapefile
# shapefile = "static/Grenzen.shp/swissBOUNDARIES3D_1_5_TLM_BEZIRKSGEBIET.shp"
# shapefile = "static/Grenzen.shp/swissBOUNDARIES3D_1_5_TLM_KANTONSGEBIET.shp"
shapefile = "static/Grenzen.shp/swissBOUNDARIES3D_1_5_TLM_HOHEITSGEBIET.shp"
# load Shape file into GeoDataFrame
gdf = gpd.GeoDataFrame.from_file(shapefile)
# Convert to WGS84
gdf.crs = "EPSG:2056" # Use CH1903+ / LV95 (epsg:2056)
# Use WGS84 (epsg:4326) as the geographic coordinate system
gdf = gdf.to_crs(epsg=4326)
# print(gdf.columns)
gdf['DICHTE'] = gdf['EINWOHNERZ'] / gdf['KANTONSFLA'] * 1000 # BEZIRKSFLA, KANTONSFLA
# Correct string encoding for the NAME column
gdf['NAME'] = gdf['NAME'].apply(decode_string)
# Save the GeoDataFrame to a GeoJSON file
gdf.to_file("static/gdf_gem.json", driver='GeoJSON')
def load_transform_ev_station_data():
print("Loading EV data from URL...")
url = "https://data.geo.admin.ch/ch.bfe.ladestellen-elektromobilitaet/data/oicp/ch.bfe.ladestellen-elektromobilitaet.json"
response = requests.get(url)
data = response.json()
stations = data.get("EVSEData")[0].get("EVSEDataRecord")
station_ids = []
coordinates = []
plugs = []
names = []
for station in stations:
station_ids.append(station.get("EvseID"))
current_plugs = [station for station in station.get("Plugs")]
coordinates.append(station.get("GeoCoordinates").get("Google"))
# plugs.append({str(i):str(station) for i, station in enumerate(station.get("Plugs"))})
plugs_str = ", ".join([str(plug) for plug in current_plugs])
plugs.append(plugs_str)
names.append(station.get("ChargingStationNames")[0].get("value"))
print("Data Size: ", len(coordinates))
print("Sample coordinates: ", coordinates[:5])
print("Sample plug count: ", plugs[:5])
print("Sample names: ", names[:5])
ev_gdf = gpd.GeoDataFrame(geometry=GeoSeries())
ev_gdf['EvseID'] = station_ids
ev_gdf['name'] = names
ev_gdf['lat'] = [float(coord.split(" ")[0]) for coord in coordinates]
ev_gdf['lon'] = [float(coord.split(" ")[1]) for coord in coordinates]
ev_gdf['plugs'] = plugs
ev_gdf['geometry'] = [Point(xy) for xy in zip(ev_gdf['lon'], ev_gdf['lat'])]
ev_gdf.set_geometry('geometry')
# save to json file
ev_gdf.to_file("static/ev_gdf.json", driver='GeoJSON')
return ev_gdf
def get_live_ev_station_data():
print("Loading EV data from URL...")
# Ladestationen verfügbarkeit
url = "https://data.geo.admin.ch/ch.bfe.ladestellen-elektromobilitaet/status/oicp/ch.bfe.ladestellen-elektromobilitaet.json"
response = requests.get(url)
data = response.json()
stations = data.get("EVSEStatuses")[0].get("EVSEStatusRecord")
live_ev_df = pd.DataFrame(stations)
# save to json file
live_ev_df.to_json("static/live_ev_df.json", orient='records', lines=True)
return live_ev_df
def load_map_save_antenna_data():
print("Loading mobile antenna data...")
filepath = "static/mobilfunkanlagen.json"
gdf = gpd.read_file(filepath)
print("Converting to epsg4326...")
gdf.set_crs(epsg=2056, inplace=True)
gdf = gdf.to_crs(epsg=4326)
print("Columns: ", gdf.columns)
print("Shape: ", gdf.shape)
print(gdf.head())
print(gdf.index)
print("Mapping power codes...")
power_dict = {"Leistungsklasse : sehr klein (bis 6 W)": 2,
"Leistungsklasse : klein (bis 500 W)": 3,
"Leistungsklasse : mittel (bis 5'000 W)": 5,
"Leistungsklasse : gross (über 5'000 W)": 10,}
gdf["power_code"] = gdf["power_de"].map(power_dict)
gdf = gdf[['geometry', 'typ_de', 'techno_de', 'power_de', 'power_code']]
# Save as GeoJSON
gdf.to_file("static/mobilfunk.json", driver="GeoJSON")
print("Done.")
if __name__ == "__main__":
# load_transform_save_antenna_data()
# load_transform_save_political_shape_geo_data()
# load_transform_ev_station_data()
print(get_live_ev_station_data().head())
print("Done.")