Repository created, old data ported
commit
db4319e7d6
|
@ -0,0 +1,8 @@
|
|||
# Default ignored files
|
||||
/shelf/
|
||||
/workspace.xml
|
||||
# Editor-based HTTP Client requests
|
||||
/httpRequests/
|
||||
# Datasource local storage ignored files
|
||||
/dataSources/
|
||||
/dataSources.local.xml
|
|
@ -0,0 +1,8 @@
|
|||
<?xml version="1.0" encoding="UTF-8"?>
|
||||
<module type="PYTHON_MODULE" version="4">
|
||||
<component name="NewModuleRootManager">
|
||||
<content url="file://$MODULE_DIR$" />
|
||||
<orderEntry type="inheritedJdk" />
|
||||
<orderEntry type="sourceFolder" forTests="false" />
|
||||
</component>
|
||||
</module>
|
|
@ -0,0 +1,6 @@
|
|||
<component name="InspectionProjectProfileManager">
|
||||
<settings>
|
||||
<option name="USE_PROJECT_PROFILE" value="false" />
|
||||
<version value="1.0" />
|
||||
</settings>
|
||||
</component>
|
|
@ -0,0 +1,4 @@
|
|||
<?xml version="1.0" encoding="UTF-8"?>
|
||||
<project version="4">
|
||||
<component name="ProjectRootManager" version="2" project-jdk-name="Python 3.12" project-jdk-type="Python SDK" />
|
||||
</project>
|
|
@ -0,0 +1,8 @@
|
|||
<?xml version="1.0" encoding="UTF-8"?>
|
||||
<project version="4">
|
||||
<component name="ProjectModuleManager">
|
||||
<modules>
|
||||
<module fileurl="file://$PROJECT_DIR$/.idea/ConsultancyProject_2_ETL.iml" filepath="$PROJECT_DIR$/.idea/ConsultancyProject_2_ETL.iml" />
|
||||
</modules>
|
||||
</component>
|
||||
</project>
|
|
@ -0,0 +1,6 @@
|
|||
<?xml version="1.0" encoding="UTF-8"?>
|
||||
<project version="4">
|
||||
<component name="VcsDirectoryMappings">
|
||||
<mapping directory="" vcs="Git" />
|
||||
</component>
|
||||
</project>
|
|
@ -0,0 +1,83 @@
|
|||
from datetime import datetime, timedelta
|
||||
import json
|
||||
|
||||
import MySQLdb #Version 2.2.4
|
||||
import pandas as pd #Version 2.2.2
|
||||
import plotly.express as px #Version 5.22.0
|
||||
|
||||
# Availability heat map for one rental property.
#
# Reads every stored 'calendar' extraction of a property from MySQL, turns the
# per-scrape day maps into a (scrape run x calendar day) matrix and renders it
# as a Plotly heat map.

# NOTE(review): credentials are hard-coded exactly as in the original script;
# consider moving them to environment variables or a config file.
DB_SETTINGS = {"host": "localhost", "user": "root", "passwd": "admin", "db": "heiraterei"}
PROPERTY_ID = 200

HEADER_DATE_FORMAT = '%a, %d %b %Y %H:%M:%S %Z'  # format of the stored HTTP 'Date' header
DAY_KEY_FORMAT = '%Y-%m-%d'                      # format of the keys in '$.content.days'
TICK_LABEL_FORMAT = '%d/%m/%Y'                   # how scrape dates are shown on the y axis
UNKNOWN_VALUE = -1                               # cell value for days a scrape did not report
Y_TICK_STEP = 5                                  # label every n-th scrape run on the y axis
COLOR_SCALE = [
    [0, 'rgb(0, 0, 0)'],
    [0.33, 'rgb(204, 16, 16)'],
    [0.66, 'rgb(10, 102, 15)'],
    [1, 'rgb(17, 184, 26)'],
]


def fetch_calendar_rows(property_id=PROPERTY_ID):
    """Return ``(header_date_json, days_json)`` tuples for every calendar extraction.

    Both values are selected in a single query so that the scrape date and
    the day map of a row are guaranteed to belong to the same extraction.
    The connection is closed even if the query fails.
    """
    db = MySQLdb.connect(**DB_SETTINGS)
    try:
        cur = db.cursor()
        cur.execute(
            "SELECT JSON_EXTRACT(header, '$.Date'), "
            "JSON_EXTRACT(body, '$.content.days') "
            "FROM extractions "
            "WHERE type='calendar' AND property_id = %s;",
            (property_id,),
        )
        return cur.fetchall()
    finally:
        db.close()


def parse_scrape_dates(header_values) -> list[str]:
    """Convert the extracted 'Date' header values into ``dd/mm/YYYY`` labels.

    Each value is a JSON array whose first element is the header string,
    e.g. ``'["Mon, 01 Jan 2024 10:00:00 GMT"]'``.
    """
    return [
        datetime.strptime(json.loads(raw)[0], HEADER_DATE_FORMAT).date().strftime(TICK_LABEL_FORMAT)
        for raw in header_values
    ]


def parse_day_maps(body_values) -> list[dict]:
    """Decode each JSON day object into a ``{date: value}`` dict (one per scrape)."""
    return [
        {
            datetime.strptime(key, DAY_KEY_FORMAT).date(): value
            for key, value in json.loads(raw).items()
        }
        for raw in body_values
    ]


def build_header_dates(day_maps) -> list:
    """Return every calendar day from the earliest to the latest day seen, inclusive.

    Raises:
        ValueError: if no scrape contains any day (nothing to plot).
    """
    all_days = [day for day_map in day_maps for day in day_map]
    if not all_days:
        raise ValueError("no calendar days found for the selected property")
    first, last = min(all_days), max(all_days)
    return [first + timedelta(days=offset) for offset in range((last - first).days + 1)]


def build_matrix(day_maps, header_dates) -> list[list]:
    """Build one row per scrape with one cell per header date.

    Days a scrape did not report keep ``UNKNOWN_VALUE``.
    """
    # Single dict lookup per day instead of scanning header_dates each time.
    column_of = {day: column for column, day in enumerate(header_dates)}
    matrix = []
    for day_map in day_maps:
        row = [UNKNOWN_VALUE] * len(header_dates)
        for day, value in day_map.items():
            row[column_of[day]] = value
        matrix.append(row)
    return matrix


def build_y_ticks(scrape_dates, step=Y_TICK_STEP):
    """Return ``(tickvals, ticktext)`` labelling every ``step``-th scrape run.

    Plotly pairs ``ticktext[i]`` with ``tickvals[i]``, so the label for a tick
    at row ``r`` must be ``scrape_dates[r]``, not the r-th entry of the
    full list.
    """
    tick_vals = list(range(0, len(scrape_dates), step))
    tick_text = [scrape_dates[row] for row in tick_vals]
    return tick_vals, tick_text


def build_figure(matrix, header_dates, scrape_dates):
    """Create the Plotly heat map for the availability matrix."""
    # Transform to a DataFrame for Plotly.
    df = pd.DataFrame(matrix, columns=header_dates)

    fig = px.imshow(df, color_continuous_scale=COLOR_SCALE)

    # Separator line below every scrape row (row count taken from the data).
    for row_index in range(len(matrix)):
        fig.add_hline(y=row_index + 0.5)

    tick_vals, tick_text = build_y_ticks(scrape_dates)

    fig.update_layout(yaxis=dict(tickfont=dict(size=50)))
    fig.update_layout(xaxis=dict(tickfont=dict(size=50)))
    fig.update_layout(xaxis_title="Verfügbarkeitsdaten Mietobjekt", yaxis_title="Scrapingvorgang")
    fig.update_xaxes(title_font_size=100, title_font_weight="bold")
    fig.update_yaxes(title_font_size=100, title_font_weight="bold")
    fig.update_layout(yaxis=dict(tickmode='array', tickvals=tick_vals, ticktext=tick_text))
    fig.update_xaxes(title_standoff=80)
    fig.update_yaxes(title_standoff=80)
    fig.update_layout(xaxis={'side': 'top'})
    return fig


def main():
    """Fetch the calendar extractions, build the matrix and show the heat map."""
    rows = fetch_calendar_rows()

    # Build the list of scrape dates (y-axis labels).
    scrape_dates = parse_scrape_dates(row[0] for row in rows)

    # Determine the minimum and maximum date and the full range in between.
    day_maps = parse_day_maps(row[1] for row in rows)
    header_dates = build_header_dates(day_maps)

    # Create the data matrix.
    matrix = build_matrix(day_maps, header_dates)

    # Generate the Plotly diagram.
    build_figure(matrix, header_dates, scrape_dates).show()


if __name__ == "__main__":
    main()
|
||||
|
Loading…
Reference in New Issue