More shit

2019-04-06 13:38:39 +02:00 · 2019-04-06 13:38:39 +02:00 · 140a9eb574
commit 140a9eb574
parent 0a1708d7aa
2 changed files with 76 additions and 3 deletions
--- a/server/nightr/scrape.py
+++ b/server/nightr/scrape.py
@ -1,6 +1,71 @@
 import requests
 from bs4 import BeautifulSoup
 import pandas as pd
 import urllib.request
 from datetime import datetime, timedelta
 import json
-import os
+
 def determine_month():
    ds = pd.read_excel(urllib.request.urlopen('https://sundogbaelt.dk/wp-content/uploads/2019/04/trafiktal-maaned.xls'))
    cur_year = 2019
    amount_of_cur_year = sum([x == cur_year for x in ds['År']])
    cur_year_total = sum(ds['Total'][1:amount_of_cur_year+1])
    last_year_total = sum(ds['Total'][amount_of_cur_year+1:amount_of_cur_year+13])
    return (12/(last_year_total//cur_year_total))+1
 def is_tide():
    month = determine_month()
    tide_data = requests.get('https://www.dmi.dk/fileadmin/user_upload/Bruger_upload/Tidevand/2019/Aarhus.t.txt')
    lines = tide_data.text[570:].split('\n')
    tuples = [x.split('\t') for x in lines]
    lel = [[datetime.strptime(x[0], '%Y%m%d%H%M'), x[1]] for x in tuples[:-1]]
    matches = [[x[0], int(x[1])] for x in lel if x[0].month == month]
    all_the_data = requests.get('https://www.dmi.dk/NinJo2DmiDk/ninjo2dmidk?cmd=odj&stations=22331&datatype=obs')
    current_water_level = json.loads(all_the_data.content)[0]['values'][-1]['value']
    # Generate average of when the water is high
    last_match = matches[0]
    moments = []
    for idx, water_level in enumerate(matches[1:]):
        #print(last_match[1], water_level[1])
        diff = abs(last_match[1]) + abs(water_level[1])
        time_diff = (water_level[0] - last_match[0]).seconds
        average_inc = time_diff/diff
        average_delta = timedelta(seconds=average_inc)
        if last_match[1] < 0: # Increasing
            time = last_match
            while time[1] != current_water_level:
                time[0] += average_delta
                time[1] += 1
        elif last_match[1] > 0: # Decreasing
            time = last_match
            while time[1] != current_water_level:
                time[0] += average_delta
                time[1] -= 1
        last_match = water_level
        moments.append(time[0])
    night = sum([1 for x in moments if 6 >= x.hour or x.hour >= 22])
    return night / len(moments)
 def tmp():
    r = requests.get('https://portal.opendata.dk/api/3/action/datastore_search?resource_id=b3eeb0ff-c8a8-4824-99d6-e0a3747c8b0d')
    with open('traffic_data_13_23.json', 'w') as f:
        json.dump(r.json(), f)
 def scrape_traffic():
@ -29,4 +94,11 @@ def scrape_traffic():
    return res
-scrape_traffic()
+def scrape_weather():
    r = requests.get('https://weather.com/weather/hourbyhour/l/99546:4:US')
    soup = BeautifulSoup(r.content)
    print(soup.find_all('td', {'class': 'temp'})[0])
--- a/server/nightr/traffic_data_13_23.json
+++ b/server/nightr/traffic_data_13_23.json