This repository has been archived by the owner on Mar 29, 2022. It is now read-only.
-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathdb_scrape.py
executable file
·90 lines (83 loc) · 3.2 KB
/
db_scrape.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
#!/usr/bin/python
from bs4 import BeautifulSoup
import urllib2
import os, sys, re, json
import sqlite3
conn = sqlite3.connect('database.db')
db = conn.cursor()
def init():
init_db()
url = 'http://aviationweather.gov/products/nws/all'
usock = urllib2.urlopen(url)
source = usock.read()
usock.close()
soup = BeautifulSoup(source)
parse(soup)
def parse(soup):
content = soup.find('pre')
if content is None:
exit("Nothing")
blob = content.get_text().split('\n')
altitudes = [0,3000,6000,9000,12000,18000,24000,30000,34000,39000]
for line in blob:
if len(line) == 69 and not (line.startswith('FT')):
# TODO - be better about filtering these columns. Either remove lamba function or regex.
line = re.sub('[\s]{5}', ' 0000', line)
data_strings = line.split(' ')
data_strings = filter(lambda blank: blank != '', data_strings)
airport_code = data_strings[0]
for data,altitude in zip(data_strings, altitudes):
if len(data) == 3:
pass
else:
if int(data[:2]) == 99:
# Winds are light and variable
direction = '00'
speed = '00'
elif int(data[:2]) > 36:
# Winds are OVER 99 knots. Follow WMO nomenclature: http://en.wikipedia.org/wiki/Winds_aloft
# Subtract 50 from DD, add 100 to SS
direction = str((int(data[:2]) - 50)) + '0'
speed = (int(data[2:4]) + 100)
else:
# Standard DDss format.
direction = data[:2] + '0'
speed = data[2:4]
insert_db(airport_code, altitude, direction, speed)
#print "Airport: {} Height: {} Dir: {} Speed {}".format(airport_code, altitude, direction, speed)
conn.commit()
def init_db():
db.execute('''DROP TABLE IF EXISTS winds''')
db.execute('''CREATE TABLE winds
(airport_code STRING, altitude INTEGER, direction INTEGER, speed INTEGER)''')
def insert_db(airport_code, altitude, direction, speed):
query = '''INSERT INTO winds VALUES ("{}","{}","{}","{}")'''.format(airport_code, altitude, direction, speed)
db.execute(query)
def get_ground_winds():
query = '''SELECT distinct(airport_code) FROM winds'''
cur = db.execute(query)
airport_codes = cur.fetchall()
airport_code_string = ','.join(code[0] for code in airport_codes)
url = '''http://weather.aero/dataserver_current/httpparam?dataSource=metars&requestType=retrieve&format=json&hoursBeforeNow=1&mostRecentForEachStation=true&stationString={}'''.format(airport_code_string)
usock = urllib2.urlopen(url)
source = usock.read()
usock.close()
data = json.loads(source)
parse_ground_winds(airport_codes, data)
def parse_ground_winds(airport_codes, data):
for data in data['features']:
print "--------------------------"
print data
for airport_code in airport_codes:
if airport_code[0] in data['properties']['icao_code']:
try:
direction = data['properties']['wind_dir_degrees']
speed = data['properties']['wind_speed_kt']
insert_db(airport_code[0],'0',direction,speed)
except:
print (airport_code[0])
insert_db(airport_code[0],'0','0','0')
conn.commit()
if __name__ == '__main__':
init()
get_ground_winds()