Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Appearance settings

Latest commit

 

History

History
History
81 lines (59 loc) · 2.89 KB

File metadata and controls

81 lines (59 loc) · 2.89 KB
Copy raw file
Download raw file
Open symbols panel
Edit and raw actions
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
# -*- coding: utf-8 -*-
"""
Created on Fri Sep 27 00:42:41 2019
@author: lukek
"""
import requests, bs4
import selenium
from selenium import webdriver
import time
import shutil, os
# Drive Chrome through the BTS "On-Time" download form: tick the wanted
# column checkboxes, then request one download per (year, month) pair.

# Directory Chrome is told to save into; also polled for unfinished downloads.
DOWNLOAD_DIR = r"C:\Users\lukek\Desktop\Python\airplane"


def _wait_for_downloads(directory, poll_seconds=0.25):
    """Block until *directory* holds no file ending in ``.crdownload``.

    The script treats a ``.crdownload`` file as a download still in progress.
    Sleeping between directory listings avoids spinning the CPU while waiting.
    """
    while any(name.endswith('.crdownload') for name in os.listdir(directory)):
        time.sleep(poll_seconds)


# Configure Chrome: maximized window, no download pop-ups, fixed target folder.
options = webdriver.ChromeOptions()
options.add_argument("--start-maximized")
prefs = {
    "profile.default_content_settings.popups": 0,
    # The preference value keeps the two trailing backslashes it always had.
    "download.default_directory": DOWNLOAD_DIR + "\\\\",
    "directory_upgrade": True,
}
options.add_experimental_option("prefs", prefs)
driver = webdriver.Chrome(
    executable_path=r'C:\Users\lukek\Desktop\Python\chromedriver.exe',
    options=options,
)

# Open the field-selection page.
driver.get('https://www.transtats.bts.gov/DL_SelectFields.asp?Table_ID=236&DB_Short_Name=On-Time')

# Values of the column checkboxes to tick on the form.
checkbox = [
    'YEAR', 'MONTH', 'DAY_OF_MONTH', 'FL_DATE',
    'ORIGIN', 'ORIGIN_CITY_NAME', 'ORIGIN_STATE_ABR',
    'DEST', 'DEST_CITY_NAME', 'DEST_STATE_ABR',
    'DEP_TIME', 'DEP_DELAY', 'ARR_TIME', 'ARR_DELAY',
    'CANCELLED', 'AIR_TIME', 'DISTANCE',
    'CARRIER_DELAY', 'WEATHER_DELAY', 'NAS_DELAY',
    'SECURITY_DELAY', 'LATE_AIRCRAFT_DELAY',
]
months = [
    'January', 'February', 'March', 'April', 'May', 'June',
    'July', 'August', 'September', 'October', 'November', 'December',
]

# One XPath per column checkbox, matched on its @value attribute.
paths = [
    f"//input[@type='checkbox' and @value='{name}']" for name in checkbox
]

# NOTE(review): the DownloadZip checkbox is clicked twice in a row, which
# presumably leaves it in its initial state -- confirm whether a single click
# was intended. Both clicks are kept to preserve behavior.
zip_checkbox_xpath = "//input[@type='checkbox' and @id='DownloadZip']"
driver.find_element_by_xpath(zip_checkbox_xpath).click()
driver.find_element_by_xpath(zip_checkbox_xpath).click()

# Tick every wanted column, pausing briefly between clicks.
for path in paths:
    driver.find_element_by_xpath(path).click()
    time.sleep(.006)

# Request one download for every month of every year in 2012..2019.
for yr in range(2012, 2020):
    driver.find_element_by_xpath(
        f"//select[@id='XYEAR']/option[text()={yr}]"
    ).click()
    for month in months:
        driver.find_element_by_xpath(
            f"//select[@id='FREQUENCY']/option[text()='{month}']"
        ).click()
        # Let any download that is still in progress finish before asking
        # for the next one.
        _wait_for_downloads(DOWNLOAD_DIR)
        driver.find_element_by_name("Download").click()
        print(f"Saved File for '{month}' {yr}")
        time.sleep(.06)

# NOTE(review): the driver is never quit; presumably the browser is left open
# so the final download can complete -- confirm before adding driver.quit().
# =============================================================================
# for yr in range(2004,2010):
# print(yr)
# for month in months:
# print(month)
# =============================================================================
Morty Proxy This is a proxified and sanitized view of the page, visit original site.