Skip to content

Commit ecdb408

Browse files
committed
updated for 2019 spring semester
1 parent 80dd100 commit ecdb408

File tree

1 file changed

+5
-5
lines changed

1 file changed

+5
-5
lines changed

Scraping script/scraper.py

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -28,7 +28,7 @@ def scrape_catalog(session):
2828
online_uniques = []
2929

3030
# root page to be scraped
31-
next_page = "https://utdirect.utexas.edu/apps/registrar/course_schedule/20189/results/?ccyys=20189&" \
31+
next_page = "https://utdirect.utexas.edu/apps/registrar/course_schedule/20189/results/?ccyys=20199&" \
3232
"search_type_main=UNIQUE&unique_number=&start_unique=00000&end_unique=99999"
3333

3434
# tests to see if the end has been reached, if not keeps scraping
@@ -94,7 +94,7 @@ def scrape_page(session, page, db_uniques, on_uniques, cur, con):
9494
# look for the next page to crawl
9595
try:
9696
test = page_soup.find("a", {"id": "next_nav_link"})["href"]
97-
return "https://utdirect.utexas.edu/apps/registrar/course_schedule/20189/results/" + test
97+
return "https://utdirect.utexas.edu/apps/registrar/course_schedule/20199/results/" + test
9898
except TypeError:
9999
return None
100100

@@ -133,7 +133,7 @@ def login(username, password):
133133
("login_uri", "/login/cdcservlet"),
134134
("login_method", "GET"),
135135
("IDButton", "Log In"),
136-
("goto", "https://utdirect.utexas.edu:443/apps/registrar/course_schedule/20189"),
136+
("goto", "https://utdirect.utexas.edu:443/apps/registrar/course_schedule/20199"),
137137
("encoded", "false"),
138138
("gx_charset", "UTF-8"),
139139
]
@@ -146,7 +146,7 @@ def login(username, password):
146146
time.sleep(1)
147147

148148
# page gets redirected, need to input LARES value to continue, no clue what LARES is
149-
lares_page = scrape_session.get("https://utdirect.utexas.edu/apps/registrar/course_schedule/20189")
149+
lares_page = scrape_session.get("https://utdirect.utexas.edu/apps/registrar/course_schedule/20199")
150150
time.sleep(1)
151151

152152
# goes through the page and finds the LARES value to input
@@ -157,7 +157,7 @@ def login(username, password):
157157
]
158158

159159
# submits the LARES value, this time going into the correct path
160-
scrape_session.post("https://utdirect.utexas.edu/apps/registrar/course_schedule/20189", data=lares_data)
160+
scrape_session.post("https://utdirect.utexas.edu/apps/registrar/course_schedule/20199", data=lares_data)
161161
time.sleep(1)
162162

163163
# returns the session for future use

0 commit comments

Comments
 (0)