-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathwebscraping.py
32 lines (25 loc) · 887 Bytes
/
webscraping.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
# scrape.py
import requests
from bs4 import BeautifulSoup
from datetime import datetime
from datetime import timedelta
hackathons = []
result = requests.get(
"https://devpost.com/hackathons?utf8=%E2%9C%93&search=blockchain&challenge_type=all&sort_by=Submission+Deadline")
src = result.content
soup = BeautifulSoup(src, 'lxml')
featured_challenges = soup.find_all(
'a', attrs={'data-role': 'featured_challenge'})
for featured_challenge in featured_challenges:
try:
time = featured_challenge.find(
"time", attrs={"class": "value timeago"}).text
time_left = datetime.strptime(
time[:-4], "%b %d, %Y %I:%M %p")
now = datetime.now()
if now > time_left - timedelta(days=50):
hackathons.append(featured_challenge.attrs['href'])
except:
continue
for hackathon in hackathons:
print(hackathon)