diff options
Diffstat (limited to 'main.py')
-rw-r--r-- | main.py | 31 |
1 files changed, 23 insertions, 8 deletions
@@ -4,20 +4,18 @@ from mastodon import Mastodon import sys import requests +import datetime +import json # Constant URL to Hacker News base_url = "https://news.ycombinator.com/" - # Calculate the date 10 years ago as %Y-%m%d year = int(date.today().strftime("%Y")) - 10 today = str(year) + date.today().strftime("-%m-%d") - # Request the page -r = requests.get(base_url + 'front?day='+today) - +r = requests.get('https://news.ycombinator.com/front?day='+today) # Parse the html soup = BeautifulSoup(r.text, features="lxml") - # Get the post specified by the first argument items = soup.find_all("tr", "athing")[:3] index = int(sys.argv[1]) @@ -29,18 +27,35 @@ title = story.text link = story["href"] if "http" not in link: link = base_url + link +try: + r = requests.get(link) + if r.status_code == 404: + raise Exception(404) +except: + timestamp = int(datetime.datetime.timestamp(datetime.datetime.today() - datetime.timedelta(days=(10 * 365)))) + r = requests.get("http://archive.org/wayback/available?url=" + link + "&timestamp=" + str(timestamp)) + res = r.json() + if res["archived_snapshots"] and res["archived_snapshots"]["closest"]["available"]: + link = res["archived_snapshots"]["closest"]["url"] + else: + link = "[dead link]" + + + # Find the comments link from the row comment_el = item.next_sibling comment_link = base_url + comment_el.find_all("a")[-1]["href"] +if comment_link == link: + comment_link = "" # Format the final string -final = title + "\n" + link + "\n"+comment_link +toot_content = title + "\n" + link + "\n"+comment_link # Connect to Mastodon and send a toot mastodon = Mastodon( - access_token = 'hndecade_usercred.secret', + access_token = '/home/mark/hndecade/hndecade_usercred.secret', api_base_url = 'https://botsin.space' ) -mastodon.toot(final) +mastodon.toot(toot_content) |