1 files changed, 23 insertions, 8 deletions
diff --git a/main.py b/main.py
index 61c4f86..df34f4f 100644
--- a/main.py
+++ b/main.py
@@ -4,20 +4,18 @@ from mastodon import Mastodon
 
 import sys
 import requests
+import datetime
+import json
 
 # Constant URL to Hacker News
 base_url = "https://news.ycombinator.com/"
-
 # Calculate the date 10 years ago as %Y-%m%d
 year = int(date.today().strftime("%Y")) - 10
 today = str(year) + date.today().strftime("-%m-%d")
-
 # Request the page
-r = requests.get(base_url + 'front?day='+today)
-
+r = requests.get(base_url + 'front?day=' + today)  # reuse the base_url constant instead of repeating the host
 # Parse the html
 soup = BeautifulSoup(r.text, features="lxml")
-
 # Get the post specified by the first argument
 items = soup.find_all("tr", "athing")[:3]
 index = int(sys.argv[1])
@@ -29,18 +27,35 @@ title = story.text
 link = story["href"]
 if "http" not in link:
     link = base_url + link
+# Probe the story link; fall back to a Wayback Machine snapshot if it is gone
+try:
+    link_dead = requests.get(link).status_code == 404
+except requests.RequestException:
+    # Unreachable host, timeout, malformed URL: treat the same as a 404
+    link_dead = True
+if link_dead:
+    # The availability API takes YYYYMMDD[hhmmss], not a Unix epoch; `today`
+    # already holds the date ten years back, and `params` URL-encodes `link`
+    r = requests.get("http://archive.org/wayback/available",
+                     params={"url": link, "timestamp": today.replace("-", "")})
+    closest = r.json().get("archived_snapshots", {}).get("closest", {})
+    link = closest["url"] if closest.get("available") else "[dead link]"
+
+
 
 # Find the comments link from the row
 comment_el = item.next_sibling
 comment_link = base_url + comment_el.find_all("a")[-1]["href"]
+if comment_link == link:
+    comment_link = ""
 
 # Format the final string
-final = title + "\n" + link + "\n"+comment_link
+toot_content = "\n".join(part for part in (title, link, comment_link) if part)  # drop blanked parts so no trailing newline is sent
 
 # Connect to Mastodon and send a toot
 mastodon = Mastodon(
-    access_token = 'hndecade_usercred.secret',
+    access_token = '/home/mark/hndecade/hndecade_usercred.secret',
     api_base_url = 'https://botsin.space'
 )
-mastodon.toot(final)
 
+mastodon.toot(toot_content)