summary refs log tree commit diff stats
path: root/minlobsters.py
diff options
context:
space:
mode:
author steve <steve@haxors.club> 2024-07-06 16:16:14 +0100
committer steve <steve@haxors.club> 2024-07-06 16:16:14 +0100
commit 84090ca8bc10853db10000940b72604a0d7c293a (patch)
tree 4da8717c69f6e2420d748a6b2dd4430494a0fc50 /minlobsters.py
download barkingspider-84090ca8bc10853db10000940b72604a0d7c293a.tar.gz
barkingspider-84090ca8bc10853db10000940b72604a0d7c293a.tar.bz2
barkingspider-84090ca8bc10853db10000940b72604a0d7c293a.zip
Initial release
Diffstat (limited to 'minlobsters.py')
-rw-r--r-- minlobsters.py 22
1 files changed, 22 insertions, 0 deletions
diff --git a/minlobsters.py b/minlobsters.py
new file mode 100644
index 0000000..e383535
--- /dev/null
+++ b/minlobsters.py
@@ -0,0 +1,22 @@
+#!/usr/bin/env python3
+
+import sys, getopt
+import requests
+
+from selectolax.parser import HTMLParser
+
+def extract_lobsters(tag):
+ base_url = f"https://lobste.rs/t/{tag}"
+ r = requests.get(base_url, headers = {'User-agent': 'yourbot'})
+
+ h = HTMLParser(r.text)
+ items = h.css('ol.stories.list li') # Our parent CSS class, each article is in an li
+ for i in items:
+ score = i.css("div.score")[0].text() # .text() recovers the text between tags
+ title = i.css("span.link a")[0].text()
+ url = i.css("span.link a")[0].attrs['href'] # .attrs recovers attribute content (ie href here)
+
+ print(f"\"{title}\" - {url} ({score})")
+
+tag = "reversing"
+extract_lobsters(tag)