#!/usr/bin/env python3
"""Print the stories listed under a lobste.rs tag.

Usage: minlobsters.py [TAG]

With no argument the tag defaults to "reversing".  Each story is printed
on its own line as: "<title>" - <url> (<score>)
"""
# Provenance: recovered from a patch creating minlobsters.py
# (commit 84090ca8bc10853db10000940b72604a0d7c293a, author "steve",
# Sat, 6 Jul 2024 16:16:14 +0100, subject "Initial release").

import getopt
import sys
from urllib.parse import quote

import requests
from selectolax.parser import HTMLParser

# Seconds to wait for lobste.rs before giving up; without a timeout
# requests.get() may block forever on a stalled connection.
REQUEST_TIMEOUT = 10


def extract_lobsters(tag):
    """Fetch the lobste.rs page for *tag* and print its stories.

    Args:
        tag: Tag name appended to ``https://lobste.rs/t/``.  It is
            percent-encoded before being placed in the URL path (commas
            are left as-is).

    Raises:
        requests.HTTPError: If the server answers with an error status.
        requests.RequestException: On connection problems or timeout.

    Returns:
        None.  Output is written to stdout, one line per story.
    """
    base_url = f"https://lobste.rs/t/{quote(tag, safe=',')}"
    r = requests.get(
        base_url,
        headers={'User-agent': 'yourbot'},
        timeout=REQUEST_TIMEOUT,
    )
    # Fail loudly instead of parsing an error page as if it were a story list.
    r.raise_for_status()

    h = HTMLParser(r.text)
    # Our parent CSS class, each article is in an li
    for item in h.css('ol.stories.list li'):
        score_node = item.css_first("div.score")
        link_node = item.css_first("span.link a")
        # The descendant selector can match li elements that are not
        # stories; skip anything lacking a score or a link rather than crash.
        if score_node is None or link_node is None:
            continue

        score = score_node.text()  # .text() recovers the text between tags
        title = link_node.text()
        # .attrs recovers attribute content (ie href here)
        url = link_node.attrs.get('href')
        if url is None:
            continue

        print(f"\"{title}\" - {url} ({score})")


tag = "reversing"

if __name__ == "__main__":
    # An optional first command-line argument overrides the default tag.
    extract_lobsters(sys.argv[1] if len(sys.argv) > 1 else tag)