diff options
| author | steve <steve@haxors.club> | 2024-07-06 16:16:14 +0100 |
|---|---|---|
| committer | steve <steve@haxors.club> | 2024-07-06 16:16:14 +0100 |
| commit | 84090ca8bc10853db10000940b72604a0d7c293a (patch) | |
| tree | 4da8717c69f6e2420d748a6b2dd4430494a0fc50 /minlobsters.py | |
| download | barkingspider-84090ca8bc10853db10000940b72604a0d7c293a.tar.gz barkingspider-84090ca8bc10853db10000940b72604a0d7c293a.tar.bz2 barkingspider-84090ca8bc10853db10000940b72604a0d7c293a.zip | |
Initial release
Diffstat (limited to 'minlobsters.py')
| -rw-r--r-- | minlobsters.py | 22 |
1 files changed, 22 insertions, 0 deletions
#!/usr/bin/env python3
"""Print the stories listed under a lobste.rs tag."""

import sys
import getopt
import requests

from selectolax.parser import HTMLParser


def extract_lobsters(tag):
    """Fetch the lobste.rs listing for *tag* and print one line per story.

    Each printed line has the form ``"<title>" - <url> (<score>)``.

    Args:
        tag: Name of the lobste.rs tag to list, e.g. ``"reversing"``.

    Raises:
        requests.RequestException: If the request fails, times out, or the
            server answers with an HTTP error status.
    """
    base_url = f"https://lobste.rs/t/{tag}"
    # Without a timeout requests waits forever on a stalled connection.
    r = requests.get(base_url, headers={'User-agent': 'yourbot'}, timeout=30)
    # Fail loudly instead of scraping an error page as if it were a listing.
    r.raise_for_status()

    h = HTMLParser(r.text)
    # Our parent CSS class, each article is in an li.
    for item in h.css('ol.stories.list li'):
        score = item.css_first("div.score")
        link = item.css_first("span.link a")
        if score is None or link is None:
            # Not a story entry (no score or no link): skip it rather than
            # crash on a missing element.
            continue

        title = link.text()  # .text() recovers the text between tags
        url = link.attrs.get('href', '')  # .attrs holds attribute content

        print(f"\"{title}\" - {url} ({score.text()})")


tag = "reversing"

if __name__ == "__main__":
    # Only hit the network when run as a script, not when imported.
    extract_lobsters(tag)
