summaryrefslogtreecommitdiff
path: root/textract
blob: 707cd276427b89df6bb53c00728851f0d466c49c (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
#! /usr/bin/env nix-shell
#! nix-shell -i python -p "python3.withPackages(p: [p.requests p.pyreadability])"

import argparse
from readability import Document
import requests
import sys

# Seconds to wait for the server before giving up; without an explicit
# timeout `requests.get` may block indefinitely.
REQUEST_TIMEOUT = 30

# The text is passed as `description=`: the first positional parameter of
# ArgumentParser is `prog`, which would put it in the usage line instead.
cli = argparse.ArgumentParser(description='read a url')
cli.add_argument('url', type=str)


def main(argv=None):
    """Fetch a URL and write its readable summary to stdout.

    Args:
        argv: Argument list to parse; ``None`` means ``sys.argv[1:]``.

    Returns:
        Process exit status: 0 on success, 1 when the document could not
        be fetched or summarised.
    """
    args = cli.parse_args(argv)

    try:
        resp = requests.get(args.url, timeout=REQUEST_TIMEOUT)
        # Treat HTTP 4xx/5xx as failures rather than summarising the
        # server's error page.
        resp.raise_for_status()
        summary = Document(resp.text).summary()
    except Exception:
        # Top-level boundary: any fetch/parse failure becomes a short
        # message. `Exception` (not a bare except) lets KeyboardInterrupt
        # and SystemExit propagate. stderr keeps stdout clean for pipes.
        print("textract: Could not fetch document.", file=sys.stderr)
        return 1

    sys.stdout.write(summary)
    return 0


if __name__ == '__main__':
    sys.exit(main())