summaryrefslogtreecommitdiff
path: root/textract
blob: 4a29f55dc8fa75098004b5dcd5ffb1b8858a3650 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
#! /usr/bin/env nix-shell
#! nix-shell -i python -p "python3.withPackages(p: [p.pyreadability])"

import argparse
import readability
import sys

def main(argv=None) -> int:
    """Write the readability summary of a file to stdout.

    Args:
        argv: Command-line arguments to parse. ``None`` lets argparse fall
            back to ``sys.argv[1:]``.

    Returns:
        0 on success, 1 if the file could not be read or processed.
        (Invalid command-line usage still exits through argparse.)
    """
    # The first positional parameter of ArgumentParser is ``prog``; the text
    # has to be passed as ``description`` or it ends up in the usage line.
    cli = argparse.ArgumentParser(description='read a file')
    cli.add_argument('file', type=str, help='path of the file to read')
    args = cli.parse_args(argv)

    try:
        # No explicit encoding: the file is decoded with the locale default.
        with open(args.file, 'r') as f:
            content = f.read()
        doc = readability.Document(content)
        sys.stdout.write(doc.summary())
    except Exception as e:
        # Top-level boundary: report every failure on stderr so that stdout
        # only ever carries extracted content, then signal failure.
        print(f"textract: Could not process document. Error: {e}",
              file=sys.stderr)
        return 1
    return 0


if __name__ == "__main__":
    sys.exit(main())