git.fiddlerwoaroof.com
Raw Blame History
#!/usr/bin/env python2

import argparse

import goose
import lxml
import lxml.html

# Command-line interface: one required positional argument, the URL to fetch.
parser = argparse.ArgumentParser()
parser.add_argument('url')
args = parser.parse_args()

# Run goose's extraction on the URL given by the user.
extractor = goose.Goose()
article = extractor.extract(args.url)

# Serialize the extraction result's ``doc`` attribute with lxml and write it
# to stdout.  ``lxml.html`` is a submodule and must be imported explicitly;
# a bare ``import lxml`` does not guarantee that it is loaded.
# The parenthesised single-argument form prints the same thing under the
# Python 2 print statement and is also valid Python 3 syntax.
print(lxml.html.tostring(article.doc))