git.fiddlerwoaroof.com
scripts/goosify
a0d71cd9
 #!/usr/bin/env python2
 
 import goose
 import lxml
 import argparse
 
 def main():
     """Run Goose's extractor on a URL and print the document as HTML.

     The URL is taken from the single positional command-line argument.
     The ``doc`` attribute of the extraction result is serialized with
     ``lxml.html.tostring`` and written to standard output.
     """
     # ``import lxml`` alone does not load the ``lxml.html`` submodule; the
     # attribute is only reachable if some other module imported it first.
     # Import it explicitly so the serializer never depends on that side
     # effect of importing goose.
     import lxml.html

     parser = argparse.ArgumentParser(
         description="Extract a page with Goose and print its document as HTML.")
     parser.add_argument('url', help="URL to hand to the Goose extractor")
     options = parser.parse_args()

     extractor = goose.Goose()
     article = extractor.extract(options.url)
     # Parenthesised single-argument form prints the same text under the
     # Python 2 print statement that this script's shebang selects.
     print(lxml.html.tostring(article.doc))


 if __name__ == '__main__':
     main()