# Contributor: Kevin Brubeck Unhammer <unhammer@gmail.com>
# Maintainer: Kevin Brubeck Unhammer <unhammer@gmail.com>
# Package metadata read by makepkg.

# Human-readable summary of the packaged software.
pkgdesc="jusText removes boilerplate content (such as navigation links, headers, and footers) from HTML pages. Designed to preserve text with full sentences, it is suited for creating linguistic resources like Web corpora."
# Upstream project page.
url="https://code.google.com/p/justext/"
# The "New BSD License" is the 3-clause BSD license; use its SPDX identifier
# so packaging tools recognise it instead of a free-form name.
license=('BSD-3-Clause')
# Runtime dependency: a Python 2 interpreter, version 2.2.4 or later.
depends=('python2>=2.2.4')
# Upstream release tarball, and its MD5 checksum at the same array index.
source=("http://justext.googlecode.com/files/justext-1.1.tar.gz")
md5sums=('120d33a917a6362c88dd546d4f354c47')
# Build/install steps: enter the unpacked sources, pin the Python scripts to
# python2, then install into the packaging root.

# Use makepkg's $srcdir (consistent with $pkgdir below) rather than deriving
# it from $startdir. Quote the path and stop if the directory is missing, so
# the in-place sed below can never rewrite files in some other directory.
cd "$srcdir/$pkgname-$pkgver" || return 1

# Rewrite "python" shebangs to "python2" in every *.py file.
# From http://allanmcrae.com/2010/10/big-python-transition-in-arch-linux/
# find -exec hands the file names to sed directly: names containing
# whitespace are kept intact, and sed is not invoked when nothing matches.
find . -name '*.py' -exec sed -i \
  -e "s|#![ ]*/usr/bin/python$|#!/usr/bin/python2|" \
  -e "s|#![ ]*/usr/bin/env python$|#!/usr/bin/env python2|" \
  {} +

# Install under /usr inside the staging directory that makepkg packages up.
python2 setup.py install --prefix=/usr --root="$pkgdir" || return 1