% Conference paper: Thomas Gottron, "Evaluating Content Extraction on HTML
% Documents", ITA '07 proceedings, pages 123--132, September 2007.
% NOTE(review): the location field below carries the conference venue, as in
% ACM-DL-style exports. Standard BibTeX styles ignore unknown fields such as
% location, while biblatex reads location as the publisher's place -- confirm
% against the target style before renaming it (e.g. to biblatex venue).
@inproceedings{Gottron:2007,
  author    = {Gottron, Thomas},
  title     = {Evaluating Content Extraction on {HTML} Documents},
  booktitle = {{ITA} '07: Proceedings of the 2nd International Conference on Internet Technologies and Applications},
  year      = {2007},
  pages     = {123--132},
  month     = sep,
  isbn      = {978-0-946881-54-3},
  location  = {Wrexham, Wales, UK},
}