<?xml version="1.0"?>
<dblp>
<!--
  Single bibliography record: one journal article by Georg Rehm,
  published in LDV Forum, volume 20, number 2 (2005), pages 53-74.
  The key attribute "journals/ldvf/Rehm05" identifies this record; its last
  segment ("Rehm05") matches the fragment at the end of the <url> value.
  NOTE(review): mdate looks like a last-modified date and <ee> like a link to
  the electronic edition of the paper; confirm against the DBLP DTD.
  NOTE(review): <url> is a relative path; the base it resolves against is not
  visible in this file.
-->
<article key="journals/ldvf/Rehm05" mdate="2006-11-06">
<author>Georg Rehm</author>
<title>Language-Independent Text Parsing of Arbitrary HTML-Documents. Towards A Foundation For Web Genre Identification.</title>
<pages>53-74</pages>
<year>2005</year>
<volume>20</volume>
<journal>LDV Forum</journal>
<number>2</number>
<ee>http://ariadne.coli.uni-bielefeld.de/gldv/site/2005_Heft2/Georg_Rehm.pdf</ee>
<url>db/journals/ldvf/ldvf20.html#Rehm05</url>
</article>
</dblp>
