Open-source web data extraction tool written in Java. It offers a way to collect desired web pages and extract useful data from them.
'net.sourceforge.web-harvest:webharvest:2.1.0-RC1'
<dependency>
<groupId>net.sourceforge.web-harvest</groupId>
<artifactId>webharvest</artifactId>
<version>2.1.0-RC1</version>
</dependency>
<dependency org="net.sourceforge.web-harvest" name="webharvest" rev="2.1.0-RC1"/>
"net.sourceforge.web-harvest", "webharvest", "2.1.0-RC1"