This plugin crawls web sites and extracts content from the Web.
'org.codelibs:elasticsearch-river-web:1.2.0'
<dependency>
<groupId>org.codelibs</groupId>
<artifactId>elasticsearch-river-web</artifactId>
<version>1.2.0</version>
</dependency>
<dependency org="org.codelibs" name="elasticsearch-river-web" rev="1.2.0"/>
"org.codelibs", "elasticsearch-river-web", "1.2.0"