Apache Tika is a toolkit for detecting and extracting metadata and structured text content from various documents using existing parser libraries.
'org.apache.tika:tika-bundle:0.10'
<dependency>
  <groupId>org.apache.tika</groupId>
  <artifactId>tika-bundle</artifactId>
  <version>0.10</version>
</dependency>
<dependency org="org.apache.tika" name="tika-bundle" rev="0.10"/>
"org.apache.tika", "tika-bundle", "0.10"