Apache Tika is a toolkit for detecting and extracting metadata and structured text content from various documents using existing parser libraries.
'org.apache.tika:tika-serialization:1.6'
<dependency>
  <groupId>org.apache.tika</groupId>
  <artifactId>tika-serialization</artifactId>
  <version>1.6</version>
</dependency>
<dependency org="org.apache.tika" name="tika-serialization" rev="1.6"/>
"org.apache.tika", "tika-serialization", "1.6"