The Apache Solr Content Extraction Library integrates the Apache Tika content extraction framework into Solr.
'org.dspace.dependencies.solr:dspace-solr-cell:1.4.0.1'
<dependency>
<groupId>org.dspace.dependencies.solr</groupId>
<artifactId>dspace-solr-cell</artifactId>
<version>1.4.0.1</version>
</dependency>
<dependency org="org.dspace.dependencies.solr" name="dspace-solr-cell" rev="1.4.0.1"/>
"org.dspace.dependencies.solr", "dspace-solr-cell", "1.4.0.1"