"description":"The Apache Tika™ toolkit detects and extracts metadata and text from over a thousand different file types (such as PPT, XLS, and PDF). All of these file types can be parsed through a single interface, making Tika useful for search engine indexing, content analysis, translation, and much more.",
"install_methods":[
{
"type":"default",
"script":"ct/apache-tika.sh",
"resources":{
"cpu":1,
"ram":2024,
"hdd":10,
"os":"debian",
"version":"12"
}
}
],
"default_credentials":{
"username":null,
"password":null
},
"notes":[
{
"text":"Configuration file is not created at install time. Example is at: `https://cwiki.apache.org/confluence/display/TIKA/TikaServer+in+Tika+2.x`",