| Package | Description |
|---|---|
| org.apache.tika.batch | |
| org.apache.tika.batch.builders | |
| org.apache.tika.batch.fs | |
| org.apache.tika.batch.fs.builders | |
| Modifier and Type | Class and Description |
|---|---|
(package private) class |
PoisonFileResource
Sentinel class for the crawler to add to the queue to let
the consumers know that they should shut down.
|
| Modifier and Type | Field and Description |
|---|---|
private java.util.concurrent.ArrayBlockingQueue<FileResource> |
FileResourceConsumer.fileQueue |
private java.util.concurrent.ArrayBlockingQueue<FileResource> |
FileResourceCrawler.queue |
| Modifier and Type | Method and Description |
|---|---|
private FileResource |
FileResourceConsumer.getNextFileResource() |
| Modifier and Type | Method and Description |
|---|---|
private boolean |
FileResourceConsumer._processFileResource(FileResource fileResource) |
abstract boolean |
FileResourceConsumer.processFileResource(FileResource fileResource)
Main piece of code that needs to be implemented.
|
protected int |
FileResourceCrawler.tryToAdd(FileResource fileResource) |
| Constructor and Description |
|---|
FileResourceConsumer(java.util.concurrent.ArrayBlockingQueue<FileResource> fileQueue) |
FileResourceCrawler(java.util.concurrent.ArrayBlockingQueue<FileResource> queue,
int numConsumers) |
| Modifier and Type | Method and Description |
|---|---|
private java.util.concurrent.ArrayBlockingQueue<FileResource> |
BatchProcessBuilder.buildQueue(org.w3c.dom.Node docElement,
java.util.Map<java.lang.String,java.lang.String> runtimeAttributes) |
| Modifier and Type | Method and Description |
|---|---|
T |
ObjectFromDOMAndQueueBuilder.build(org.w3c.dom.Node node,
java.util.Map<java.lang.String,java.lang.String> runtimeAttributes,
java.util.concurrent.ArrayBlockingQueue<FileResource> resourceQueue) |
FileResourceCrawler |
ICrawlerBuilder.build(org.w3c.dom.Node node,
java.util.Map<java.lang.String,java.lang.String> attributes,
java.util.concurrent.ArrayBlockingQueue<FileResource> queue) |
abstract ConsumersManager |
AbstractConsumersBuilder.build(org.w3c.dom.Node node,
java.util.Map<java.lang.String,java.lang.String> runtimeAttributes,
java.util.concurrent.ArrayBlockingQueue<FileResource> queue) |
private ConsumersManager |
BatchProcessBuilder.buildConsumersManager(org.w3c.dom.Node node,
java.util.Map<java.lang.String,java.lang.String> runtimeAttributes,
java.util.concurrent.ArrayBlockingQueue<FileResource> queue) |
private FileResourceCrawler |
BatchProcessBuilder.buildCrawler(java.util.concurrent.ArrayBlockingQueue<FileResource> queue,
org.w3c.dom.Node node,
java.util.Map<java.lang.String,java.lang.String> runtimeAttributes) |
| Modifier and Type | Class and Description |
|---|---|
class |
FSFileResource
File system (FS) resource that wraps a file name.
|
| Modifier and Type | Method and Description |
|---|---|
protected java.io.InputStream |
AbstractFSConsumer.getInputStream(FileResource fileResource) |
protected java.io.OutputStream |
AbstractFSConsumer.getOutputStream(OutputStreamFactory fsOSFactory,
FileResource fileResource)
Use this for consistent logging of exceptions.
|
boolean |
BasicTikaFSConsumer.processFileResource(FileResource fileResource) |
boolean |
RecursiveParserWrapperFSConsumer.processFileResource(FileResource fileResource) |
| Constructor and Description |
|---|
AbstractFSConsumer(java.util.concurrent.ArrayBlockingQueue<FileResource> fileQueue) |
BasicTikaFSConsumer(java.util.concurrent.ArrayBlockingQueue<FileResource> queue,
ParserFactory parserFactory,
ContentHandlerFactory contentHandlerFactory,
OutputStreamFactory fsOSFactory,
TikaConfig config) |
FSDirectoryCrawler(java.util.concurrent.ArrayBlockingQueue<FileResource> fileQueue,
int numConsumers,
java.nio.file.Path root,
FSDirectoryCrawler.CRAWL_ORDER crawlOrder) |
FSDirectoryCrawler(java.util.concurrent.ArrayBlockingQueue<FileResource> fileQueue,
int numConsumers,
java.nio.file.Path root,
java.nio.file.Path startDirectory,
FSDirectoryCrawler.CRAWL_ORDER crawlOrder) |
FSListCrawler(java.util.concurrent.ArrayBlockingQueue<FileResource> fileQueue,
int numConsumers,
java.io.File root,
java.io.File list,
java.lang.String encoding)
Deprecated.
|
FSListCrawler(java.util.concurrent.ArrayBlockingQueue<FileResource> fileQueue,
int numConsumers,
java.nio.file.Path root,
java.nio.file.Path list,
java.nio.charset.Charset charset)
Constructor for a crawler that reads a list of files to process.
|
RecursiveParserWrapperFSConsumer(java.util.concurrent.ArrayBlockingQueue<FileResource> queue,
ParserFactory parserFactory,
ContentHandlerFactory contentHandlerFactory,
OutputStreamFactory fsOSFactory,
TikaConfig tikaConfig) |
| Modifier and Type | Method and Description |
|---|---|
FileResourceCrawler |
FSCrawlerBuilder.build(org.w3c.dom.Node node,
java.util.Map<java.lang.String,java.lang.String> runtimeAttributes,
java.util.concurrent.ArrayBlockingQueue<FileResource> queue) |
ConsumersManager |
BasicTikaFSConsumersBuilder.build(org.w3c.dom.Node node,
java.util.Map<java.lang.String,java.lang.String> runtimeAttributes,
java.util.concurrent.ArrayBlockingQueue<FileResource> queue) |