public class FilesystemCrawler
extends com.norconex.collector.core.crawler.AbstractCrawler
| Constructor and Description |
|---|
| FilesystemCrawler(FilesystemCrawlerConfig crawlerConfig): Constructor. |
| Modifier and Type | Method and Description |
|---|---|
| protected void | cleanupExecution(JobStatusUpdater statusUpdater, JobSuite suite, com.norconex.collector.core.data.store.ICrawlDataStore refStore) |
| protected com.norconex.collector.core.data.BaseCrawlData | createEmbeddedCrawlData(String embeddedReference, com.norconex.collector.core.data.ICrawlData parentCrawlData) |
| protected void | executeCommitterPipeline(com.norconex.collector.core.crawler.ICrawler crawler, ImporterDocument doc, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore, com.norconex.collector.core.data.BaseCrawlData crawlData, com.norconex.collector.core.data.BaseCrawlData cachedCrawlData) |
| protected ImporterResponse | executeImporterPipeline(com.norconex.collector.core.pipeline.importer.ImporterPipelineContext importerContext) |
| protected void | executeQueuePipeline(com.norconex.collector.core.data.ICrawlData crawlData, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore) |
| FilesystemCrawlerConfig | getCrawlerConfig() |
| org.apache.commons.vfs2.FileSystemManager | getFileManager() |
| protected void | markReferenceVariationsAsProcessed(com.norconex.collector.core.data.BaseCrawlData crawlData, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore) |
| protected void | prepareExecution(JobStatusUpdater statusUpdater, JobSuite suite, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore, boolean resume) |
| protected ImporterDocument | wrapDocument(com.norconex.collector.core.data.ICrawlData crawlData, ImporterDocument document) |
beforeFinalizeDocumentProcessing, createCrawlDataStore, deleteCacheOrphans, execute, fireCrawlerEvent, getBaseDownloadDir, getCrawlerDownloadDir, getCrawlerEventManager, getId, getImporter, getStreamFactory, handleOrphans, initCrawlData, isMaxDocuments, isStopped, processNextReference, processReferences, reprocessCacheOrphans, resumeExecution, startExecution, stop
execute
public FilesystemCrawler(FilesystemCrawlerConfig crawlerConfig)
crawlerConfig - filesystem crawler configuration
public FilesystemCrawlerConfig getCrawlerConfig()
getCrawlerConfig in interface com.norconex.collector.core.crawler.ICrawler
getCrawlerConfig in class com.norconex.collector.core.crawler.AbstractCrawler
public org.apache.commons.vfs2.FileSystemManager getFileManager()
protected void prepareExecution(JobStatusUpdater statusUpdater, JobSuite suite, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore, boolean resume)
prepareExecution in class com.norconex.collector.core.crawler.AbstractCrawler
protected void executeQueuePipeline(com.norconex.collector.core.data.ICrawlData crawlData,
com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore)
executeQueuePipeline in class com.norconex.collector.core.crawler.AbstractCrawler
protected ImporterDocument wrapDocument(com.norconex.collector.core.data.ICrawlData crawlData, ImporterDocument document)
wrapDocument in class com.norconex.collector.core.crawler.AbstractCrawler
protected ImporterResponse executeImporterPipeline(com.norconex.collector.core.pipeline.importer.ImporterPipelineContext importerContext)
executeImporterPipeline in class com.norconex.collector.core.crawler.AbstractCrawler
protected com.norconex.collector.core.data.BaseCrawlData createEmbeddedCrawlData(String embeddedReference, com.norconex.collector.core.data.ICrawlData parentCrawlData)
createEmbeddedCrawlData in class com.norconex.collector.core.crawler.AbstractCrawler
protected void executeCommitterPipeline(com.norconex.collector.core.crawler.ICrawler crawler,
ImporterDocument doc,
com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore,
com.norconex.collector.core.data.BaseCrawlData crawlData,
com.norconex.collector.core.data.BaseCrawlData cachedCrawlData)
executeCommitterPipeline in class com.norconex.collector.core.crawler.AbstractCrawler
protected void markReferenceVariationsAsProcessed(com.norconex.collector.core.data.BaseCrawlData crawlData,
com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore)
markReferenceVariationsAsProcessed in class com.norconex.collector.core.crawler.AbstractCrawler
protected void cleanupExecution(JobStatusUpdater statusUpdater, JobSuite suite, com.norconex.collector.core.data.store.ICrawlDataStore refStore)
cleanupExecution in class com.norconex.collector.core.crawler.AbstractCrawler
Copyright © 2014–2023 Norconex Inc. All rights reserved.