public class FilesystemCrawler
extends com.norconex.collector.core.crawler.AbstractCrawler
Constructor and Description |
---|
FilesystemCrawler(FilesystemCrawlerConfig crawlerConfig)
Constructor.
|
Modifier and Type | Method and Description |
---|---|
protected void |
cleanupExecution(JobStatusUpdater statusUpdater,
JobSuite suite,
com.norconex.collector.core.data.store.ICrawlDataStore refStore) |
protected com.norconex.collector.core.data.BaseCrawlData |
createEmbeddedCrawlData(String embeddedReference,
com.norconex.collector.core.data.ICrawlData parentCrawlData) |
protected void |
executeCommitterPipeline(com.norconex.collector.core.crawler.ICrawler crawler,
ImporterDocument doc,
com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore,
com.norconex.collector.core.data.BaseCrawlData crawlData,
com.norconex.collector.core.data.BaseCrawlData cachedCrawlData) |
protected ImporterResponse |
executeImporterPipeline(com.norconex.collector.core.pipeline.importer.ImporterPipelineContext importerContext) |
protected void |
executeQueuePipeline(com.norconex.collector.core.data.ICrawlData crawlData,
com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore) |
FilesystemCrawlerConfig |
getCrawlerConfig() |
org.apache.commons.vfs2.FileSystemManager |
getFileManager() |
protected void |
markReferenceVariationsAsProcessed(com.norconex.collector.core.data.BaseCrawlData crawlData,
com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore) |
protected void |
prepareExecution(JobStatusUpdater statusUpdater,
JobSuite suite,
com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore,
boolean resume) |
protected ImporterDocument |
wrapDocument(com.norconex.collector.core.data.ICrawlData crawlData,
ImporterDocument document) |
beforeFinalizeDocumentProcessing, createCrawlDataStore, deleteCacheOrphans, execute, fireCrawlerEvent, getBaseDownloadDir, getCrawlerDownloadDir, getCrawlerEventManager, getId, getImporter, getStreamFactory, handleOrphans, initCrawlData, isMaxDocuments, isStopped, processNextReference, processReferences, reprocessCacheOrphans, resumeExecution, startExecution, stop
execute
public FilesystemCrawler(FilesystemCrawlerConfig crawlerConfig)
crawlerConfig
- Filesystem crawler configuration
public FilesystemCrawlerConfig getCrawlerConfig()
getCrawlerConfig
in interface com.norconex.collector.core.crawler.ICrawler
getCrawlerConfig
in class com.norconex.collector.core.crawler.AbstractCrawler
public org.apache.commons.vfs2.FileSystemManager getFileManager()
protected void prepareExecution(JobStatusUpdater statusUpdater, JobSuite suite, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore, boolean resume)
prepareExecution
in class com.norconex.collector.core.crawler.AbstractCrawler
protected void executeQueuePipeline(com.norconex.collector.core.data.ICrawlData crawlData, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore)
executeQueuePipeline
in class com.norconex.collector.core.crawler.AbstractCrawler
protected ImporterDocument wrapDocument(com.norconex.collector.core.data.ICrawlData crawlData, ImporterDocument document)
wrapDocument
in class com.norconex.collector.core.crawler.AbstractCrawler
protected ImporterResponse executeImporterPipeline(com.norconex.collector.core.pipeline.importer.ImporterPipelineContext importerContext)
executeImporterPipeline
in class com.norconex.collector.core.crawler.AbstractCrawler
protected com.norconex.collector.core.data.BaseCrawlData createEmbeddedCrawlData(String embeddedReference, com.norconex.collector.core.data.ICrawlData parentCrawlData)
createEmbeddedCrawlData
in class com.norconex.collector.core.crawler.AbstractCrawler
protected void executeCommitterPipeline(com.norconex.collector.core.crawler.ICrawler crawler, ImporterDocument doc, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore, com.norconex.collector.core.data.BaseCrawlData crawlData, com.norconex.collector.core.data.BaseCrawlData cachedCrawlData)
executeCommitterPipeline
in class com.norconex.collector.core.crawler.AbstractCrawler
protected void markReferenceVariationsAsProcessed(com.norconex.collector.core.data.BaseCrawlData crawlData, com.norconex.collector.core.data.store.ICrawlDataStore crawlDataStore)
markReferenceVariationsAsProcessed
in class com.norconex.collector.core.crawler.AbstractCrawler
protected void cleanupExecution(JobStatusUpdater statusUpdater, JobSuite suite, com.norconex.collector.core.data.store.ICrawlDataStore refStore)
cleanupExecution
in class com.norconex.collector.core.crawler.AbstractCrawler
Copyright © 2014–2023 Norconex Inc. All rights reserved.