git.mxchange.org Git - hub.git/blobdiff - application/hub/main/filter/task/crawler/class_CrawlerTaskHandlerInitializerFilter.php
Added more tasks (see wiki: https://wiki.shipsimu.org/doku.php/de/projects/hub/applic...
[hub.git] / application / hub / main / filter / task / crawler / class_CrawlerTaskHandlerInitializerFilter.php
index 43a7be491f7b6c994a411a0216c65e3f296d5cfd..cb2a1383c6e7b86cfea2e35ddf8d132a571fe1a7 100644 (file)
@@ -81,6 +81,26 @@ class CrawlerTaskHandlerInitializerFilter extends BaseCrawlerFilter implements F
                $taskInstance = ObjectFactory::createObjectByConfiguredName('crawler_remote_job_publisher_task_class');
                $handlerInstance->registerTask('crawler_remote_job_publisher', $taskInstance);
 
+               // 5) MIME sniffer
+               $taskInstance = ObjectFactory::createObjectByConfiguredName('crawler_mime_sniffer_task_class');
+               $handlerInstance->registerTask('crawler_mime_sniffer', $taskInstance);
+
+               // 6) Document parser (converts document to meta format)
+               $taskInstance = ObjectFactory::createObjectByConfiguredName('crawler_document_parser_task_class');
+               $handlerInstance->registerTask('crawler_document_parser', $taskInstance);
+
+               // 7) Document structure analyzer
+               $taskInstance = ObjectFactory::createObjectByConfiguredName('crawler_structure_analyzer_task_class');
+               $handlerInstance->registerTask('crawler_structure_analyzer', $taskInstance);
+
+               // 8) Snippet extractor
+               $taskInstance = ObjectFactory::createObjectByConfiguredName('crawler_snippet_extractor_task_class');
+               $handlerInstance->registerTask('crawler_snippet_extractor', $taskInstance);
+
+               // 9) Node ping
+               $taskInstance = ObjectFactory::createObjectByConfiguredName('crawler_ping_task_class');
+               $handlerInstance->registerTask('crawler_ping', $taskInstance);
+
                // Put the task handler in registry
                Registry::getRegistry()->addInstance('task_handler', $handlerInstance);
        }