Search Options

Results per page
Sort
Preferred Languages
Advance

Results 11 - 20 of 92 for CrawlerSystemException (0.19 sec)

  1. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlFilterService.java

         * @return The list of compiled include patterns.
         * @throws CrawlerSystemException if the patterns cannot be loaded.
         */
        @Override
        public List<Pattern> getIncludeUrlPatternList(final String sessionId) {
            try {
                return includeFilterCache.get(sessionId);
            } catch (final ExecutionException e) {
                throw new CrawlerSystemException(e);
            }
        }
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/HostIntervalController.java

    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.core.lang.SystemUtil;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.util.CrawlingParameterUtil;
    
    /**
     * HostIntervalController is an implementation of {@link org.codelibs.fess.crawler.interval.IntervalController}
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

                resultData.removeUrl(requestData);
                resultData.removeUrl(getDuplicateUrl(requestData));
            } catch (final CrawlerSystemException e) {
                throw e;
            } catch (final Exception e) {
                throw new CrawlerSystemException("Could not store data.", e);
            }
        }
    
        /**
         * Gets the child URL extraction rules as a stream of tag-attribute pairs.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

            try {
                server.start();
            } catch (final Exception e) {
                throw new CrawlerSystemException(e);
            }
        }
    
        public void stop() {
            try {
                server.stop();
                server.join();
            } catch (final Exception e) {
                throw new CrawlerSystemException(e);
            } finally {
                if (tempDocRoot) {
                    docRoot.delete();
                }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

        }
    
        /**
         * Initializes the extractor by starting the office manager.
         *
         * @throws CrawlerSystemException if the office manager is null or fails to start
         */
        @PostConstruct
        public void init() {
            if (officeManager == null) {
                throw new CrawlerSystemException("officeManager is null.");
            }
            try {
                officeManager.start();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractor.java

    import java.io.IOException;
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .doc file.
     *
     * @author shinsuke
     *
     */
    public class MsWordExtractor extends AbstractExtractor {
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TextExtractorTest.java

    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.dbflute.utflute.core.PlainTestCase;
    
    /**
     * @author shinsuke
     *
     */
    public class TextExtractorTest extends PlainTestCase {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractor.java

    import java.io.File;
    import java.io.IOException;
    import java.util.List;
    
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.helper.MimeTypeHelper;
    
    import jakarta.annotation.Resource;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsExcelExtractor.java

    import java.io.InputStream;
    import java.util.Map;
    
    import org.apache.poi.hssf.usermodel.HSSFWorkbook;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets a text from .xls file.
     *
     * @author shinsuke
     *
     */
    public class MsExcelExtractor extends AbstractExtractor {
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2K bytes
    - Viewed (0)
Back to top