Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 54 for Handle (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/XmlUtil.java

            if (StringUtil.isNotBlank(accessResultData.getEncoding())) {
                is.setEncoding(accessResultData.getEncoding());
            }
    
            // create handler
            final DocHandler handler = new DocHandler();
    
            // create a sax instance
            final SAXParserFactory spfactory = SAXParserFactory.newInstance();
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.4K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

    import org.codelibs.fess.crawler.helper.SitemapsHelper;
    import org.codelibs.fess.crawler.processor.ResponseProcessor;
    
    import jakarta.annotation.Resource;
    
    /**
     * A response processor implementation that handles sitemaps.
     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  3. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

            Logger rootLogger = Logger.getLogger("");
            rootLogger.setLevel(Level.ALL);
            ConsoleHandler handler = new ConsoleHandler();
            handler.setFormatter(new SimpleFormatter());
            handler.setLevel(Level.ALL);
            rootLogger.addHandler(handler);
        }
    
        @Override
        public void tearDown() throws Exception {
            super.tearDown();
            // close runner
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/AbstractRule.java

    import jakarta.annotation.Resource;
    
    /**
     * Abstract base class for implementing {@link Rule} interfaces.
     * Provides common functionality and properties for crawler rules.
     *
     * <p>
     * This class handles the registration of rules with the {@link RuleManager}
     * and provides getter and setter methods for common properties such as
     * {@code ruleId} and {@code responseProcessor}.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 2.8K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

    import java.util.LinkedHashMap;
    import java.util.List;
    import java.util.Map;
    import java.util.regex.Pattern;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * Represents a robots.txt file parser and handler.
     * This class manages the rules defined in a robots.txt file, including user agent directives,
     * allowed/disallowed paths, crawl delays, and sitemap URLs.
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractor.java

    /**
     * An abstract base class for implementing Extractor interfaces.
     * Provides common functionality such as access to CrawlerContainer components
     * and registration with the ExtractorFactory.
     *
     * <p>
     * This class handles the retrieval of essential crawler components like
     * {@link MimeTypeHelper} and {@link ExtractorFactory} from the
     * {@link CrawlerContainer}. It also provides a convenient method for
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/suggest/normalizer/HankakuKanaToZenkakuKana.java

    /**
     * The HankakuKanaToZenkakuKana class implements the Normalizer interface to convert
     * half-width Katakana characters (Hankaku Kana) to full-width Katakana characters (Zenkaku Kana).
     * It also handles the conversion of voiced and semi-voiced sound marks.
     *
     * <p>This class provides the following functionalities:</p>
     * <ul>
     *   <li>Normalization of a string containing Hankaku Kana to Zenkaku Kana.</li>
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 6.8K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

     * It processes the response data based on the HTTP status code and configured transformer.
     * </p>
     *
     * <p>
     * It handles successful responses by transforming the data using a {@link Transformer}
     * and storing the result. It also handles "Not Modified" responses by creating an empty
     * result and storing it. Unsuccessful responses are logged for debugging purposes.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientCreator.java

    import org.codelibs.fess.crawler.container.CrawlerContainer;
    
    import jakarta.annotation.Resource;
    
    /**
     * Creates and manages crawler clients for web crawling operations.
     * This class handles the registration and loading of crawler client factories and their associated clients.
     * <p>
     * The class maintains a mapping between regular expressions and component names, and manages a list
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

     * from FTP servers. The client supports various configurations, including authentication, timeouts,
     * passive/active modes, and encoding settings. It also handles FTP file attributes such as user,
     * group, and symbolic links.
     *
     * <p>
     * The class uses Apache Commons Net library for FTP communication. It maintains a queue of FTPClient
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 39.5K bytes
    - Viewed (0)
Back to top