Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 115 for "from" (0.01 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

     * </p>
     *
     * <p>
     * The crawling process involves the following steps:
     * </p>
     * <ol>
     *   <li>Fetching a URL from the queue using {@link UrlQueueService#poll(String)}.</li>
     *   <li>Checking if the URL is valid using {@link #isValid(UrlQueue)}.</li>
     *   <li>Accessing the content using a {@link CrawlerClient} obtained from {@link CrawlerClientFactory}.</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/net/protocol/storage/Handler.java

         * This class handles the authentication, connection management, and data retrieval
         * from storage buckets and objects.
         *
         * <p>
         * The connection extracts bucket and object names from the URL and uses environment
         * variables for authentication and endpoint configuration.
         * </p>
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.5K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

            return processRequest(uri, true);
        }
    
        /**
         * Processes an FTP request to retrieve data from the specified URI.
         * This method handles the complete FTP request lifecycle including timeout management,
         * connection setup, and data retrieval.
         *
         * @param uri The URI to retrieve data from
         * @param includeContent Whether to include the actual content in the response
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 39.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/pool/CrawlerPooledObjectFactory.java

        /**
         * The name of the component to be retrieved from the CrawlerContainer.
         */
        protected String componentName;
    
        /**
         * The listener that is called when a pooled object is destroyed.
         */
        protected OnDestroyListener<T> onDestroyListener;
    
        /**
         * Creates a new object instance from the crawler container.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractExtractor.java

     * and registration with the ExtractorFactory.
     *
     * <p>
     * This class handles the retrieval of essential crawler components like
     * {@link MimeTypeHelper} and {@link ExtractorFactory} from the
     * {@link CrawlerContainer}. It also provides a convenient method for
     * registering the extractor with the {@link ExtractorFactory}.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

     *   <li><b>trimSpaceEnabled:</b> A flag to enable or disable trimming of whitespace from extracted values.</li>
     *   <li><b>charsetName:</b> The character encoding for the output XML.</li>
     *   <li><b>dataClass:</b> The class type to return from the {@link #getData(AccessResultData)} method.</li>
     * </ul>
     *
     */
    public class XpathTransformer extends HtmlTransformer {
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractor.java

    /**
     * Extracts text content from Microsoft PowerPoint documents.
     */
    public class MsPowerPointExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsPowerPointExtractor instance.
         */
        public MsPowerPointExtractor() {
            super();
        }
    
        /**
         * Extracts text from the PowerPoint input stream.
         * @param in The input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlFilterService.java

         * @param url the URL to be excluded
         */
        void addExcludeUrlFilter(String sessionId, String url);
    
        /**
         * Adds a list of URLs to be excluded from crawling for a specific session.
         *
         * @param sessionId the ID of the session for which the URLs should be excluded
         * @param urlList the list of URLs to be excluded
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/TemporaryFileInputStream.java

        private final File tempFile;
    
        private final FileInputStream fileInputStream;
    
        /**
         * A class that provides an input stream for reading from a temporary file.
         * This class wraps a {@link FileInputStream} to read from the specified temporary file.
         *
         * @param tempFile the temporary file to be read
         * @throws FileNotFoundException if the specified file does not exist
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java

    /**
     * Gets text from a Microsoft Publisher file.
     *
     * @author shinsuke
     *
     */
    public class MsPublisherExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsPublisherExtractor instance.
         */
        public MsPublisherExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Publisher input stream.
         * @param in The input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
Back to top