Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 38 for Processing (0.06 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java

            }
        }
    
        /**
         * Gets the mail properties used for email processing.
         *
         * @return the mail properties
         */
        public Properties getMailProperties() {
            return mailProperties;
        }
    
        /**
         * Sets the mail properties used for email processing.
         *
         * @param mailProperties the mail properties to set
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.6K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/RuleManager.java

     */
    package org.codelibs.fess.crawler.rule;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    
    /**
     * The RuleManager interface provides methods to manage rules for processing response data.
     * It allows adding, retrieving, and removing rules, as well as checking for their existence.
     */
    public interface RuleManager {
    
        /**
         * Retrieves the rule associated with the given response data.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java

     *
     * <p>
     * A Sitemap file provides search engines with a list of URLs available for crawling.
     * This class encapsulates the essential attributes of a Sitemap entry, allowing for efficient management
     * and processing of Sitemap data.
     * </p>
     *
     * <p>
     * The {@code loc} attribute specifies the URL of the Sitemap, while the {@code lastmod} attribute
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.4K bytes
    - Viewed (1)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb/SmbClient.java

                } catch (final Exception e) {
                    if (logger.isDebugEnabled()) {
                        logger.debug("Exception on SID processing.", e);
                    }
                }
            }
        }
    
        /**
         * Preprocesses the URI before processing the request.
         *
         * @param uri the URI to preprocess
         * @return the preprocessed URI
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 22.5K bytes
    - Viewed (3)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

     * <p>
     * The {@link ContentWriter} functional interface is used to abstract the process of writing content to a writer.
     * </p>
     *
     * <p>
     * The class uses temporary files for processing large input streams and ensures that these files are deleted after
     * processing.
     * </p>
     *
     */
    public class TikaExtractor extends PasswordBasedExtractor {
    
        private static final Logger logger = LogManager.getLogger(TikaExtractor.class);
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

    import jakarta.annotation.Resource;
    
    /**
     * The {@code CrawlerThread} class represents a thread that executes the crawling process.
     * It is responsible for fetching URLs from the queue, accessing the content,
     * processing the response, and extracting child URLs.
     *
     * <p>
     * This class implements the {@link Runnable} interface, allowing it to be executed in a separate thread.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  7. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/entity/OpenSearchAccessResult.java

        /**
         * Initializes the access result with response data and result data.
         *
         * @param responseData The response data from the crawl operation.
         * @param resultData The result data from content processing.
         */
        @Override
        public void init(final ResponseData responseData, final ResultData resultData) {
    
            setCreateTime(System.currentTimeMillis());
            if (responseData != null) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

     *
     * <p>The factory maintains a map of regular expression patterns to crawler clients,
     * allowing for URL-based client selection. Clients can be added with specific patterns
     * and optionally at specific positions in the processing order.</p>
     *
     * <p>This factory is typically initialized through dependency injection and can be
     * configured with initialization parameters that are passed to all registered clients.</p>
     *
     * <p>Features:</p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

                    throw new ExtractException(e);
                }
            }
    
            return encoding;
        }
    
        /**
         * Extracts text content from the given content by removing tags and processing attributes.
         * @param content The content to extract from.
         * @return The extracted text.
         */
        protected String extractString(final String content) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

     *
     * <p>
     * The main purpose of this class is to simplify the extraction process by providing a fluent interface
     * for configuring the extraction parameters and handling the underlying complexities of content processing,
     * such as MIME type detection, extractor selection, and content length validation.
     * </p>
     *
     * <p>
     * Example usage:
     * </p>
     *
     * <pre>
     * {@code
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
Back to top