Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 91 - 100 of 130 for content2 (0.06 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/SitemapsRule.java

     * represents a valid sitemap. It uses a SitemapsHelper to validate the response body as an InputStream.
     * The rule checks if the URL matches the defined regex pattern and then validates the content as a sitemap.
     * If any exception occurs during the sitemap validation, it logs the error and returns false.
     *
     */
    public class SitemapsRule extends RegexRule {
        /**
         * Serial version UID for serialization.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractorTest.java

            final String content = ATTR_NAME + "," + testStr;
            final Map<String, String> params = new HashMap<String, String>();
            //final ExtractData text = extractor.getText(new ByteArrayInputStream(FileUtils.readFileToByteArray(new File(filePath))), params);
            final ExtractData text = extractor.getText(new ByteArrayInputStream(testStr.getBytes()), params);
            assertEquals(content, text.getContent());
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.4K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/CrawlingParameterUtil.java

         */
        public static CrawlerContext getCrawlerContext() {
            return ROBOT_CONTEXT_THREAD_LOCAL.get();
        }
    
        /**
         * Sets the current {@link CrawlerContext} for the current thread.
         * If the provided {@code crawlerContext} is {@code null}, the context is removed from the thread-local storage.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.4K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/MaxLengthExceededException.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * MaxLengthExceededException is thrown when the content length exceeds the maximum allowed length.
     * It extends CrawlingAccessException, indicating a crawling-related access issue.
     *
     */
    public class MaxLengthExceededException extends CrawlingAccessException {
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  5. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/entity/OpenSearchAccessResultData.java

    import java.io.IOException;
    import java.util.Map;
    
    import org.codelibs.core.misc.Base64Util;
    import org.codelibs.fess.crawler.exception.OpenSearchAccessException;
    import org.opensearch.core.xcontent.ToXContent;
    import org.opensearch.core.xcontent.XContentBuilder;
    
    /**
     * OpenSearchAccessResultData is an implementation of {@link AccessResultData} for OpenSearch.
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.2K bytes
    - Viewed (0)
  6. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/entity/OpenSearchUrlQueue.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    import java.io.IOException;
    
    import org.opensearch.core.xcontent.ToXContent;
    import org.opensearch.core.xcontent.XContentBuilder;
    
    /**
     * OpenSearchUrlQueue is an implementation of {@link UrlQueue} for OpenSearch.
     */
    public class OpenSearchUrlQueue extends UrlQueueImpl<String> implements ToXContent {
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.1K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java

        public static final String FS_FILE_GROUPS = "fsFileGroups";
    
        /** Character encoding for files */
        protected String charset = Constants.UTF_8;
    
        /** Helper for managing content length limits */
        @Resource
        protected ContentLengthHelper contentLengthHelper;
    
        /** Flag to track initialization status */
        protected AtomicBoolean isInit = new AtomicBoolean(false);
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  8. LICENSE

              documentation, if provided along with the Derivative Works; or,
              within a display generated by the Derivative Works, if and
              wherever such third-party notices normally appear. The contents
              of the NOTICE file are for informational purposes only and
              do not modify the License. You may add Your own attribution
              notices within Derivative Works that You distribute, alongside
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Jan 11 04:30:09 UTC 2021
    - 11.1K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/ntlm/JcifsEngine.java

        /** The CIFS context for NTLM authentication. */
        protected BaseContext cifsContext;
    
        /**
         * Constructs a JcifsEngine with the specified properties.
         *
         * @param props the properties for configuring the CIFS context
         * @throws CrawlingAccessException if an error occurs during initialization
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 4.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

     * </p>
     * <ul>
     *   <li>Starting and finishing threads</li>
     *   <li>Starting and cleaning up crawling</li>
     *   <li>Handling unsupported URLs</li>
     *   <li>Checking last modified dates</li>
     *   <li>Getting content</li>
     *   <li>Handling redirects</li>
     *   <li>Processing responses</li>
     *   <li>Handling exceptions during crawling and child URL processing</li>
     *   <li>Handling cases where no URL is in the queue</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
Back to top