Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 31 - 40 of 45 for furent (0.02 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

            }
            matcher.appendTail(sb);
            return sb.toString().replaceAll("\\s+", " ").trim();
        }
    
        /**
         * Returns the current encoding setting.
         * @return The current encoding.
         */
        public String getEncoding() {
            return encoding;
        }
    
        /**
         * Sets the encoding for content extraction.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

                }
            }
    
        }
    
        /**
         * Stores child URLs to the crawling queue.
         * @param childUrlList The set of child URLs to store.
         * @param url The parent URL.
         * @param depth The depth of the child URLs.
         */
        protected void storeChildUrls(final Set<RequestData> childUrlList, final String url, final int depth) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/IgnoreCloseInputStream.java

         *
         * @return a hash code value for this object
         */
        @Override
        public int hashCode() {
            return inputStream.hashCode();
        }
    
        /**
         * Marks the current position in this input stream.
         *
         * @param readlimit the maximum limit of bytes that can be read before the mark position becomes invalid
         */
        @Override
        public synchronized void mark(final int readlimit) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/AccessResultImpl.java

        protected String sessionId;
    
        /** The rule ID that matched the accessed resource. */
        protected String ruleId;
    
        /** The URL of the accessed resource. */
        protected String url;
    
        /** The parent URL of the accessed resource. */
        protected String parentUrl;
    
        /** The status of the access result. */
        protected Integer status = Constants.OK_STATUS;
    
        /** The HTTP status code of the access result. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9K bytes
    - Viewed (0)
  5. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/entity/OpenSearchAccessResult.java

         */
        public static final String RULE_ID = "ruleId";
    
        /**
         * Field name for URL.
         */
        public static final String URL = "url";
    
        /**
         * Field name for parent URL.
         */
        public static final String PARENT_URL = "parentUrl";
    
        /**
         * Field name for status.
         */
        public static final String STATUS = "status";
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlQueueServiceImpl.java

            }
        }
    
        /**
         * Generates URL queues from a previous session's access results.
         * @param previousSessionId The previous session ID.
         * @param sessionId The current session ID.
         */
        @Override
        public void generateUrlQueues(final String previousSessionId, final String sessionId) {
            final Queue<UrlQueueImpl<Long>> urlQueueList = dataHelper.getUrlQueueList(sessionId);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

     * and cache file size to optimize the extraction process.
     *
     * <p>
     * The main purpose of this class is to simplify the extraction process by providing a fluent interface
     * for configuring the extraction parameters and handling the underlying complexities of content processing,
     * such as MIME type detection, extractor selection, and content length validation.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
  8. README.md

    - **Index Management**: Automatic index creation, switching, and maintenance
    - **Customizable Scoring**: User boost, document frequency, and query frequency weighting
    
    ## Technology Stack
    
    - **Java**: 21+ (configured via parent POM)
    - **OpenSearch**: Latest (provided scope)
    - **Apache Lucene**: Query parsing and text analysis
    - **ICU4J**: Unicode text processing and normalization
    - **JUnit 4**: Testing framework
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sun Aug 31 03:31:14 UTC 2025
    - 12.1K bytes
    - Viewed (1)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

            }
    
            return parser;
        }
    
        /**
         * Gets a thread-local XPathAPI instance for thread-safe XPath evaluation.
         *
         * @return the XPathAPI instance for the current thread
         */
        protected XPathAPI getXPathAPI() {
            XPathAPI cachedXPathAPI = xpathAPI.get();
            if (cachedXPathAPI == null) {
                cachedXPathAPI = new XPathAPI();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

        }
    
        /**
         * Stores child URLs found in the response data.
         *
         * @param crawlerContext the crawler context
         * @param childUrlList the set of child URLs
         * @param url the parent URL
         * @param depth the depth of the child URLs
         * @param encoding the encoding of the child URLs
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.5K bytes
    - Viewed (0)
Back to top