Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 41 - 50 of 64 for default (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

                    return strList.toArray(n -> new String[n]);
                case NODE:
                    final Node node = (Node) xObj.value();
                    return new String[] { node.getTextContent() };
                default:
                    Object obj = xObj.value();
                    if (obj == null) {
                        obj = "";
                    }
                    return new String[] { obj.toString() };
                }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * are compared to pages on other sites—it only lets the search engines know
         * which pages you deem most important for the crawlers.
         *
         * The default priority of a page is 0.5.
         *
         * Please note that the priority you assign to a page is not likely to
         * influence the position of your URLs in a search engine's result pages.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorFactory.java

        protected Map<String, Extractor[]> extractorMap = new HashMap<>();
    
        /**
         * Constructs a new ExtractorFactory.
         * <p>
         * The constructor body is empty; {@code extractorMap} is already set to an
         * empty {@code HashMap} by its field initializer.
         * </p>
         */
        public ExtractorFactory() {
            // Default constructor: no setup is performed here.
        }
    
        /**
         * Adds an extractor to the factory for the specified key.
         * If an extractor already exists for the key, the new extractor is added to the array of extractors,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

     * It also includes a caching mechanism for XPathAPI instances to improve performance.
     * </p>
     * <p>
     * The extracted text is obtained from the nodes selected by the {@code targetNodePath} XPath expression.
     * The default value for {@code targetNodePath} is "//HTML/BODY | //@alt | //@title", which selects the body of the HTML document,
     * as well as the alt and title attributes.
     * </p>
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerContextTest.java

            }
    
            public void delayAtNoUrlInQueue() {
                // Empty body: this implementation does nothing when invoked.
            }
    
            public void delayForWaitingNewUrl() {
                // Empty body: this implementation does nothing when invoked.
            }
        }
    
        /**
         * Test default constructor
         */
        public void test_constructor() {
            CrawlerContext context = new CrawlerContext();
            assertNotNull(context);
            assertNull(context.getSessionId());
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 25.6K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/net/protocol/storage/Handler.java

     * </p>
     */
    public class Handler extends URLStreamHandler {
    
        /**
         * Constructs a new Handler.
         * <p>
         * The constructor body is empty, so the only work done is the implicit
         * call to the {@code URLStreamHandler} superclass constructor.
         * </p>
         */
        public Handler() {
            // Default constructor: no setup is performed here.
        }
    
        /**
         * Opens a connection to the storage URL.
         *
         * @param u The URL to open a connection to
         * @return A new StorageURLConnection instance
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

     * </p>
     */
    public class CrawlerContext {
        /**
         * Constructs a new CrawlerContext.
         * <p>
         * The constructor body is empty; it assigns nothing itself, so each field
         * keeps the value given by its own declaration.
         * </p>
         */
        public CrawlerContext() {
            // Default constructor: no setup is performed here.
        }
    
        /**
         * Session identifier for the crawling session.
         */
        protected String sessionId;
    
        /**
         * Current number of active crawler threads.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/util/TextUtil.java

            private int maxAlphanumTermSize = -1;
    
            private int maxSymbolTermSize = -1;
    
            private boolean duplicateTermRemoved = false;
    
            /**
             * Array of space characters. The default set is U+0020 (SPACE),
             * U+00A0 (NO-BREAK SPACE), U+3000 (IDEOGRAPHIC SPACE) and
             * U+FFFD (REPLACEMENT CHARACTER).
             */
            private int[] spaceChars = { '\u0020', '\u00a0', '\u3000', '\ufffd' };
    
            /**
             * Constructor.
             * @param reader The reader.
             */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

                    extractor = extractorFactory.getExtractor(detectedMimeType);
                    if (extractor == null) {
                        if (logger.isDebugEnabled()) {
                            logger.debug("Using default extractor {} for MIME type {}", extractorName, mimeType);
                        }
                        extractor = crawlerContainer.getComponent(extractorName);
                    } else if (logger.isDebugEnabled()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

        private final List<String> sitemapList = new ArrayList<>();
    
        /**
         * Creates a new RobotsTxt instance.
         * <p>
         * The constructor body is empty; {@code sitemapList} is already set to an
         * empty {@code ArrayList} by its field initializer.
         * </p>
         */
        public RobotsTxt() {
            // Default constructor: no setup is performed here.
        }
    
        /**
         * Checks if access to a given path is allowed for a specific user agent according to robots.txt rules.
         *
         * @param path The path to check for access permission
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
Back to top