Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 41 - 45 of 45 for extras (0.02 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformer.java

    import org.w3c.dom.Document;
    import org.w3c.dom.Node;
    import org.xml.sax.InputSource;
    
    /**
     * {@link XpathTransformer} is a class that transforms HTML content into XML format based on XPath expressions.
     * It extracts data from an HTML document by applying XPath rules defined in {@link #fieldRuleMap}.
     * The extracted data is then formatted into an XML structure and stored in the {@link ResultData}.
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

            }
        }
    
        /**
         * Runs the crawling process in a separate thread.
         * This method fetches URLs from the queue, accesses content, processes responses,
         * and extracts child URLs until the crawling process is done or no more URLs are available.
         */
        @Override
        public void run() {
            log(logHelper, LogType.START_THREAD, crawlerContext);
            int threadCheckCount = 0;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  3. src/test/java/org/codelibs/fess/suggest/util/SuggestUtilTest.java

            String[] fields = { "content" };
            List<String> keywords = SuggestUtil.getKeywords(query, fields);
            assertNotNull(keywords);
            // Should extract all unique terms
            assertTrue(keywords.size() > 0);
        }
    
        @Test
        public void testCreateBulkLineWithMinimalItem() {
            // Test with minimal SuggestItem
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 18.2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

            private URI uri;
    
            private String parent;
    
            private String name;
    
            /**
             * Constructs a new FtpInfo from a URL string.
             * This constructor parses the URL and extracts the host, port, parent directory,
             * and file name components.
             *
             * @param s The URL string to parse
             * @param c The character encoding (not currently used)
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 39.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                httpClientPropertyMap.put(name, value);
            }
        }
    
        /**
         * Processes robots.txt for the given URL.
         * This method fetches and parses the robots.txt file to extract disallow/allow rules
         * and sitemap information.
         *
         * @param url The URL to process robots.txt for
         */
        protected void processRobotsTxt(final String url) {
            if (StringUtil.isBlank(url)) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
Back to top