Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 111 for xpath (0.07 sec)

  1. src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

            final String xpath = xpathConfigMap.get(XPath.DEFAULT_LANG);
            if (StringUtil.isNotBlank(xpath)) {
                return xpath;
            }
            return fessConfig.getCrawlerDocumentHtmlLangXpath();
        }
    
        /**
         * Gets the XPath expression for extracting content.
         *
         * @param fessConfig the Fess configuration
         * @param xpathConfigMap the XPath configuration map
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Dec 12 13:58:40 UTC 2025
    - 54.6K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

        }
    
        /**
         * Checks if a path is valid for crawling (not a JavaScript, mailto, or other invalid URL).
         *
         * @param path the path to validate
         * @return true if the path is valid, false otherwise
         */
        protected boolean isValidPath(final String path) {
            if (StringUtil.isBlank(path)) {
                return false;
            }
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 29 07:42:33 UTC 2025
    - 30.5K bytes
    - Viewed (0)
  3. src/main/resources/fess_config.properties

    dc:title=title:string\n\
    
    # html
    
    # XPath to extract main content from HTML documents.
    crawler.document.html.content.xpath=//BODY
    # XPath to extract language attribute from HTML documents.
    crawler.document.html.lang.xpath=//HTML/@lang
    # XPath to extract digest (description) from HTML documents.
    crawler.document.html.digest.xpath=//META[@name='description']/@content
    # XPath to extract canonical URL from HTML documents.
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 54.8K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

        /** The key of the configuration. e.g. //HTML/@lang */
        String CRAWLER_DOCUMENT_HTML_LANG_XPATH = "crawler.document.html.lang.xpath";
    
        /** The key of the configuration. e.g. //META[@name='description']/@content */
        String CRAWLER_DOCUMENT_HTML_DIGEST_XPATH = "crawler.document.html.digest.xpath";
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 525.7K bytes
    - Viewed (2)
  5. src/main/java/org/codelibs/core/io/FileUtil.java

        /**
         * Loads the content of a file as text, decoding it with the JVM's default charset.
         * <p>
         * The path is validated first, then the work is delegated to the
         * two-argument {@code readText} overload with the default charset name.
         *
         * @param path
         *            The file path. Must not be {@literal null} or empty.
         * @return The text read from the file.
         */
        public static String readText(final String path) {
            assertArgumentNotEmpty("path", path);
            // Resolve the charset only after the argument check, as the original ordering does.
            final String defaultEncoding = Charset.defaultCharset().name();
            return readText(path, defaultEncoding);
        }
    
        /**
    Registered: Sat Dec 20 08:55:33 UTC 2025
    - Last Modified: Sat Nov 22 11:21:59 UTC 2025
    - 13.1K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/s3/S3Client.java

        }
    
        /**
         * Parses an S3 path into bucket name and object path components.
         * @param path the S3 path to parse (format: bucket/object/path)
         * @return an array containing the bucket name and object path
         * @throws CrawlingAccessException if the path format is invalid
         */
        protected String[] parsePath(final String path) {
            if (StringUtil.isNotEmpty(path)) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 21.4K bytes
    - Viewed (0)
  7. src/test/java/org/codelibs/core/io/FileUtilTest.java

        }
    
        /**
         * Test isPathSafe with path outside base directory
         *
         * @throws Exception
         */
        @Test
        public void testIsPathSafe_PathOutsideBase() throws Exception {
            final Path baseDir = tempFolder.getRoot().toPath();
            final Path outsidePath = Paths.get("/tmp/outside.txt");
    
    Registered: Sat Dec 20 08:55:33 UTC 2025
    - Last Modified: Sat Nov 22 11:21:59 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/app/web/admin/storage/AdminStorageAction.java

        }
    
        /**
         * Builds the prefix used in front of object names under the given path.
         * <p>
         * An empty path (as reported by {@code StringUtil.isEmpty}) yields the
         * empty string; any other path is returned with a single {@code "/"} appended.
         *
         * @param path the base path
         * @return path with trailing slash or empty string
         */
        protected static String getPathPrefix(final String path) {
            if (StringUtil.isEmpty(path)) {
                return StringUtil.EMPTY;
            }
            return path + "/";
        }
    
        /**
         * Combines path and name to create a full object name.
         *
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 22.1K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/helper/CurlHelper.java

        /**
         * Builds a GET request for the given path and sets its
         * {@code Content-Type} header to {@code application/json}.
         *
         * @param path the request path
         * @return the configured CurlRequest
         */
        public CurlRequest get(final String path) {
            return request(Method.GET, path)
                    .header("Content-Type", "application/json");
        }
    
        /**
         * Creates a POST request for the specified path.
         * @param path the request path
         * @return the configured CurlRequest
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 6.1K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/app/web/admin/wizard/AdminWizardAction.java

            }
    
            if (path.startsWith("www.")) {
                return "http://" + path;
            }
    
            if (path.startsWith("//")) {
                return "file://" + path;
            }
            if (path.startsWith("/")) {
                return "file:" + path;
            }
            if (!path.startsWith("file:")) {
                return "file:/" + path.replace('\\', '/');
            }
            return path;
        }
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 16.3K bytes
    - Viewed (0)
Back to top