Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 3 of 3 for getCrawlerDocumentHtmlCanonicalXpath (0.42 sec)

  1. src/test/java/org/codelibs/fess/crawler/transformer/FessXpathTransformerTest.java

                }
            };
            transformer.fessConfig = new FessConfig.SimpleImpl() {
                private static final long serialVersionUID = 1L;
    
                public String getCrawlerDocumentHtmlCanonicalXpath() {
                    return "//LINK[@rel='canonical'][1]/@href";
                };
            };
    
            final ResponseData responseData = new ResponseData();
            responseData.setSessionId("test");
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Sat Jul 19 23:49:30 UTC 2025
    - 41.5K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

            String xpath = configMap.get(Config.HTML_CANONICAL_XPATH);
            if (xpath == null) {
                xpath = fessConfig.getCrawlerDocumentHtmlCanonicalXpath();
            }
            if (StringUtil.isBlank(xpath)) {
                return null;
            }
            final String canonicalUrl = getSingleNodeValue(document, xpath, node -> node);
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 54.4K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

         * comment: XPath to extract canonical URL from HTML documents.
         * @return The value of found property. (NotNull: if not found, exception but basically no way)
         */
        String getCrawlerDocumentHtmlCanonicalXpath();
    
        /**
         * Get the value for the key 'crawler.document.html.pruned.tags'. <br>
         * The value is, e.g. noscript,script,style,header,footer,aside,nav,a[rel=nofollow] <br>
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 525.6K bytes
    - Viewed (1)
Back to top