Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 3 of 3 for getCrawlerDocumentHtmlCanonicalXpath (0.8 sec)

  1. src/test/java/org/codelibs/fess/crawler/transformer/FessXpathTransformerTest.java

                }
            };
            transformer.fessConfig = new FessConfig.SimpleImpl() {
                private static final long serialVersionUID = 1L;
    
                public String getCrawlerDocumentHtmlCanonicalXpath() {
                    return "//LINK[@rel='canonical'][1]/@href";
                };
            };
    
            final ResponseData responseData = new ResponseData();
            responseData.setSessionId("test");
    Registered: Wed Jun 12 13:08:18 UTC 2024
    - Last Modified: Thu Feb 22 01:37:57 UTC 2024
    - 38.6K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

            String xpath = configMap.get(Config.HTML_CANONICAL_XPATH);
            if (xpath == null) {
                xpath = fessConfig.getCrawlerDocumentHtmlCanonicalXpath();
            }
            if (StringUtil.isBlank(xpath)) {
                return null;
            }
            final String canonicalUrl = getSingleNodeValue(document, xpath, node -> node);
    Registered: Wed Jun 12 13:08:18 UTC 2024
    - Last Modified: Thu Feb 22 01:37:57 UTC 2024
    - 41.9K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

         * The value is, e.g. //LINK[@rel='canonical'][1]/@href <br>
         * @return The value of found property. (NotNull: if not found, exception but basically no way)
         */
        String getCrawlerDocumentHtmlCanonicalXpath();
    
        /**
         * Get the value for the key 'crawler.document.html.pruned.tags'. <br>
         * The value is, e.g. noscript,script,style,header,footer,aside,nav,a[rel=nofollow] <br>
    Registered: Wed Jun 12 13:08:18 UTC 2024
    - Last Modified: Thu Apr 11 02:34:53 UTC 2024
    - 459.2K bytes
    - Viewed (0)
Back to top