Search Options

Results per page
Sort
Preferred Languages
Advance

Results 11 - 20 of 21 for Xref (0.01 sec)

  1. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

            buf.append(count);
            buf.append("</title></head><body><h1>Content ");
            buf.append(count);
            buf.append("</h1><br>");
            buf.append("<a href=\"index.html\">Index</a><br>");
            for (int i = 1; i <= 10; i++) {
                buf.append("<a href=\"file");
                buf.append(count);
                buf.append("-");
                buf.append(i);
                buf.append(".html\">File ");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformerTest.java

            Map<String, String> childUrlRuleMap = newHashMap();
            childUrlRuleMap.put("//A", "href");
            childUrlRuleMap.put("//AREA", "href");
            childUrlRuleMap.put("//FRAME", "src");
            childUrlRuleMap.put("//IFRAME", "src");
            childUrlRuleMap.put("//IMG", "src");
            childUrlRuleMap.put("//LINK", "href");
            childUrlRuleMap.put("//SCRIPT", "src");
            htmlTransformer.setChildUrlRuleMap(childUrlRuleMap);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/FileTransformerTest.java

            Map<String, String> childUrlRuleMap = newHashMap();
            childUrlRuleMap.put("//A", "href");
            childUrlRuleMap.put("//AREA", "href");
            childUrlRuleMap.put("//FRAME", "src");
            childUrlRuleMap.put("//IFRAME", "src");
            childUrlRuleMap.put("//IMG", "src");
            childUrlRuleMap.put("//LINK", "href");
            childUrlRuleMap.put("//SCRIPT", "src");
            fileTransformer.setChildUrlRuleMap(childUrlRuleMap);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 7.6K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

            buf.append(count);
            buf.append("</title></head><body><h1>Content ");
            buf.append(count);
            buf.append("</h1><br>");
            buf.append("<a href=\"index.html\">Index</a><br>");
            for (int i = 1; i <= 10; i++) {
                buf.append("<a href=\"file");
                buf.append(count);
                buf.append("-");
                buf.append(i);
                buf.append(".html\">File ");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  5. .github/workflows/maven.yml

            restore-keys: |
              ${{ runner.os }}-maven-
        - name: Checkout fess-parent
          uses: actions/checkout@v4
          with:
            repository: codelibs/fess-parent
            ref: ${{ env.PARENT_BRANCH }}
            path: fess-parent
        - name: Install fess-parent
          run: |
            cd fess-parent
            mvn install -Dgpg.skip=true
        - name: Build with Maven
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sun May 18 02:59:16 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  6. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

      <mime-type type="message/http"/>
      <mime-type type="message/imdn+xml"/>
    
      <mime-type type="message/news">
        <magic priority="60">
          <match value="Path:" type="string" offset="0" />
          <match value="Xref:" type="string" offset="0" />
        </magic>
        <magic priority="50">
          <match value="Article" type="string" offset="0" />
        </magic>
        <sub-class-of type="text/x-tika-text-based-message"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  7. .github/workflows/maven.yml

            restore-keys: |
              ${{ runner.os }}-maven-
        - name: Checkout fess-parent
          uses: actions/checkout@v4
          with:
            repository: codelibs/fess-parent
            ref: ${{ env.PARENT_BRANCH }}
            path: fess-parent
        - name: Install fess-parent
          run: |
            cd fess-parent
            mvn install -Dgpg.skip=true
        - name: Build with Maven
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun May 18 03:08:24 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformer.java

            }
    
            return parser;
        }
    
        /**
         * Gets the base href from the document's BASE tag.
         *
         * @param document the document to extract base href from
         * @return the base href URL, or null if not found
         */
        protected String getBaseHref(final Document document) {
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 28.5K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

            final Map<String, String> childUrlRuleMap = newHashMap();
            childUrlRuleMap.put("//A", "href");
            childUrlRuleMap.put("//AREA", "href");
            childUrlRuleMap.put("//FRAME", "src");
            childUrlRuleMap.put("//IFRAME", "src");
            childUrlRuleMap.put("//IMG", "src");
            childUrlRuleMap.put("//LINK", "href");
            childUrlRuleMap.put("//SCRIPT", "src");
    
            container = new StandardCrawlerContainer();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    import org.codelibs.fess.crawler.entity.RobotsTxt.Directive;
    import org.codelibs.fess.crawler.exception.RobotsTxtException;
    
    /**
     * Robots.txt Specifications:
     * <ul>
     * <li><a href=
     * "https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt"
     * >https://developers.google.com/webmasters/control-crawl-index/docs/robots_txt
     * </a></li>
     * </ul>
     *
     * @author bowez
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7.7K bytes
    - Viewed (0)
Back to top