Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 28 of 28 for runes (0.01 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/TransformerTest.java

                    return null;
                }
    
                ResultData resultData = new ResultData();
                resultData.setTransformerName(name);
                // Apply transformation rules
                try (InputStream is = responseData.getResponseBody()) {
                    byte[] bytes = is.readAllBytes();
                    String content = new String(bytes);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 28K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

        /**
         * Filter for URLs to control which URLs are processed.
         */
        protected UrlFilter urlFilter;
    
        /**
         * Manager for crawling rules and configurations.
         */
        protected RuleManager ruleManager;
    
        /**
         * Controller for managing crawling intervals and delays.
         */
        protected IntervalController intervalController;
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

    /**
     * PdfExtractor extracts text content from PDF files using Apache PDFBox.
     * It supports password-protected PDFs and can extract embedded documents and annotations.
     *
     * <p>The extractor runs text extraction in a separate thread with a configurable timeout
     * to prevent hanging on problematic PDF files. It also extracts metadata from the PDF
     * document and includes it in the extraction result.
     *
     * <p>Features:
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformer.java

     *   <li>Coalescing</li>
     *   <li>Entity expansion</li>
     *   <li>Ignoring comments and whitespace</li>
     *   <li>Validation</li>
     *   <li>XInclude awareness</li>
     * </ul>
     *
     * <p>
     * It also allows defining field rules using XPath expressions to extract specific data from the XML document and map it to fields in the ResultData.
     * The extracted data is then formatted into an XML structure suitable for indexing.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 23.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

         */
        protected void log(final LogHelper logHelper, final LogType key, final Object... objs) {
            if (logHelper != null) {
                logHelper.log(key, objs);
            }
        }
    
        /**
         * Runs the crawling process in a separate thread.
         * This method fetches URLs from the queue, accesses content, processes responses,
         * and extracts child URLs until the crawling process is done or no more URLs are available.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/onenote",
    				"application/parityfec",
    				"application/patch-ops-error+xml",
    				"application/pgp-encrypted",
    				"application/pgp-keys",
    				"application/pgp-signature",
    				"application/pics-rules",
    				"application/pidf+xml",
    				"application/pidf-diff+xml",
    				"application/pkcs10",
    				"application/pkcs7-mime",
    				"application/pkcs7-signature",
    				"application/pkix-cert",
    				"application/pkix-crl",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  7. src/main/resources/suggest_indices/suggest_analyzer.json

          },
          "dutch_stemmer": {
            "type":       "stemmer",
            "language":   "dutch"
          },
          "dutch_override": {
            "type":       "stemmer_override",
            "rules": [
              "fiets=>fiets",
              "bromfiets=>bromfiets",
              "ei=>eier",
              "kind=>kinder"
            ]
          },
          "english_keywords": {
            "type":       "keyword_marker",
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Oct 03 02:51:59 UTC 2019
    - 57.3K bytes
    - Viewed (0)
  8. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

      <mime-type type="application/pgp-keys"/>
    
      <mime-type type="application/pgp-signature">
        <glob pattern="*.asc"/>
        <glob pattern="*.sig"/>
      </mime-type>
    
      <mime-type type="application/pics-rules">
        <glob pattern="*.prf"/>
      </mime-type>
      <mime-type type="application/pidf+xml"/>
      <mime-type type="application/pidf-diff+xml"/>
      <mime-type type="application/pkcs10">
        <glob pattern="*.p10"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
Back to top