Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 19 for extractors (0.06 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ZipExtractor.java

                        final Extractor extractor = extractorFactory.getExtractor(mimeType);
                        if (extractor != null) {
                            try {
                                final Map<String, String> map = new HashMap<>();
                                map.put(ExtractData.RESOURCE_NAME_KEY, filename);
                                buf.append(extractor.getText(new IgnoreCloseInputStream(ais), map).getContent());
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 4.8K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TarExtractor.java

                        final Extractor extractor = extractorFactory.getExtractor(mimeType);
                        if (extractor != null) {
                            try {
                                final Map<String, String> map = new HashMap<>();
                                map.put(ExtractData.RESOURCE_NAME_KEY, filename);
                                buf.append(extractor.getText(new IgnoreCloseInputStream(ais), map).getContent());
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.core.io.InputStreamUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text content from an input stream as plain text.
     */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CsvExtractor.java

    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text content and metadata from CSV files.
     * This extractor provides better structured data extraction compared to Tika's generic text extraction.
     *
     * <p>Features:
     * <ul>
     *   <li>Automatic delimiter detection (comma, tab, semicolon, pipe)</li>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  5. fastapi/security/api_key.py

        """
        API key authentication using a query parameter.
    
        This defines the name of the query parameter that should be provided in the request
        with the API key and integrates that into the OpenAPI documentation. It extracts
        the key value sent in the query parameter automatically and provides it as the
        dependency result. But it doesn't define how to send that API key to the client.
    
        ## Usage
    
    Registered: Sun Dec 28 07:19:09 UTC 2025
    - Last Modified: Wed Dec 17 21:25:59 UTC 2025
    - 9.6K bytes
    - Viewed (1)
  6. src/main/java/org/codelibs/fess/crawler/transformer/FessTransformer.java

         */
        FessConfig getFessConfig();
    
        /**
         * Gets the logger instance for this transformer.
         *
         * @return the logger instance
         */
        Logger getLogger();
    
        /**
         * Extracts the host name from a URL string.
         * Removes protocol and path components to return just the hostname.
         *
         * @param u the URL string to extract host from
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 14.1K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

            if (StringUtil.isNotBlank(xpath)) {
                return xpath;
            }
            return fessConfig.getCrawlerDocumentHtmlDigestXpath();
        }
    
        /**
         * Extracts the canonical URL from the HTML document.
         *
         * @param responseData the response data from crawling
         * @param document the parsed HTML document
         * @return the canonical URL if found, null otherwise
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Dec 12 13:58:40 UTC 2025
    - 54.6K bytes
    - Viewed (0)
  8. .teamcity/subprojects.json

        "name": "jacoco",
        "path": "platforms/jvm/jacoco",
        "unitTests": true,
        "functionalTests": true,
        "crossVersionTests": false
      },
      {
        "name": "java-api-extractor",
        "path": "platforms/core-configuration/java-api-extractor",
        "unitTests": true,
        "functionalTests": false,
        "crossVersionTests": false
      },
      {
        "name": "java-compiler-plugin",
    Registered: Wed Dec 31 11:36:14 UTC 2025
    - Last Modified: Thu Dec 18 18:40:11 UTC 2025
    - 37.5K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/crawler/FessCrawlerThread.java

                        throw new ContainerNotAvailableException(t);
                    }
                    throw t;
                }
            }
        }
    
        /**
         * Extracts anchor URLs from the given object and converts them to RequestData objects.
         * The input object can be either a single string or a list of strings representing URLs.
         *
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 19.5K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/storage/S3StorageClient.java

                return false;
            }
        }
    
        @Override
        public void close() {
            if (s3Client != null) {
                s3Client.close();
            }
        }
    
        /**
         * Extracts the file/directory name from a full object path.
         *
         * @param objectName the full object path
         * @return the name portion of the path
         */
        private String getName(final String objectName) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 10.9K bytes
    - Viewed (0)
Back to top