Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 51 - 60 of 154 for extracted (3.38 sec)

  1. src/main/java/org/codelibs/fess/ldap/LdapManager.java

                        }
                        consumer.accept(entryDn);
                    }
                }
            }
        }
    
        /**
         * Extracts the role name from an LDAP entry DN.
         *
         * @param entryDn the LDAP entry DN
         * @return the extracted role name, or null if not found
         */
        protected String getSearchRoleName(final String entryDn) {
            if (entryDn == null) {
                return null;
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 86.3K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MarkdownExtractor.java

                }
    
                // Extract links
                if (extractLinks) {
                    extractLinkMetadata(document, extractData);
                }
    
                return extractData;
            } catch (final Exception e) {
                throw new ExtractException("Failed to extract Markdown content", e);
            }
        }
    
        /**
         * Extracts YAML front matter metadata from the document.
         *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 03:46:53 UTC 2025
    - 8.2K bytes
    - Viewed (0)
  3. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    		class="org.codelibs.fess.crawler.extractor.impl.MsPowerPointExtractor" />
    	<component name="msPublisherExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.MsPublisherExtractor" />
    	<component name="msVisioExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.MsVisioExtractor" />
    	<component name="pdfExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.PdfExtractor" />
    	<component name="lhaExtractor"
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 03:46:53 UTC 2025
    - 50.1K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorFactory.java

            }
            if (extractor == null) {
                throw new CrawlerSystemException("Extractor instance is null. Cannot register null extractor.");
            }
            if (extractorMap.containsKey(key)) {
                final Extractor[] existingExtractors = extractorMap.get(key);
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 7.4K bytes
    - Viewed (0)
  5. src/main/resources/crawler/extractor+tikaExtractor.xml

    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<component name="tikaExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.TikaExtractor">
    		<property name="maxCompressionRatio">2</property>
    		<property name="maxUncompressionSize">10000000</property>
    	</component>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sun Aug 25 12:46:12 UTC 2019
    - 461 bytes
    - Viewed (0)
  6. src/main/resources/fess_config.properties

    dc:title=title:string\n\
    
    # html
    
    # XPath to extract main content from HTML documents.
    crawler.document.html.content.xpath=//BODY
    # XPath to extract language attribute from HTML documents.
    crawler.document.html.lang.xpath=//HTML/@lang
    # XPath to extract digest (description) from HTML documents.
    crawler.document.html.digest.xpath=//META[@name='description']/@content
    # XPath to extract canonical URL from HTML documents.
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 54.8K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TextExtractor.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.core.io.InputStreamUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts text content from an input stream as plain text.
     */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Dec 11 08:38:29 UTC 2025
    - 2K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ArchiveExtractorErrorHandlingTest.java

                        e.getMessage().contains("TAR") || e.getMessage().contains("extract"));
            }
        }
    
        /**
         * Test that ZipExtractor successfully extracts from valid archive.
         */
        public void test_ZipExtractor_validArchive_extractsSuccessfully() {
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/zip/test.zip");
    
            final ExtractData result = zipExtractor.getText(in, null);
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 12.6K bytes
    - Viewed (0)
  9. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ExtractorResourceManagementTest.java

            final AtomicBoolean streamClosed = new AtomicBoolean(false);
    
            try (final InputStream originalStream = ResourceUtil.getResourceAsStream("extractor/msoffice/test.xls")) {
                final InputStream trackableStream = createTrackableInputStream(originalStream, streamClosed);
                final ExtractData result = extractor.getText(trackableStream, null);
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 10.4K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/ExtractorFactoryTest.java

            final Extractor extractor = new Extractor() {
                public ExtractData getText(final InputStream in, final Map<String, String> params) {
                    return null;
                }
            };
    
            assertNull(extractorFactory.getExtractor("test"));
            extractorFactory.addExtractor("test", extractor);
            assertEquals(extractor, extractorFactory.getExtractor("test"));
        }
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.9K bytes
    - Viewed (0)
Back to top