Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 51 - 60 of 61 for Extractor (0.04 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.InputStream;
    import java.util.Map;
    
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.entity.ExtractData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/util/ComponentUtil.java

         */
        public static IntervalControlHelper getIntervalControlHelper() {
            return getComponent(INTERVAL_CONTROL_HELPER);
        }
    
        /**
         * Gets the extractor factory component.
         * @return The extractor factory.
         */
        public static ExtractorFactory getExtractorFactory() {
            return getComponent(EXTRACTOR_FACTORY);
        }
    
        /**
         * Gets a job executor by name.
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 28.9K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

    import org.apache.logging.log4j.Logger;
    import org.apache.tika.config.TikaConfig;
    import org.apache.tika.detect.Detector;
    import org.apache.tika.exception.TikaException;
    import org.apache.tika.extractor.EmbeddedDocumentExtractor;
    import org.apache.tika.extractor.ParsingEmbeddedDocumentExtractor;
    import org.apache.tika.io.TemporaryResources;
    import org.apache.tika.io.TikaInputStream;
    import org.apache.tika.metadata.Metadata;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  4. fess-crawler-lasta/src/main/resources/crawler.xml

    	<include path="crawler/container.xml"/>
    	<include path="crawler/client.xml"/>
    	<include path="crawler/rule.xml"/>
    	<include path="crawler/filter.xml"/>
    	<include path="crawler/interval.xml"/>
    	<include path="crawler/extractor.xml"/>
    	<include path="crawler/mimetype.xml"/>
    	<include path="crawler/encoding.xml"/>
    	<include path="crawler/urlconverter.xml"/>
    	<include path="crawler/log.xml"/>
    	<include path="crawler/sitemaps.xml"/>
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Tue Nov 28 13:40:25 UTC 2017
    - 1.7K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

    import org.codelibs.fess.crawler.entity.AccessResultImpl;
    import org.codelibs.fess.crawler.entity.UrlQueue;
    import org.codelibs.fess.crawler.entity.UrlQueueImpl;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.extractor.impl.TikaExtractor;
    import org.codelibs.fess.crawler.filter.impl.UrlFilterImpl;
    import org.codelibs.fess.crawler.helper.ContentLengthHelper;
    import org.codelibs.fess.crawler.helper.EncodingHelper;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformerTest.java

                    + "</doc>";
    
            final ResponseData responseData = new ResponseData();
            responseData.setResponseBody(ResourceUtil.getResourceAsFile("extractor/test.xml"), false);
            responseData.setCharSet(Constants.UTF_8);
            final ResultData resultData = xmlTransformer.transform(responseData);
            assertEquals(result, new String(resultData.getData(), Constants.UTF_8));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 13.5K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.BufferedInputStream;
    import java.io.IOException;
    import java.io.InputStream;
    import java.nio.charset.Charset;
    import java.util.Map;
    import java.util.regex.Matcher;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  8. src/test/java/org/codelibs/fess/helper/DocumentHelperTest.java

     */
    package org.codelibs.fess.helper;
    
    import java.util.HashMap;
    import java.util.Map;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.extractor.impl.TikaExtractor;
    import org.codelibs.fess.unit.UnitFessTestCase;
    
    public class DocumentHelperTest extends UnitFessTestCase {
    
        @Override
        public void setUp() throws Exception {
            super.setUp();
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 10 13:41:04 UTC 2025
    - 13K bytes
    - Viewed (0)
  9. .github/CODEOWNERS

    platforms/enterprise/enterprise-logging/                @gradle/bt-build-scan @gradle/dv-testing-team
    
    # JVM platform
    platforms/jvm/                                      @gradle/bt-jvm
    platforms/core-configuration/java-api-extractor     @gradle/bt-jvm
    
    # JVM testing services also shared by GE testing plugins
    platforms/jvm/testing-junit-platform/       @gradle/bt-jvm @gradle/dv-testing-team
    Registered: Wed Sep 10 11:36:15 UTC 2025
    - Last Modified: Mon Jul 28 01:45:03 UTC 2025
    - 10.9K bytes
    - Viewed (0)
  10. cmd/signature-v4-parser_test.go

    		t.Errorf("Test %d: scope request mismatch:Expected \"%s\", got \"%s\"", testNum, expectedCredentials.scope.request, actualCredential.scope.request)
    	}
    }
    
    // TestParseCredentialHeader - validates the format validator and extractor for the Credential header in an aws v4 request.
    // A valid format of credential should be of the following format.
    // Credential = accessKey + SlashSeparator+ scope
    // where scope = string.Join([]string{  currTime.Format(yyyymmdd),
    Registered: Sun Sep 07 19:28:11 UTC 2025
    - Last Modified: Tue Feb 18 16:25:55 UTC 2025
    - 27.4K bytes
    - Viewed (0)
Back to top