- Sort Score
- Result 10 results
- Languages All
Results 51 - 60 of 61 for Extractor (0.05 sec)
-
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, * either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import java.util.Map; import org.codelibs.core.lang.StringUtil; import org.codelibs.fess.crawler.entity.ExtractData;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 1.9K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/util/ComponentUtil.java
*/ public static IntervalControlHelper getIntervalControlHelper() { return getComponent(INTERVAL_CONTROL_HELPER); } /** * Gets the extractor factory component. * @return The extractor factory. */ public static ExtractorFactory getExtractorFactory() { return getComponent(EXTRACTOR_FACTORY); } /** * Gets a job executor by name.
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 28.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java
import org.apache.logging.log4j.Logger; import org.apache.tika.config.TikaConfig; import org.apache.tika.detect.Detector; import org.apache.tika.exception.TikaException; import org.apache.tika.extractor.EmbeddedDocumentExtractor; import org.apache.tika.extractor.ParsingEmbeddedDocumentExtractor; import org.apache.tika.io.TemporaryResources; import org.apache.tika.io.TikaInputStream; import org.apache.tika.metadata.Metadata;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 30.7K bytes - Viewed (0) -
fess-crawler-lasta/src/main/resources/crawler.xml
<include path="crawler/container.xml"/> <include path="crawler/client.xml"/> <include path="crawler/rule.xml"/> <include path="crawler/filter.xml"/> <include path="crawler/interval.xml"/> <include path="crawler/extractor.xml"/> <include path="crawler/mimetype.xml"/> <include path="crawler/encoding.xml"/> <include path="crawler/urlconverter.xml"/> <include path="crawler/log.xml"/> <include path="crawler/sitemaps.xml"/>
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Tue Nov 28 13:40:25 UTC 2017 - 1.7K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java
import org.codelibs.fess.crawler.entity.AccessResultImpl; import org.codelibs.fess.crawler.entity.UrlQueue; import org.codelibs.fess.crawler.entity.UrlQueueImpl; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.extractor.impl.TikaExtractor; import org.codelibs.fess.crawler.filter.impl.UrlFilterImpl; import org.codelibs.fess.crawler.helper.ContentLengthHelper; import org.codelibs.fess.crawler.helper.EncodingHelper;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Sep 06 04:15:37 UTC 2025 - 19.1K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XmlTransformerTest.java
+ "</doc>"; final ResponseData responseData = new ResponseData(); responseData.setResponseBody(ResourceUtil.getResourceAsFile("extractor/test.xml"), false); responseData.setCharSet(Constants.UTF_8); final ResultData resultData = xmlTransformer.transform(responseData); assertEquals(result, new String(resultData.getData(), Constants.UTF_8));
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 13.5K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, * either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.BufferedInputStream; import java.io.IOException; import java.io.InputStream; import java.nio.charset.Charset; import java.util.Map; import java.util.regex.Matcher;
Registered: Sun Sep 21 03:50:09 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 8.5K bytes - Viewed (0) -
src/test/java/org/codelibs/fess/helper/DocumentHelperTest.java
*/ package org.codelibs.fess.helper; import java.util.HashMap; import java.util.Map; import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.extractor.impl.TikaExtractor; import org.codelibs.fess.unit.UnitFessTestCase; public class DocumentHelperTest extends UnitFessTestCase { @Override public void setUp() throws Exception { super.setUp();
Registered: Thu Sep 04 12:52:25 UTC 2025 - Last Modified: Thu Jul 10 13:41:04 UTC 2025 - 13K bytes - Viewed (0) -
.github/CODEOWNERS
platforms/enterprise/enterprise-logging/ @gradle/bt-build-scan @gradle/dv-testing-team # JVM platform platforms/jvm/ @gradle/bt-jvm platforms/core-configuration/java-api-extractor @gradle/bt-jvm # JVM testing services also shared by GE testing plugins platforms/jvm/testing-junit-platform/ @gradle/bt-jvm @gradle/dv-testing-team
Registered: Wed Sep 10 11:36:15 UTC 2025 - Last Modified: Mon Jul 28 01:45:03 UTC 2025 - 10.9K bytes - Viewed (0) -
cmd/signature-v4-parser_test.go
t.Errorf("Test %d: scope request mismatch:Expected \"%s\", got \"%s\"", testNum, expectedCredentials.scope.request, actualCredential.scope.request) } } // TestParseCredentialHeader - validates the format validator and extractor for the Credential header in an aws v4 request. // A valid format of credential should be of the following format. // Credential = accessKey + SlashSeparator+ scope // where scope = string.Join([]string{ currTime.Format(yyyymmdd),
Registered: Sun Sep 07 19:28:11 UTC 2025 - Last Modified: Tue Feb 18 16:25:55 UTC 2025 - 27.4K bytes - Viewed (0)