- Sort Score
- Result 10 results
- Languages All
Results 81 - 90 of 130 for extraction (0.28 sec)
-
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractorTest.java
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, * either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.io.CloseableUtil; import org.codelibs.core.io.ResourceUtil;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 2.1K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java
* governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import java.util.Map; import org.apache.poi.hdgf.extractor.VisioTextExtractor; import org.codelibs.fess.crawler.entity.ExtractData; import org.codelibs.fess.crawler.exception.CrawlerSystemException;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 12:19:14 UTC 2025 - 1.9K bytes - Viewed (0) -
fess-crawler/src/test/resources/extractor/json/test.json
{ "title": "Sample Document", "author": "John Doe", "version": "1.0", "published": "2025-01-15", "tags": ["crawler", "extractor", "json"], "content": { "summary": "This is a sample JSON document for testing", "body": "The extractor should handle nested objects and arrays properly" }, "metadata": { "created_at": "2025-01-01T00:00:00Z", "updated_at": "2025-01-15T12:00:00Z" }
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 03:46:53 UTC 2025 - 412 bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java
final Extractor extractor = getExtractor(outExt); if (extractor != null) { final Map<String, String> params = new HashMap<>(); params.put(ExtractData.RESOURCE_NAME_KEY, outputFile.getName()); try (final FileInputStream in = new FileInputStream(outputFile)) { final ExtractData extractData = extractor.getText(in, params);
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 12:19:14 UTC 2025 - 10.4K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractorTest.java
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, * either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import java.util.HashMap; import java.util.Map; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.io.CloseableUtil;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 7.6K bytes - Viewed (0) -
.github/ISSUE_TEMPLATE/02-pkgsite-removal.yml
If the package path doesn't include your github username, please provide some other form of proof of ownership. validations: required: true - type: textarea id: retraction-reason attributes: label: "What is the reason that you could not retract this package instead?" description: | Requesting we remove a module here only hides the generated documentation on pkg.go.dev.
Registered: Tue Dec 30 11:13:12 UTC 2025 - Last Modified: Thu Jan 04 23:31:17 UTC 2024 - 1.9K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TextExtractorTest.java
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, * either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.InputStream; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.io.CloseableUtil; import org.codelibs.core.io.ResourceUtil;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 2K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractorTest.java
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, * either express or implied. See the License for the specific language * governing permissions and limitations under the License. */ package org.codelibs.fess.crawler.extractor.impl; import java.io.IOException; import java.io.InputStream; import org.apache.logging.log4j.LogManager; import org.apache.logging.log4j.Logger; import org.codelibs.core.io.ResourceUtil;
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 4.6K bytes - Viewed (1) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/TextTransformerTest.java
import org.codelibs.fess.crawler.entity.ResponseData; import org.codelibs.fess.crawler.entity.ResultData; import org.codelibs.fess.crawler.exception.CrawlerSystemException; import org.codelibs.fess.crawler.extractor.ExtractorFactory; import org.codelibs.fess.crawler.extractor.impl.TikaExtractor; import org.dbflute.utflute.core.PlainTestCase; /** * @author shinsuke * */ public class TextTransformerTest extends PlainTestCase {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Aug 07 02:55:08 UTC 2025 - 4.6K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractorTest.java
final BufferedInputStream bis = new BufferedInputStream(in); final String encoding = htmlExtractor.getEncoding(bis); CloseableUtil.closeQuietly(bis); assertEquals("UTF-8", encoding); } public void test_getEncoding_sjis() { final InputStream in = ResourceUtil.getResourceAsStream("extractor/test_sjis.html");
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sat Mar 15 06:52:00 UTC 2025 - 3.7K bytes - Viewed (0)