- Sort Score
- Result 10 results
- Languages All
Results 11 - 20 of 73 for pDf (0.29 sec)
-
fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java
} // Test WildcardBot - wildcard patterns // Disallow: /*.pdf$ - should block .pdf files but not .pdf with query params assertFalse(robotsTxt.allows("/document.pdf", "WildcardBot")); assertFalse(robotsTxt.allows("/files/report.pdf", "WildcardBot")); assertTrue(robotsTxt.allows("/document.pdf?download=true", "WildcardBot")); // $ means exact end
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Mon Nov 24 03:59:47 UTC 2025 - 20.6K bytes - Viewed (0) -
src/main/resources/fess_thumbnail.xml
<property name="commandList"> ["${path}/generate-thumbnail", "pdf", "${url}", "${outputFile}"] </property> <property name="generatorList"> ["${path}/generate-thumbnail"] </property> <postConstruct name="addCondition"> <arg>"mimetype"</arg> <arg>"application/pdf" </arg> </postConstruct> <postConstruct name="register"></postConstruct> </component>
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Dec 04 08:02:36 UTC 2025 - 6K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java
* </p> * * <p> * Example usage: * </p> * * <pre> * {@code * try (InputStream in = new FileInputStream("example.pdf")) { * ExtractData extractData = new ExtractorBuilder(crawlerContainer, in, new HashMap<>()) * .mimeType("application/pdf") * .filename("example.pdf") * .maxContentLength(1024 * 1024) * .extract(); * * String content = extractData.getContent();
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Jul 06 02:13:03 UTC 2025 - 10.1K bytes - Viewed (0) -
src/main/resources/crawler/rule.xml
</postConstruct> <postConstruct name="addRule"> <arg>"mimeType"</arg> <!-- Supported MIME type --> <arg> "(application/xml" + "|application/xhtml+xml" + "|application/rdf+xml" + "|application/pdf" + "|application/x-freemind" + "|text/xml" + "|text/xml-external-parsed-entity)" </arg> </postConstruct> </component> <component name="fsFileRule" class="org.codelibs.fess.crawler.rule.impl.RegexRule" >
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jun 04 08:42:49 UTC 2020 - 4.6K bytes - Viewed (0) -
src/main/java/org/codelibs/fess/helper/FileTypeHelper.java
} } /** * Adds or updates a MIME type to file type mapping. * * @param mimetype the MIME type to map (e.g., "application/pdf") * @param filetype the file type classification (e.g., "pdf") */ public void add(final String mimetype, final String filetype) { mimetypeMap.put(mimetype, filetype); } /**
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Jul 17 08:28:31 UTC 2025 - 4.4K bytes - Viewed (0) -
src/main/java/jcifs/smb1/util/mime.map
application/msword doc # Microsoft Word application/octet-stream bin exe ani # Binary File application/oda oda application/pagemaker pm5 pt5 pm # PageMaker application/pdf pdf # Adobe Acrobat application/postscript ai eps ps # Postscript File application/rtf rtf # Rich Text File application/toolbook tbk # Toolbook
Registered: Sat Dec 20 13:44:44 UTC 2025 - Last Modified: Fri Mar 22 20:39:42 UTC 2019 - 5.9K bytes - Viewed (0) -
fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java
// Presentation Formats extensionMap.put("odp", "pdf"); extensionMap.put("otp", "pdf"); extensionMap.put("sxi", "pdf"); extensionMap.put("ppt", "pdf"); extensionMap.put("pptx", "pdf"); // Drawing Formats extensionMap.put("odg", "svg"); extensionMap.put("otg", "svg"); extractorMap.put("pdf", new PdfExtractor());
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Sun Nov 23 12:19:14 UTC 2025 - 10.4K bytes - Viewed (0) -
fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java
String sessionId = "test-session-019"; urlFilter.init(sessionId); urlFilter.addInclude(".*\\.PDF$"); // Test case sensitivity assertFalse(urlFilter.match("https://example.com/document.pdf")); assertTrue(urlFilter.match("https://example.com/document.PDF")); } /** * Test very long URL handling */ public void test_veryLongUrl() {
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Wed Sep 03 14:42:53 UTC 2025 - 19K bytes - Viewed (0) -
src/main/assemblies/files/generate-thumbnail
if [[ -z "${im_cmd}" ]] ; then echo "ImageMagick (convert or magick) does not exist." exit 1 fi check_command pdftoppm check_command unoconv tmp_pdf_file=/tmp/thumbnail.$$.pdf unoconv -e PageRange=1-1 -o ${tmp_pdf_file} -f pdf "${target_file}" if [[ ! -f ${tmp_pdf_file} ]] ; then echo "unoconv does not work." exit 1 fi tmp_png_prefix=/tmp/thumbnail.png.$$
Registered: Sat Dec 20 09:19:18 UTC 2025 - Last Modified: Thu Dec 04 08:02:36 UTC 2025 - 3.9K bytes - Viewed (0) -
fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_wildcard.txt
# Test robots.txt for wildcard (*) and end-of-path ($) support # Based on RFC 9309 specification # Test wildcard patterns User-agent: WildcardBot Disallow: /*.pdf$ Disallow: /admin/*.php Disallow: /*/private/ Allow: /public/*.html # Test end-of-path ($) patterns User-agent: EndPathBot Disallow: /fish$ Disallow: /temp$ Allow: /fishing # Test complex patterns User-agent: ComplexBot Disallow: / Allow: /$
Registered: Sat Dec 20 11:21:39 UTC 2025 - Last Modified: Thu Nov 13 14:03:41 UTC 2025 - 910 bytes - Viewed (0)