Search Options

Results per page
Sort
Preferred Languages
Advance

Results 11 - 20 of 73 for pDf (0.29 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

            }
    
            // Test WildcardBot - wildcard patterns
            // Disallow: /*.pdf$ - should block .pdf files but not .pdf with query params
            assertFalse(robotsTxt.allows("/document.pdf", "WildcardBot"));
            assertFalse(robotsTxt.allows("/files/report.pdf", "WildcardBot"));
            assertTrue(robotsTxt.allows("/document.pdf?download=true", "WildcardBot")); // $ means exact end
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 20.6K bytes
    - Viewed (0)
  2. src/main/resources/fess_thumbnail.xml

    		<property name="commandList">
    			["${path}/generate-thumbnail",
    			"pdf",
    			"${url}",
    			"${outputFile}"]
    		</property>
    		<property name="generatorList">
    			["${path}/generate-thumbnail"]
    		</property>
    		<postConstruct name="addCondition">
    			<arg>"mimetype"</arg>
    			<arg>"application/pdf"
    			</arg>
    		</postConstruct>
    		<postConstruct name="register"></postConstruct>
    	</component>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 04 08:02:36 UTC 2025
    - 6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

     * </p>
     *
     * <p>
     * Example usage:
     * </p>
     *
     * <pre>
     * {@code
     * try (InputStream in = new FileInputStream("example.pdf")) {
     *     ExtractData extractData = new ExtractorBuilder(crawlerContainer, in, new HashMap<>())
     *         .mimeType("application/pdf")
     *         .filename("example.pdf")
     *         .maxContentLength(1024 * 1024)
     *         .extract();
     *
     *     String content = extractData.getContent();
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
  4. src/main/resources/crawler/rule.xml

    		</postConstruct>
    		<postConstruct name="addRule">
    			<arg>"mimeType"</arg>
    			<!-- Supported MIME type -->
    			<arg>
      "(application/xml"
    + "|application/xhtml+xml"
    + "|application/rdf+xml"
    + "|application/pdf"
    + "|application/x-freemind"
    + "|text/xml"
    + "|text/xml-external-parsed-entity)"
    			</arg>
    		</postConstruct>
    	</component>
    
    	<component name="fsFileRule" class="org.codelibs.fess.crawler.rule.impl.RegexRule" >
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jun 04 08:42:49 UTC 2020
    - 4.6K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/helper/FileTypeHelper.java

            }
        }
    
        /**
         * Adds or updates a MIME type to file type mapping.
         *
         * @param mimetype the MIME type to map (e.g., "application/pdf")
         * @param filetype the file type classification (e.g., "pdf")
         */
        public void add(final String mimetype, final String filetype) {
            mimetypeMap.put(mimetype, filetype);
        }
    
        /**
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.4K bytes
    - Viewed (0)
  6. src/main/java/jcifs/smb1/util/mime.map

    application/msword             doc              # Microsoft Word
    application/octet-stream       bin exe ani      # Binary File
    application/oda                oda
    application/pagemaker          pm5 pt5 pm       # PageMaker
    application/pdf                pdf              # Adobe Acrobat
    application/postscript         ai eps ps        # Postscript File
    application/rtf                rtf              # Rich Text File
    application/toolbook           tbk              # Toolbook
    Registered: Sat Dec 20 13:44:44 UTC 2025
    - Last Modified: Fri Mar 22 20:39:42 UTC 2019
    - 5.9K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

            // Presentation Formats
            extensionMap.put("odp", "pdf");
            extensionMap.put("otp", "pdf");
            extensionMap.put("sxi", "pdf");
            extensionMap.put("ppt", "pdf");
            extensionMap.put("pptx", "pdf");
            // Drawing Formats
            extensionMap.put("odg", "svg");
            extensionMap.put("otg", "svg");
    
            extractorMap.put("pdf", new PdfExtractor());
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 10.4K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            String sessionId = "test-session-019";
            urlFilter.init(sessionId);
    
            urlFilter.addInclude(".*\\.PDF$");
    
            // Test case sensitivity
            assertFalse(urlFilter.match("https://example.com/document.pdf"));
            assertTrue(urlFilter.match("https://example.com/document.PDF"));
        }
    
        /**
         * Test very long URL handling
         */
        public void test_veryLongUrl() {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  9. src/main/assemblies/files/generate-thumbnail

      if [[ -z "${im_cmd}" ]] ; then
        echo "ImageMagick (convert or magick) does not exist."
        exit 1
      fi
      check_command pdftoppm
      check_command unoconv
      tmp_pdf_file=/tmp/thumbnail.$$.pdf
      unoconv -e PageRange=1-1 -o ${tmp_pdf_file} -f pdf "${target_file}"
      if [[ ! -f ${tmp_pdf_file} ]] ; then
        echo "unoconv does not work."
        exit 1
      fi
      tmp_png_prefix=/tmp/thumbnail.png.$$
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 04 08:02:36 UTC 2025
    - 3.9K bytes
    - Viewed (0)
  10. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots_wildcard.txt

    # Test robots.txt for wildcard (*) and end-of-path ($) support
    # Based on RFC 9309 specification
    
    # Test wildcard patterns
    User-agent: WildcardBot
    Disallow: /*.pdf$
    Disallow: /admin/*.php
    Disallow: /*/private/
    Allow: /public/*.html
    
    # Test end-of-path ($) patterns
    User-agent: EndPathBot
    Disallow: /fish$
    Disallow: /temp$
    Allow: /fishing
    
    # Test complex patterns
    User-agent: ComplexBot
    Disallow: /
    Allow: /$
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 14:03:41 UTC 2025
    - 910 bytes
    - Viewed (0)
Back to top