Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 11 for pdfbox (0.26 sec)

  1. fess-crawler/pom.xml

    		</dependency>
    		<dependency>
    			<groupId>org.apache.pdfbox</groupId>
    			<artifactId>pdfbox</artifactId>
    			<version>${pdfbox.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.pdfbox</groupId>
    			<artifactId>pdfbox-tools</artifactId>
    			<version>${pdfbox.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.apache.pdfbox</groupId>
    			<artifactId>fontbox</artifactId>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Dec 20 06:34:36 UTC 2025
    - 12.1K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

    import org.apache.logging.log4j.Logger;
    import org.apache.pdfbox.Loader;
    import org.apache.pdfbox.cos.COSInputStream;
    import org.apache.pdfbox.io.RandomAccessReadBuffer;
    import org.apache.pdfbox.pdmodel.PDDocument;
    import org.apache.pdfbox.pdmodel.PDDocumentInformation;
    import org.apache.pdfbox.pdmodel.PDDocumentNameDictionary;
    import org.apache.pdfbox.pdmodel.PDEmbeddedFilesNameTreeNode;
    import org.apache.pdfbox.pdmodel.PDPage;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  3. src/main/webapp/WEB-INF/env/crawler/resources/log4j2.xml

    				max="${backup.max.history}" compressionLevel="9" />
    		</RollingFile>
    		<Rewrite name="AppFile">
    			<AppenderRef ref="AppRollingFile" />
    			<ErrorToWarnRewritePolicy loggers="org.apache.fontbox,org.apache.pdfbox,org.apache.poi" />
    		</Rewrite>
    		<RollingFile name="StatsFile" fileName="${log.file.basedir}/fess-urls.log"
    			filePattern="${log.file.basedir}/fess-urls${backup.date.suffix}-%i.log.gz">
    			<PatternLayout>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Mon Feb 20 13:05:30 UTC 2023
    - 2.4K bytes
    - Viewed (0)
  4. build-logic-commons/build-platform/build.gradle.kts

            }
            api("org.apache.pdfbox:pdfbox:2.0.24") {
                because("Flexmark 0.34.60 brings in a vulnerable version of pdfbox")
            }
            api("com.google.code.findbugs:jsr305:3.0.2")
            api("org.jspecify:jspecify:1.0.0")
            api("commons-io:commons-io:2.14.0")
            api("org.apache.commons:commons-lang3:3.20.0")
    Registered: Wed Dec 31 11:36:14 UTC 2025
    - Last Modified: Tue Dec 30 10:16:30 UTC 2025
    - 4.6K bytes
    - Viewed (0)
  5. CLAUDE.md

    - **License**: Apache 2.0
    - **DI**: LastaFlute DI
    - **Repo**: https://github.com/codelibs/fess-crawler
    
    ### Tech Stack
    
    - **HTTP**: Apache HttpComponents 4.5+
    - **Extraction**: Apache Tika 3.0+, POI 5.3+, PDFBox 3.0+
    - **Testing**: JUnit 4, UTFlute, Mockito 5.7.0
    - **Storage**: In-memory (default), OpenSearch (optional)
    
    ### Protocols
    
    - **HTTP/HTTPS**: Full crawling, cookies, auth, robots.txt
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
  6. README.md

    ## Technology Stack
    
    - **Java**: 21+ (requires Java 21 or higher)
    - **Build System**: Maven 3.x
    - **DI Container**: LastaFlute DI
    - **HTTP Client**: Apache HttpComponents
    - **Content Extraction**: Apache Tika, Apache POI, PDFBox
    - **Testing**: JUnit 4, UTFlute, Testcontainers
    - **Storage Backends**: OpenSearch, Memory-based
    
    ## Quick Start
    
    ### Prerequisites
    
    - Java 21 or higher
    - Maven 3.6 or higher
    
    ### Installation
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/taglib/FessFunctions.java

    import org.apache.commons.lang3.time.DurationFormatUtils;
    import org.apache.commons.text.StringEscapeUtils;
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.apache.pdfbox.util.DateConverter;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.Constants;
    import org.codelibs.fess.app.web.base.FessAdminAction;
    import org.codelibs.fess.app.web.base.login.FessLoginAssist;
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 25.4K bytes
    - Viewed (1)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractorTest.java

            final String content = extractData.getContent();
            CloseableUtil.closeQuietly(in);
            logger.info(content);
            assertTrue(content.contains("テスト"));
        }
    
        // TODO tika needs to support pdfbox 2.0
        //    public void test_getTika_pdf() {
        //        final InputStream in = ResourceUtil
        //                .getResourceAsStream("extractor/test.pdf");
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.6K bytes
    - Viewed (0)
  9. src/main/resources/fess_config.properties

    -Dlog4j.shutdownHookEnabled=false\n\
    -Dlog4j2.formatMsgNoLookups=true\n\
    -Dlog4j2.disable.jmx=true\n\
    -Dlog4j.skipJansi=true\n\
    -Dsun.java2d.cmm=sun.java2d.cmm.kcms.KcmsServiceProvider\n\
    -Dorg.apache.pdfbox.rendering.UsePureJavaCMYKConversion=true\n\
    
    
    jvm.suggest.options=\
    -Djava.awt.headless=true\n\
    -Dfile.encoding=UTF-8\n\
    -Djna.nosys=true\n\
    -Djdk.io.permissionsUseCanonicalPath=true\n\
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 54.8K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

         * -Dlog4j2.formatMsgNoLookups=true<br>
         * -Dlog4j2.disable.jmx=true<br>
         * -Dlog4j.skipJansi=true<br>
         * -Dsun.java2d.cmm=sun.java2d.cmm.kcms.KcmsServiceProvider<br>
         * -Dorg.apache.pdfbox.rendering.UsePureJavaCMYKConversion=true<br>
         *  */
        String JVM_CRAWLER_OPTIONS = "jvm.crawler.options";
    
        /** The key of the configuration. e.g. -Djava.awt.headless=true<br>
         * -Dfile.encoding=UTF-8<br>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 525.7K bytes
    - Viewed (2)
Back to top