Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 10 of 24 for annotations (0.07 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

        /**
         * Extracts text from file attachments in PDF annotations.
         * @param doc the PDF document
         * @param writer the writer to append extracted text to
         */
        protected void extractAnnotations(final PDDocument doc, final StringWriter writer) {
            for (final PDPage page : doc.getPages()) {
                try {
                    for (final PDAnnotation annotation : page.getAnnotations()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
  2. fess-crawler/pom.xml

    			<artifactId>httpclient-cache</artifactId>
    			<version>${httpcomponents.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>jakarta.annotation</groupId>
    			<artifactId>jakarta.annotation-api</artifactId>
    			<version>${jakarta.annotation.api.version}</version>
    		</dependency>
    		<dependency>
    			<groupId>org.codelibs</groupId>
    			<artifactId>nekohtml</artifactId>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.3K bytes
    - Viewed (0)
  3. LICENSE

          "Derivative Works" shall mean any work, whether in Source or Object
          form, that is based on (or derived from) the Work and for which the
          editorial revisions, annotations, elaborations, or other modifications
          represent, as a whole, an original work of authorship. For the purposes
          of this License, Derivative Works shall not include works that remain
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Jan 11 04:30:09 UTC 2021
    - 11.1K bytes
    - Viewed (0)
  4. LICENSE

          "Derivative Works" shall mean any work, whether in Source or Object
          form, that is based on (or derived from) the Work and for which the
          editorial revisions, annotations, elaborations, or other modifications
          represent, as a whole, an original work of authorship. For the purposes
          of this License, Derivative Works shall not include works that remain
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Mon Jan 11 04:26:17 UTC 2021
    - 11.1K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/container/StandardCrawlerContainer.java

    import org.codelibs.core.lang.ClassUtil;
    import org.codelibs.core.lang.FieldUtil;
    import org.codelibs.core.lang.MethodUtil;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    import jakarta.annotation.Resource;
    
    /**
     * A container implementation that manages the lifecycle and dependency injection of components
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.3K bytes
    - Viewed (0)
  6. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/OpenSearchUrlQueueService.java

    import org.opensearch.search.SearchHits;
    import org.opensearch.search.sort.SortBuilders;
    import org.opensearch.search.sort.SortOrder;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    import jakarta.annotation.Resource;
    
    /**
     * OpenSearchUrlQueueService is an implementation of {@link UrlQueueService} for OpenSearch.
     *
     * @author shinsuke
     *
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 17K bytes
    - Viewed (1)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/JodExtractor.java

    import org.jodconverter.core.office.OfficeException;
    import org.jodconverter.core.office.OfficeManager;
    import org.jodconverter.local.LocalConverter;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    
    /**
     * Extracts text content from various document formats using JODConverter.
     */
    public class JodExtractor extends AbstractExtractor {
        /** Logger for this class. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractor.java

    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    import com.google.common.base.Charsets;
    
    import jakarta.annotation.PostConstruct;
    import jakarta.annotation.PreDestroy;
    
    /**
     * Extract a text by using external http server.
     */
    public class ApiExtractor extends AbstractExtractor {
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.2K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/smb1/SmbClient.java

    import org.codelibs.fess.crawler.exception.MaxLengthExceededException;
    import org.codelibs.fess.crawler.helper.ContentLengthHelper;
    import org.codelibs.fess.crawler.helper.MimeTypeHelper;
    
    import jakarta.annotation.Resource;
    import org.codelibs.jcifs.smb1.Config;
    import org.codelibs.jcifs.smb1.ACE;
    import org.codelibs.jcifs.smb1.NtlmPasswordAuthentication;
    import org.codelibs.jcifs.smb1.SID;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Sep 18 09:30:45 UTC 2025
    - 23K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractor.java

    import org.w3c.dom.Node;
    import org.xml.sax.InputSource;
    
    import com.google.common.cache.CacheBuilder;
    import com.google.common.cache.CacheLoader;
    import com.google.common.cache.LoadingCache;
    
    import jakarta.annotation.Resource;
    
    /**
     * {@link HtmlXpathExtractor} is an implementation of the {@link org.codelibs.fess.crawler.extractor.Extractor} interface.
     * It uses XPath expressions to extract text content from HTML documents.
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.3K bytes
    - Viewed (0)
Back to top