Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 109 for "from" (0.02 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/Transformer.java

     * and retrieving data from access results.
     */
    public interface Transformer {
    
        /**
         * Transforms the given ResponseData into a ResultData.
         *
         * @param responseData the data to be transformed
         * @return the transformed ResultData
         */
        ResultData transform(ResponseData responseData);
    
        /**
         * Retrieves data from the given AccessResultData object.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.7K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

                xpathAPI.remove();
            }
        }
    
        /**
         * Extracts strings from a document using the specified XPath expression.
         *
         * @param document the DOM document to extract strings from
         * @param path the XPath expression to evaluate
         * @return an array of strings extracted from the document
         */
        protected String[] getStringsByXPath(final Document document, final String path) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

    /**
     * PdfExtractor extracts text content from PDF files using Apache PDFBox.
     * It supports password-protected PDFs and can extract embedded documents and annotations.
     *
     * <p>The extractor runs text extraction in a separate thread with a configurable timeout
     * to prevent hanging on problematic PDF files. It also extracts metadata from the PDF
     * document and includes it in the extraction result.
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/suggest/settings/ArraySettings.java

     * <li>{@link #addToArrayIndex(String, String, String, Map)}: Adds a map to the array index.</li>
     * <li>{@link #deleteKeyFromArray(String, String, String)}: Deletes all entries associated with the specified key from the array index.</li>
     * <li>{@link #deleteFromArray(String, String, String)}: Deletes a specific entry from the array index based on the ID.</li>
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 15.6K bytes
    - Viewed (0)
  5. src/main/java/org/codelibs/fess/suggest/index/writer/SuggestWriter.java

        /**
         * Deletes a suggestion from the specified index.
         *
         * @param client   the client to use for the operation
         * @param settings the settings to use for the operation
         * @param index    the name of the index from which to delete the suggestion
         * @param id       the ID of the suggestion to delete
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 4.1K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
     * It then iterates through the sitemaps in the SitemapSet, extracts the URL
     * from each sitemap, and creates a new {@link RequestData} object for each URL.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  7. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/service/impl/AbstractCrawlerService.java

                        builder.addSort(sortBuilder);
                    }
                }
                if (from != null) {
                    builder.setFrom(from);
                }
                if (size != null) {
                    builder.setSize(size);
                }
            });
        }
    
        /**
         * Retrieves a list of documents from the OpenSearch index using a custom search request builder.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 34.2K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/FilenameExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Extracts the filename from the parameters.
     */
    public class FilenameExtractor extends AbstractExtractor {
    
        /**
         * Constructs a new FilenameExtractor.
         */
        public FilenameExtractor() {
            // Default constructor
        }
    
        /**
         * Extracts the filename from the parameters.
         * @param in The input stream (not used).
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsVisioExtractor.java

    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Gets text from a Visio file.
     *
     * @author shinsuke
     *
     */
    public class MsVisioExtractor extends AbstractExtractor {
    
        /**
         * Creates a new MsVisioExtractor instance.
         */
        public MsVisioExtractor() {
            super();
        }
    
        /**
         * Extracts text from the Visio input stream.
         * @param in The input stream.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

                    throw new ExtractException(e);
                }
            }
    
            return encoding;
        }
    
        /**
         * Extracts text content from the given content by removing tags and processing attributes.
         * @param content The content to extract from.
         * @return The extracted text.
         */
        protected String extractString(final String content) {
            String input = content.replaceAll("[\\r\\n]", " ");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
Back to top