Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 354 for extract (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

                dfos = out;
                CopyUtil.copy(in, out);
                out.flush();
    
                Extractor extractor = StringUtil.isBlank(mimeType) ? null : extractorFactory.getExtractor(mimeType);
                if (extractor == null) {
                    final String detectedMimeType = getMimeType(out);
                    extractor = extractorFactory.getExtractor(detectedMimeType);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractor.java

        public void setMailProperties(final Properties mailProperties) {
            this.mailProperties = mailProperties;
        }
    
        /**
         * Extracts the body text from a MIME message.
         *
         * @param message the MIME message to extract text from
         * @return the extracted body text
         * @throws ExtractException if extraction fails
         */
        protected String getBodyText(final MimeMessage message) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.6K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    
    import jakarta.annotation.Resource;
    
    /**
     * TextTransformer is a class that transforms a ResponseData object into a ResultData object containing the extracted text content.
     * It uses an Extractor to extract the text from the response body based on the MIME type.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  4. cmd/batch-job-common-types.go

    	line, col int
    	Key       string `yaml:"key" json:"key"`
    	Value     string `yaml:"value" json:"value"`
    }
    
    var _ yaml.Unmarshaler = &BatchJobKV{}
    
    // UnmarshalYAML - BatchJobKV extends default unmarshal to extract line, col information.
    func (kv *BatchJobKV) UnmarshalYAML(val *yaml.Node) error {
    	type jobKV BatchJobKV
    	var tmp jobKV
    	err := val.Decode(&tmp)
    	if err != nil {
    		return err
    	}
    	*kv = BatchJobKV(tmp)
    Registered: Sun Sep 07 19:28:11 UTC 2025
    - Last Modified: Fri Aug 29 02:39:48 UTC 2025
    - 7.9K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractor.java

                    logger.error("Failed to close httpClient.", e);
                }
            }
        }
    
        /**
         * Extracts text from the input stream using the API endpoint.
         *
         * @param in the input stream to extract text from
         * @param params additional parameters
         * @return the extracted data
         * @throws ExtractException if extraction fails
         */
        @Override
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.2K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/LhaExtractor.java

    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.helper.MimeTypeHelper;
    import org.codelibs.fess.crawler.util.IgnoreCloseInputStream;
    
    import jp.gr.java_conf.dangan.util.lha.LhaFile;
    import jp.gr.java_conf.dangan.util.lha.LhaHeader;
    
    /**
     * Extractor implementation for LHA (LZH) archive files.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 5.8K bytes
    - Viewed (0)
  7. src/main/java/jcifs/internal/smb2/persistent/HandleGuid.java

            ByteBuffer bb = ByteBuffer.wrap(result).order(java.nio.ByteOrder.LITTLE_ENDIAN);
    
            long mostSig = guid.getMostSignificantBits();
            long leastSig = guid.getLeastSignificantBits();
    
            // Extract GUID components from UUID
            int data1 = (int) (mostSig >>> 32); // first 4 bytes
            short data2 = (short) (mostSig >>> 16); // next 2 bytes
            short data3 = (short) mostSig; // next 2 bytes
    
    Registered: Sun Sep 07 00:10:21 UTC 2025
    - Last Modified: Sat Aug 23 02:21:31 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/helper/PermissionHelper.java

            this.userPrefix = userPrefix;
        }
    
        /**
         * Extracts role type information from SMB (Server Message Block) response data.
         * Processes both SMB and SMB1 protocols to extract allowed and denied SIDs.
         *
         * @param responseData the response data containing SMB metadata
         * @return a list of role type strings extracted from the SMB permissions
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/form/FormScheme.java

                    logger.debug("Logged in {}", originalLoginUrl);
                }
            });
    
        }
    
        /**
         * Parses the token page and extracts token information.
         * @param tokenPattern The regex pattern to extract the token.
         * @param responseParams The list to store response parameters.
         * @param entity The HTTP entity containing the token page content.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.3K bytes
    - Viewed (1)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/PdfExtractor.java

    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.crawler.helper.MimeTypeHelper;
    
    /**
     * PdfExtractor extracts text content from PDF files using Apache PDFBox.
     * It supports password-protected PDFs and can extract embedded documents and annotations.
     *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 12.7K bytes
    - Viewed (0)
Back to top