Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 121 - 130 of 353 for extracted (0.04 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/CsvExtractorTest.java

            csvExtractor.setMaxRows(2);
            final InputStream in = ResourceUtil.getResourceAsStream("extractor/csv/test.csv");
            final ExtractData extractData = csvExtractor.getText(in, null);
            CloseableUtil.closeQuietly(in);
    
            final String rowCount = extractData.getValues("row_count")[0];
            // Should extract 2 data rows (header doesn't count toward maxRows)
            assertEquals("2", rowCount);
        }
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 03:46:53 UTC 2025
    - 5.3K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/XmlExtractor.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.util.regex.Pattern;
    
    /**
     * Extracts text content from XML documents.
     */
    public class XmlExtractor extends AbstractXmlExtractor {
    
        /**
         * Creates a new XmlExtractor instance.
         */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/mylasta/action/FessLabels.java

        /** The key of the message: Crawling/Displaying */
        public static final String LABELS_pathmap_pt_both = "{labels.pathmap_pt_both}";
    
        /** The key of the message: Extracted URL Conversion */
        public static final String LABELS_pathmap_pt_stored = "{labels.pathmap_pt_stored}";
    
        /** The key of the message: Regular Name */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 156.4K bytes
    - Viewed (0)
  4. CLAUDE.md

    ```
    
    4. **Add tests**: Unit + integration
    
    ### Adding a Content Extractor
    
    1. **Implement `Extractor`**:
    ```java
    /**
     * Example skeleton of a custom content extractor built on {@code AbstractExtractor}.
     */
    public class MyExtractor extends AbstractExtractor {
        /**
         * Creates an {@code ExtractData}, stores the extracted text as its content, and returns it.
         *
         * @param in input stream handed to the extractor (presumably the document to read;
         *           this skeleton does not show the reading step)
         * @param params string key/value parameters; not referenced in this skeleton
         * @return a newly created {@code ExtractData} whose content has been set
         */
        @Override
        public ExtractData getText(InputStream in, Map<String, String> params) {
            ExtractData data = new ExtractData();
            // Extract text
            // NOTE(review): extractedText is not declared in this snippet; it appears to be a
            // placeholder for the result of the extraction step above and must be supplied
            // by a real implementation.
            data.setContent(extractedText);
            return data;
        }
    }
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
  5. build-logic/documentation/src/main/groovy/gradlebuild/docs/dsl/source/ExtractDslMetaDataTask.groovy

    import org.gradle.api.tasks.OutputFile
    import org.gradle.api.tasks.PathSensitive
    import org.gradle.api.tasks.PathSensitivity
    import org.gradle.api.tasks.SourceTask
    import org.gradle.api.tasks.TaskAction
    
    /**
     * Extracts meta-data from the Groovy and Java source files which make up the Gradle API. Persists the meta-data to a file
     * for later use in generating documentation for the DSL, such as by {@link gradlebuild.docs.dsl.docbook.AssembleDslDocTask}.
    Registered: Wed Dec 31 11:36:14 UTC 2025
    - Last Modified: Mon Jan 08 12:45:57 UTC 2024
    - 4.4K bytes
    - Viewed (0)
  6. src/main/java/org/codelibs/fess/helper/RelatedQueryHelper.java

            this.relatedQueryMap = relatedQueryMap;
            return relatedQueryMap.size();
        }
    
        /**
         * Extracts the virtual host key from a RelatedQuery entity.
         * If the virtual host is blank or null, returns an empty string.
         *
         * @param entity the RelatedQuery entity to extract the host key from
         * @return the virtual host key, or empty string if blank or null
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 5.1K bytes
    - Viewed (0)
  7. impl/maven-cli/src/main/java/org/apache/maven/cling/invoker/mvnup/goals/AbstractUpgradeStrategy.java

            if (result.errorCount() > 0) {
                context.info(result.errorCount() + " POM(s) had errors");
            }
            context.unindent();
        }
    
        /**
         * Extracts an Artifact from a POM document with parent resolution.
         * If groupId or version are missing, attempts to resolve from parent.
         *
         * <p>This method handles Maven's inheritance mechanism where groupId and version
    Registered: Sun Dec 28 03:35:09 UTC 2025
    - Last Modified: Tue Nov 18 18:03:26 UTC 2025
    - 7.1K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

        String getCrawlerDocumentHtmlPrunedTags();
    
        /**
         * Get the value for the key 'crawler.document.html.max.digest.length'. <br>
         * The value is, e.g. 120 <br>
         * comment: Maximum length of digest extracted from HTML documents.
         * @return The value of found property. (NotNull: if not found, exception but basically no way)
         */
        String getCrawlerDocumentHtmlMaxDigestLength();
    
        /**
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 525.7K bytes
    - Viewed (2)
  9. src/main/java/org/codelibs/fess/app/service/FailureUrlService.java

                op.setRefreshPolicy(Constants.TRUE);
            });
            return failureUrl;
        }
    
        /**
         * Extracts and returns the stack trace from a throwable as a string.
         * The stack trace is abbreviated if it exceeds the configured maximum length.
         *
         * @param t the throwable to extract the stack trace from
         * @return the stack trace as a string, or empty string if extraction fails
         */
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 9.2K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/impl/MimeTypeHelperImplTest.java

            assertContentType("application/pdf", "extractor/test.pdf", "hoge.pdf");
    
            assertContentType("application/gzip", "extractor/gz/test.tar.gz", "hoge.tar.gz");
            assertContentType("application/zip", "extractor/zip/test.zip", "hoge.zip");
            assertContentType("application/x-lharc", "extractor/lha/test.lzh", "hoge.lzh"); // TODO is it correct?
    
            assertContentType("application/xml", "extractor/test.mm", "hoge.mm");
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 11.6K bytes
    - Viewed (0)
Back to top