Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 41 - 50 of 50 for getText (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/TextTransformer.java

            params.put(ExtractData.CONTENT_TYPE, responseData.getMimeType());
            String content = null;
            try (final InputStream in = responseData.getResponseBody()) {
                content = extractor.getText(in, params).getContent();
            } catch (final Exception e) {
                throw new CrawlingAccessException("Could not extract data.", e);
            }
    
            final ResultData resultData = new ResultData();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  2. src/main/java/org/codelibs/fess/suggest/util/SuggestUtil.java

         */
        public static String createBulkLine(final String index, final String type, final SuggestItem item) {
            if (item == null || item.getId() == null || item.getText() == null) {
                throw new SuggesterException("Invalid SuggestItem: item, id, or text is null");
            }
    
            final Map<String, Object> firstLineMap = new HashMap<>();
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Mon Sep 01 13:33:03 UTC 2025
    - 17.4K bytes
    - Viewed (1)
  3. README.md

    crawler.awaitTermination();
    System.out.println("Crawling completed");
    ```
    
    ### Custom Content Extractor
    
    ```java
    public class CustomExtractor extends AbstractExtractor {
        @Override
        public ExtractData getText(final InputStream inputStream, final Map<String, String> params) {
            // Custom extraction logic
            ExtractData extractData = new ExtractData();
            // ... implementation
            return extractData;
        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

        /**
         * Returns the pattern used to identify tags in the content.
         * @return The tag pattern.
         */
        protected abstract Pattern getTagPattern();
    
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (in == null) {
                throw new CrawlerSystemException("The inputstream is null.");
            }
            try {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/ExtractorBuilder.java

                    }
                    return new ExtractData(StringUtil.EMPTY);
                } else {
                    try (InputStream is = getContentInputStream(out)) {
                        return extractor.getText(is, params);
                    }
                }
            } catch (final CrawlingAccessException e) {
                throw e;
            } catch (final Exception e) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10.1K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractor.java

         * @param params additional parameters
         * @return the extracted data
         * @throws ExtractException if extraction fails
         */
        @Override
        public ExtractData getText(final InputStream in, final Map<String, String> params) {
            if (logger.isDebugEnabled()) {
                logger.debug("Accessing {}", url);
            }
    
            // start
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.2K bytes
    - Viewed (0)
  7. src/test/java/org/codelibs/fess/suggest/SuggesterTest.java

            final List<SuggestItem> items = response.getItems();
            assertEquals(1, response.getNum());
            assertEquals("検索 エンジン", items.get(0).getText());
        }
    
        @Test
        public void test_indexFromSearchWordExclude() throws Exception {
            SuggestIndexResponse indexResponse = suggester.indexer().indexFromSearchWord("。」", null, null, null, 1, null);
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Thu Aug 07 02:41:28 UTC 2025
    - 37.2K bytes
    - Viewed (0)
  8. fess-crawler/src/test/resources/ajax/js/jquery-2.1.1.min.js

    Error("Syntax error, unrecognized expression: "+a)},fb.uniqueSort=function(a){var b,d=[],e=0,f=0;if(l=!c.detectDuplicates,k=!c.sortStable&&a.slice(0),a.sort(B),l){while(b=a[f++])b===a[f]&&(e=d.push(f));while(e--)a.splice(d[e],1)}return k=null,a},e=fb.getText=function(a){var b,c="",d=0,f=a.nodeType;if(f){if(1===f||9===f||11===f){if("string"==typeof a.textContent)return a.textContent;for(a=a.firstChild;a;a=a.nextSibling)c+=e(a)}else if(3===f||4===f)return a.nodeValue}else while(b=a[d++])c+=e(b);return ...
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 82.3K bytes
    - Viewed (0)
  9. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"text/x-prolog",
    				"text/x-python",
    				"text/x-rst",
    				"text/x-rexx",
    				"text/x-ruby",
    				"text/x-scala",
    				"text/x-scheme",
    				"text/x-sed",
    				"text/x-sql",
    				"text/x-setext",
    				"text/x-stsrc",
    				"text/x-tcl",
    				"text/x-uuencode",
    				"text/x-vbasic",
    				"text/x-vbdotnet",
    				"text/x-vbscript",
    				"text/x-vcalendar",
    				"text/x-vcard",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  10. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

      </mime-type>
    
      <mime-type type="text/x-sql">
        <_comment>SQL code</_comment>
        <glob pattern="*.sql"/>
        <sub-class-of type="text/plain"/>
      </mime-type>
    
      <mime-type type="text/x-setext">
        <glob pattern="*.etx"/>
        <sub-class-of type="text/plain"/>
      </mime-type>
    
      <mime-type type="text/x-stsrc">
        <_comment>Smalltalk source code</_comment>
        <glob pattern="*.st"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
Back to top