Search Options

Results per page
Sort
Preferred Languages
Advance

Results 81 - 90 of 169 for Watch (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/RuleManagerImpl.java

         * Gets the first rule that matches the given response data.
         * @param responseData the response data to match against
         * @return the first matching rule, or null if no rule matches
         */
        @Override
        public Rule getRule(final ResponseData responseData) {
            for (final Rule rule : ruleList) {
                if (rule.match(responseData)) {
                    return rule;
                }
            }
            return null;
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/rule/impl/SitemapsRuleTest.java

            assertTrue(sitemapsRule.match(responseData));
            InputStream is = responseData.getResponseBody();
            assertTrue(is instanceof InputStream);
            CloseableUtil.closeQuietly(responseData);
        }
    
        private void assertMatchFalse(ResponseData responseData) {
            sitemapsRule.addRule("url", Pattern.compile(".*sitemap.*"));
            assertFalse(sitemapsRule.match(responseData));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/form/FormScheme.java

                    } else {
                        String content;
                        try {
                            content = new String(InputStreamUtil.getBytes(entity.getContent()), Constants.UTF_8_CHARSET);
                        } catch (final IOException e) {
                            content = e.getMessage();
                        }
                        logger.warn("Failed to access to {}. The http status is {}.\n{}", tokenUrl, httpStatusCode, content);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.3K bytes
    - Viewed (1)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/filter/UrlFilter.java

         */
        void init(String sessionId);
    
        /**
         * Check if a given url is a target.
         *
         * @param url URL
         * @return true if url is matched
         */
        boolean match(String url);
    
        /**
         * Add an url pattern as a target.
         *
         * @param urlPattern Regular expression that is crawled
         */
        void addInclude(String urlPattern);
    
        /**
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.6K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/transformer/impl/FileTransformer.java

                    CopyUtil.copy(is, os);
                } catch (final IOException e) {
                    throw new CrawlerSystemException("Could not store " + file.getAbsolutePath(), e);
                }
            }
            try {
                resultData.setData(path.getBytes(charsetName));
            } catch (final UnsupportedEncodingException e) {
                if (logger.isInfoEnabled()) {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

     * </ul>
     *
     * <p>The class uses case-insensitive pattern matching for user agents and supports
     * wildcard characters (*) in user agent strings. When multiple directives match a user agent,
     * the most specific (longest) match is used.</p>
     *
     */
    public class RobotsTxt {
        private static final String ALL_BOTS = "*";
    
        /** Map of user agent patterns to their corresponding directives. */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/MsWordExtractorTest.java

            logger.info(content);
            assertTrue(content.contains("ใƒ†ใ‚นใƒˆ"));
        }
    
        public void test_getText_null() {
            try {
                msWordExtractor.getText(null, null);
                fail();
            } catch (final CrawlerSystemException e) {
                // NOP
            }
        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPublisherExtractor.java

                @SuppressWarnings("resource")
                final PublisherTextExtractor publisherTextExtractor = new PublisherTextExtractor(in);
                return new ExtractData(publisherTextExtractor.getText());
            } catch (final IOException e) {
                throw new ExtractException(e);
            }
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/AbstractIntervalController.java

                    break;
                default:
                    // No operation
                    break;
                }
            } catch (final CrawlerSystemException e) {
                if (!ignoreException) {
                    throw e;
                }
            } catch (final Exception e) {
                if (!ignoreException) {
                    throw new CrawlerSystemException("Could not stop a process.", e);
                }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/HostIntervalController.java

                            break;
                        }
                        lastTime.wait(delayTime);
                    }
                }
            } catch (final InterruptedException e) {
                throw new InterruptedRuntimeException(e);
            } catch (final Exception e) {
                throw new CrawlerSystemException(e);
            }
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
Back to top