Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 81 - 90 of 342 for "used" (0.08 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            assertTrue(urlFilter.match("https://test.com/page"));
            assertTrue(urlFilter.match("ftp://files.com/document.pdf"));
            assertTrue(urlFilter.match("file:///home/user/file.txt"));
        }
    
        /**
         * Test match with complex URL patterns
         */
        public void test_match_complexUrls() {
            String sessionId = "test-session-010";
            urlFilter.init(sessionId);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

    /**
     * A response processor implementation that handles sitemaps.
     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
     * This class uses a {@link SitemapsHelper} to parse the sitemap XML or text.
     * It then iterates through the sitemaps in the SitemapSet, extracts the URL
     * from each sitemap, and creates a new {@link RequestData} object for each URL.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  3. src/test/java/org/codelibs/opensearch/extension/kuromoji/index/analysis/KuromojiTokenizerFactory.java

            }
            return rule;
        }
    
        public static UserDictionary getUserDictionary(Environment env, Settings settings) {
            if (settings.get(USER_DICT_PATH_OPTION) != null && settings.get(USER_DICT_RULES_OPTION) != null) {
                throw new IllegalArgumentException(
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Mar 15 06:51:20 UTC 2025
    - 4.7K bytes
    - Viewed (0)
  4. src/main/java/org/codelibs/fess/suggest/converter/KatakanaToAlphabetConverter.java

     *
     * <p>
     * This class implements the {@link ReadingConverter} interface and provides a method to convert a given
     * Katakana string into a list of possible Alphabet readings. It uses a predefined mapping of Katakana
     * characters to their Alphabet equivalents, handling both single and double Katakana character combinations.
     * </p>
     *
     * <p>
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 10.8K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

     * and can handle GZIP compressed sitemaps.
     * The class provides methods to check if an input stream is a valid sitemap,
     * and to parse an input stream into a {@link SitemapSet} object.
     * It uses SAX parser for XML sitemaps and XML sitemap indexes,
     * and handles potential exceptions during parsing.
     * The class also includes inner classes for handling XML sitemap and sitemap index parsing.
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

    import org.codelibs.fess.crawler.log.LogType;
    
    /**
     * Implementation of the {@link LogHelper} interface.
     * This class provides methods for logging various events during the crawling process.
     * It uses Log4j2 for logging.
     *
     * <p>
     * The class contains methods for logging different types of events, such as:
     * </p>
     * <ul>
     *   <li>Starting and finishing threads</li>
     *   <li>Starting and cleaning up crawling</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  7. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots.txt

    User-agent: FessCrawler
    Disallow:           # allows all 
    
    User-agent: BruteBot
    Disallow: /
    Allow: /foo/bar/
    Crawl-delay: 1314000
    
    # welcome!
    User-agent: Googlebot
    Crawl-delay: 1
    
    User-agent: *
    Disallow: /private/
    Disallow: /help        # disallows /help.html, /help/index.html, etc.
    Allow: /help/faq.html
    Crawl-delay: 3
    
    User-agent: Crawler
    Disallow: /aaa
    
    User-agent: Crawler/1.0
    Disallow: /bbb
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 566 bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/suggest/index/contents/DefaultContentsParser.java

    /**
     * DefaultContentsParser is an implementation of the ContentsParser interface.
     * It provides methods to parse search words, query logs, and documents into SuggestItem objects.
     *
     * <p>This class uses various utilities such as ReadingConverter, Normalizer, and SuggestAnalyzer
     * to process and analyze the input data.</p>
     *
     * <p>It also handles the exclusion of search words based on certain criteria and manages the
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Fri Jul 04 14:00:23 UTC 2025
    - 15.4K bytes
    - Viewed (0)
  9. .github/workflows/maven.yml

        - "*.x"
    
    jobs:
      build:
    
        runs-on: ubuntu-latest
        env:
          PARENT_BRANCH: main
    
        steps:
        - uses: actions/checkout@v4
        - name: Set up JDK 21
          uses: actions/setup-java@v4
          with:
            java-version: '21'
            distribution: 'temurin'
        - uses: actions/cache@v4
          with:
            path: ~/.m2/repository
            key: ${{ runner.os }}-maven-${{ hashFiles('**/pom.xml') }}
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun May 18 03:08:24 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                final File tempDir = File.createTempFile("crawlerDocRoot", "");
                tempDir.delete();
                tempDir.mkdirs();
    
                final StringBuilder buf = new StringBuilder();
                buf.append("User-agent: *").append('\n');
                buf.append("Disallow: /admin/").append('\n');
                buf.append("Disallow: /websvn/").append('\n');
                final File robotTxtFile = new File(tempDir, "robots.txt");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5K bytes
    - Viewed (0)
Back to top