Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 81 - 90 of 104 for url (0.01 sec)

  1. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                buf.append("<url>").append('\n');
                buf.append("<loc>http://localhost:7070/index.html</loc>").append('\n');
                buf.append("<loc>http://localhost:7070/file").append(count).append("-1.html").append("</loc>").append('\n');
                buf.append("</url>").append('\n');
                buf.append("</urlset>").append('\n');
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java

            this.charset = charset;
        }
    
        /**
         * Executes a HEAD request for the given URL.
         * @param url The URL to request.
         * @return The ResponseData.
         */
        @Override
        public ResponseData doHead(final String url) {
            try {
                final ResponseData responseData = processRequest(url, false);
                responseData.setMethod(Constants.HEAD_METHOD);
                return responseData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  3. fess-crawler-opensearch/src/main/resources/mapping/filter.json

    {
        "properties": {
          "sessionId": {
            "type": "keyword"
          },
          "filterType": {
            "type": "keyword"
          },
          "url": {
            "type": "keyword"
          }
        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 192 bytes
    - Viewed (0)
  4. fess-crawler/src/test/resources/extractor/test_ns.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <hoge:address xmlns:hoge="http://www.example.com/hoge">
    	<hoge:item sex="male" custid="A12345">
    		<hoge:name>鈴木太郎</hoge:name>
    		<hoge:access kind="email"></hoge:access>
    		<hoge:access kind="url">http://www.taro.com/</hoge:access>
    		<hoge:image file="taro.png" />
    	</hoge:item>
    	<hoge:item sex="male" custid="B23456">
    		<hoge:name>佐藤二朗</hoge:name>
    		<hoge:access kind="email">******@****.***</hoge:access>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 707 bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

        }
    
        /**
         * Adds a sitemap URL to the list of sitemaps.
         *
         * @param url The URL of the sitemap to be added
         */
        public void addSitemap(final String url) {
            if (!sitemapList.contains(url)) {
                sitemapList.add(url);
            }
        }
    
        /**
         * Returns an array of sitemap URLs.
         *
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientFactory.java

    import jakarta.annotation.Resource;
    
    /**
     * A factory class for managing and creating crawler clients based on URL patterns.
     * This class implements AutoCloseable to properly handle resource cleanup.
     *
     * <p>The factory maintains a map of regular expression patterns to crawler clients,
     * allowing for URL-based client selection. Clients can be added with specific patterns
     * and optionally at specific positions in the processing order.</p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 7K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

         * @param childUrlList the set of child URLs
         * @param url the parent URL
         * @param depth the depth of the child URLs
         * @param encoding the encoding of the child URLs
         */
        protected void storeChildUrls(final CrawlerContext crawlerContext, final Set<RequestData> childUrlList, final String url,
                final int depth, final String encoding) {
            // add url and filter
            final Set<String> urlSet = new HashSet<>();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                buf.append("<url>").append('\n');
                buf.append("<loc>http://localhost:7070/index.html</loc>").append('\n');
                buf.append("<loc>http://localhost:7070/file").append(count).append("-1.html").append("</loc>").append('\n');
                buf.append("</url>").append('\n');
                buf.append("</urlset>").append('\n');
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerContext.java

     * of the crawler's behavior.
     *
     * <p>
     * The context includes information such as the session ID, active thread count, access count, crawler status,
     * URL filter, rule manager, interval controller, robots.txt URL set, sitemaps, number of threads,
     * maximum thread check count, maximum depth, and maximum access count.
     * </p>
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  10. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                file.deleteOnExit();
                fileTransformer.setPath(file.getAbsolutePath());
                crawler.addUrl(url);
                crawler.getCrawlerContext().setMaxAccessCount(maxCount);
                crawler.getCrawlerContext().setNumOfThread(numOfThread);
                crawler.urlFilter.addInclude(url + ".*");
                final String sessionId = crawler.execute();
                assertEquals(maxCount, dataService.getCount(sessionId));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 7.7K bytes
    - Viewed (0)
Back to top