Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 41 - 50 of 51 for ditamap (0.06 seconds)

The search processing time has exceeded the limit. The displayed results may be partial.

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                buf = new StringBuilder();
                buf.append("<?xml version=\"1.0\" encoding=\"UTF-8\"?>").append('\n');
                buf.append("<urlset ").append("xmlns=\"http://www.sitemaps.org/schemas/sitemap/0.9\">").append('\n');
                buf.append("<url>").append('\n');
                buf.append("<loc>http://localhost:7070/index.html</loc>").append('\n');
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Sat Mar 15 06:52:00 GMT 2025
    - 6.3K bytes
    - Click Count (0)
  2. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                buf = new StringBuilder();
                buf.append("<?xml version=\"1.0\" encoding=\"UTF-8\"?>").append('\n');
                buf.append("<urlset ").append("xmlns=\"http://www.sitemaps.org/schemas/sitemap/0.9\">").append('\n');
                buf.append("<url>").append('\n');
                buf.append("<loc>http://localhost:7070/index.html</loc>").append('\n');
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Sat Mar 15 06:52:00 GMT 2025
    - 6.3K bytes
    - Click Count (0)
  3. CLAUDE.md

    extractorFactory.addExtractor("text/html", tikaExtractor, 1);  // Fallback
    ```
    
    ### Helpers
    
    **RobotsTxtHelper**: RFC 9309 parsing, user-agent matching, crawl-delay, sitemaps
    **SitemapsHelper**: Sitemap XML parsing, index handling
    **MimeTypeHelper**: MIME detection via Tika
    **EncodingHelper**: Charset detection with BOM
    **UrlConvertHelper**: URL normalization
    
    ---
    
    ## Development Workflow
    
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Fri Nov 28 17:31:34 GMT 2025
    - 10.7K bytes
    - Click Count (0)
  4. cmd/admin-handlers.go

    	}
    
    	disks := strings.Split(r.Form.Get("disks"), ",")
    	byDisk := strings.EqualFold(r.Form.Get("by-disk"), "true")
    	var diskMap map[string]struct{}
    	if len(disks) > 0 && disks[0] != "" {
    		diskMap = make(map[string]struct{}, len(disks))
    		for _, k := range disks {
    			if k != "" {
    				diskMap[k] = struct{}{}
    			}
    		}
    	}
    	jobID := r.Form.Get("by-jobID")
    
    	hosts := strings.Split(r.Form.Get("hosts"), ",")
    Created: Sun Dec 28 19:28:13 GMT 2025
    - Last Modified: Sun Sep 28 20:59:21 GMT 2025
    - 99.7K bytes
    - Click Count (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                        rule.setResponseProcessor(container.getComponent("sitemapsResponseProcessor"));
                        rule.setRuleId("sitemapsRule");
                        rule.addRule("url", ".*sitemap.*");
                    })//
                    .<DefaultResponseProcessor> singleton("defaultResponseProcessor", DefaultResponseProcessor.class, processor -> {
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Tue Nov 11 13:40:14 GMT 2025
    - 25.8K bytes
    - Click Count (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

            }
        }
    
        /**
         * Processes robots.txt for the given URL.
         * This method fetches and parses the robots.txt file to extract disallow/allow rules
         * and sitemap information.
         *
         * @param url The URL to process robots.txt for
         */
        protected void processRobotsTxt(final String url) {
            if (StringUtil.isBlank(url)) {
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Sun Nov 23 12:19:14 GMT 2025
    - 53.7K bytes
    - Click Count (0)
  7. guava/src/com/google/common/net/MediaType.java

       *
       * @since 20.0
       */
      public static final MediaType VTT_UTF_8 = createConstantUtf8(TEXT_TYPE, "vtt");
    
      /* image types */
      /**
       * <a href="https://en.wikipedia.org/wiki/BMP_file_format">Bitmap file format</a> ({@code bmp}
       * files).
       *
       * @since 13.0
       */
      public static final MediaType BMP = createConstant(IMAGE_TYPE, "bmp");
    
      /**
    Created: Fri Dec 26 12:43:10 GMT 2025
    - Last Modified: Thu Oct 02 01:46:40 GMT 2025
    - 48K bytes
    - Click Count (0)
  8. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"image/x-freehand",
    				"image/x-jp2-codestream",
    				"image/x-jp2-container",
    				"image/x-niff",
    				"image/x-pcx",
    				"image/x-pict",
    				"image/x-portable-anymap",
    				"image/x-portable-bitmap",
    				"image/x-portable-graymap",
    				"image/x-portable-pixmap",
    				"image/x-raw-adobe",
    				"image/x-raw-hasselblad",
    				"image/x-raw-fuji",
    				"image/x-raw-canon",
    				"image/x-raw-kodak",
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Sun Nov 23 03:46:53 GMT 2025
    - 50.1K bytes
    - Click Count (0)
  9. cmd/object-handlers_test.go

    	// function type for creating signed requests - used to repeat
    	// requests with V2 and V4 signing.
    	type testSignedReqFn func(method, urlStr string, contentLength int64,
    		body io.ReadSeeker, accessKey, secretKey string, metamap map[string]string) (*http.Request,
    		error)
    
    	mkGetReq := func(oi ObjectInput, byteRange string, i int, mkSignedReq testSignedReqFn) {
    		object := oi.objectName
    		rec := httptest.NewRecorder()
    Created: Sun Dec 28 19:28:13 GMT 2025
    - Last Modified: Sun Sep 28 20:59:21 GMT 2025
    - 163.1K bytes
    - Click Count (0)
  10. RELEASE.md

    fsx950223, ganler, Gaurav Singh, Georgios Pinitas, Gian Marco Iodice, Giorgio
    Arena, Giuseppe Rossini, Gregory Keith, Guozhong Zhuang, gurushantj, Hahn
    Anselm, Harald Husum, Harjyot Bagga, Hristo Vrigazov, Ilya Persky, Ir1d, Itamar
    Turner-Trauring, jacco, Jake Tae, Janosh Riebesell, Jason Zaman, jayanth, Jeff
    Daily, Jens Elofsson, Jinzhe Zeng, JLZ, Jonas Skog, Jonathan Dekhtiar, Josh
    Created: Tue Dec 30 12:39:10 GMT 2025
    - Last Modified: Tue Oct 28 22:27:41 GMT 2025
    - 740.4K bytes
    - Click Count (3)
Back to Top