Search Options

Results per page
Sort
Preferred Languages
Advance

Results 41 - 50 of 51 for filemap (0.09 sec)

  1. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                buf = new StringBuilder();
                buf.append("<?xml version=\"1.0\" encoding=\"UTF-8\"?>").append('\n');
                buf.append("<urlset ").append("xmlns=\"http://www.sitemaps.org/schemas/sitemap/0.9\">").append('\n');
                buf.append("<url>").append('\n');
                buf.append("<loc>http://localhost:7070/index.html</loc>").append('\n');
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  2. internal/config/config.go

    			tgtName := strings.TrimPrefix(k, envVarPrefix)
    			if tgtName != "" {
    				if v, ok := filterMap[k]; ok {
    					if strings.HasPrefix(envVarPrefix, v) {
    						filterMap[k] = envVarPrefix
    					}
    				} else {
    					filterMap[k] = envVarPrefix
    				}
    			}
    		}
    	}
    
    	for k, v := range filterMap {
    		seen.Add(strings.TrimPrefix(k, v))
    	}
    
    	seen.Remove(Default)
    Registered: Sun Dec 28 19:28:13 UTC 2025
    - Last Modified: Sun Sep 28 20:59:21 UTC 2025
    - 37.7K bytes
    - Viewed (0)
  3. CLAUDE.md

    extractorFactory.addExtractor("text/html", tikaExtractor, 1);  // Fallback
    ```
    
    ### Helpers
    
    **RobotsTxtHelper**: RFC 9309 parsing, user-agent matching, crawl-delay, sitemaps
    **SitemapsHelper**: Sitemap XML parsing, index handling
    **MimeTypeHelper**: MIME detection via Tika
    **EncodingHelper**: Charset detection with BOM
    **UrlConvertHelper**: URL normalization
    
    ---
    
    ## Development Workflow
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 28 17:31:34 UTC 2025
    - 10.7K bytes
    - Viewed (0)
  4. .github/workflows/tests.yml

          matrix:
            dbversion: [ 'v6.5.0' ]
            go: ['1.24', '1.25']
            platform: [ ubuntu-latest ]
        runs-on: ${{ matrix.platform }}
    
        steps:
          - name: Setup TiDB
            uses: Icemap/tidb-action@main
            with:
              port: 9940
              version: ${{matrix.dbversion}}
    
          - name: Set up Go 1.x
            uses: actions/setup-go@v4
            with:
    Registered: Sun Dec 28 09:35:17 UTC 2025
    - Last Modified: Mon Sep 08 09:19:22 UTC 2025
    - 8.9K bytes
    - Viewed (0)
  5. android/guava-tests/test/com/google/common/collect/MapsCollectionTest.java

        suite.addTest(filterSortedMapSuite());
        suite.addTest(filterNavigableMapSuite());
        return suite;
      }
    
      static TestSuite filterMapSuite() {
        TestSuite suite = new TestSuite("FilterMap");
        suite.addTest(
            MapTestSuiteBuilder.using(
                    new TestStringMapGenerator() {
                      @Override
    Registered: Fri Dec 26 12:43:10 UTC 2025
    - Last Modified: Tue May 13 17:27:14 UTC 2025
    - 32.4K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

            // Test sitemaps
            String[] sitemaps = robotsTxt.getSitemaps();
            assertEquals(1, sitemaps.length);
            assertEquals("http://www.example.com/sitemap.xml", sitemaps[0]);
        }
    
        public void testParse_malformed() {
            RobotsTxt robotsTxt;
            final InputStream in = RobotsTxtHelperTest.class.getResourceAsStream("robots_malformed.txt");
            try {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 20.6K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                        rule.setResponseProcessor(container.getComponent("sitemapsResponseProcessor"));
                        rule.setRuleId("sitemapsRule");
                        rule.addRule("url", ".*sitemap.*");
                    })//
                    .<DefaultResponseProcessor> singleton("defaultResponseProcessor", DefaultResponseProcessor.class, processor -> {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Tue Nov 11 13:40:14 UTC 2025
    - 25.8K bytes
    - Viewed (0)
  8. guava-tests/test/com/google/common/collect/MapsCollectionTest.java

        suite.addTest(filterSortedMapSuite());
        suite.addTest(filterNavigableMapSuite());
        return suite;
      }
    
      static TestSuite filterMapSuite() {
        TestSuite suite = new TestSuite("FilterMap");
        suite.addTest(
            MapTestSuiteBuilder.using(
                    new TestStringMapGenerator() {
                      @Override
    Registered: Fri Dec 26 12:43:10 UTC 2025
    - Last Modified: Tue May 13 17:27:14 UTC 2025
    - 32.4K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

            }
        }
    
        /**
         * Processes robots.txt for the given URL.
         * This method fetches and parses the robots.txt file to extract disallow/allow rules
         * and sitemap information.
         *
         * @param url The URL to process robots.txt for
         */
        protected void processRobotsTxt(final String url) {
            if (StringUtil.isBlank(url)) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 53.7K bytes
    - Viewed (0)
  10. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

            <match value="allow:" type="stringignorecase" offset="0"/>
            <match value="disallow:" type="stringignorecase" offset="0"/>
            <match value="sitemap:" type="stringignorecase" offset="0"/>
            <match value="\nuser-agent:" type="stringignorecase" offset="0:1000"/>
            <match value="\nallow:" type="stringignorecase" offset="0:1000"/>
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Oct 16 07:46:32 UTC 2025
    - 320.2K bytes
    - Viewed (5)
Back to top