Search Options

Display Count
Sort
Preferred Language
Advanced Search

Results 21 - 30 of 51 for filemap (0.23 seconds)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/RobotsTxtTest.java

            RobotsTxt robotsTxt = new RobotsTxt();
    
            robotsTxt.addSitemap("https://example.com/sitemap.xml");
            robotsTxt.addSitemap("https://example.com/sitemap2.xml");
    
            String[] sitemaps = robotsTxt.getSitemaps();
            assertEquals(2, sitemaps.length);
            assertEquals("https://example.com/sitemap.xml", sitemaps[0]);
            assertEquals("https://example.com/sitemap2.xml", sitemaps[1]);
        }
    
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Thu Nov 13 13:29:22 GMT 2025
    - 14.4K bytes
    - Click Count (0)
  2. fess-crawler/src/test/resources/org/codelibs/fess/crawler/helper/robots.txt

    Crawl-delay: 3
    
    User-agent: Crawler
    Disallow: /aaa
    
    User-agent: Crawler/1.0
    Disallow: /bbb
    
    User-agent: Crawler/2.0
    Disallow: /ccc
    
    User-agent: Hoge Crawler
    Disallow: /ddd
    
    sitemap: http://www.example.com/sitmap.xml
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Sun Oct 11 02:16:55 GMT 2015
    - 566 bytes
    - Click Count (0)
  3. android/guava-tests/test/com/google/common/io/FilesFileTraverserTest.java

          throws Exception {
        File fileA = newFile("file-a");
        File dir1 = newDir("dir-1");
        newFile("dir-1/file-b");
        newFile("dir-1/dir-2");
    
        assertThat(Iterables.limit(Files.fileTraverser().breadthFirst(rootDir), 3))
            .containsExactly(rootDir, fileA, dir1);
      }
    
      public void testFileTraverser_multipleDirectoryLayers_traversalReturnsAll() throws Exception {
        File fileA = newFile("file-a");
    Created: Fri Dec 26 12:43:10 GMT 2025
    - Last Modified: Thu Dec 19 18:03:30 GMT 2024
    - 3.4K bytes
    - Click Count (0)
  4. internal/lock/lock_windows.go

    	var lockType uint32 = lockFileFailImmediately | lockFileExclusiveLock
    	if flag == syscall.O_RDONLY {
    		// https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-lockfileex
    		//lint:ignore SA4016 Reasons
    		lockType = lockFileFailImmediately // Set this to enable shared lock and fail immediately.
    	}
    	return lockedOpenFile(path, flag, perm, lockType)
    }
    
    Created: Sun Dec 28 19:28:13 GMT 2025
    - Last Modified: Sun Sep 28 20:59:21 GMT 2025
    - 7.9K bytes
    - Click Count (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapNews.java

     */
    package org.codelibs.fess.crawler.entity;
    
    import java.io.Serializable;
    
    /**
     * Represents a news entry within a sitemap URL.
     * This class encapsulates the properties of a news article as defined in the Google News Sitemap extension.
     *
     * <p>
     * The news extension allows you to provide additional information about news articles on your site.
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Thu Nov 13 13:34:36 GMT 2025
    - 4.8K bytes
    - Click Count (0)
  6. src/main/java/jcifs/smb1/http/NetworkExplorer.java

         * Default constructor.
         */
        public NetworkExplorer() {
            super();
        }
    
        private static LogStream log = LogStream.getInstance();
    
        /** The MIME type mapping */
        private MimeMap mimeMap;
        /** The CSS style for HTML rendering */
        private String style;
        /** The NTLM SSP handler */
        private NtlmSsp ntlmSsp;
        /** Flag indicating if credentials were supplied */
    Created: Sat Dec 20 13:44:44 GMT 2025
    - Last Modified: Sun Aug 31 08:00:57 GMT 2025
    - 22.6K bytes
    - Click Count (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapImage.java

     */
    package org.codelibs.fess.crawler.entity;
    
    import java.io.Serializable;
    
    /**
     * Represents an image entry within a sitemap URL.
     * This class encapsulates the properties of an image as defined in the Google Image Sitemap extension.
     *
     * <p>
     * The image extension allows you to provide additional information about images on your pages.
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Thu Nov 13 13:34:36 GMT 2025
    - 3.8K bytes
    - Click Count (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

        protected static final Pattern CRAWL_DELAY_RECORD = Pattern.compile("^crawl-delay:\\s*([^\\s]+)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /**
         * Pattern for Sitemap record.
         */
        protected static final Pattern SITEMAP_RECORD = Pattern.compile("^sitemap:\\s*([^\\s]+)\\s*$", Pattern.CASE_INSENSITIVE);
    
        /** Whether robots.txt processing is enabled. */
        protected boolean enabled = true;
    
        /**
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Fri Nov 14 12:52:01 GMT 2025
    - 11.4K bytes
    - Click Count (0)
  9. internal/mountinfo/mountinfo_windows.go

    		// Recognize "fixed", "removable", "remote" and "ramdisk" drives as proper drives
    		// which can be treated as an actual mount-point, rest can be ignored.
    		// https://docs.microsoft.com/en-us/windows/desktop/api/fileapi/nf-fileapi-getdrivetypew
    		mountPointCache.Store(path, true)
    		return true
    	}
    	mountPointCache.Store(path, false)
    	return false
    Created: Sun Dec 28 19:28:13 GMT 2025
    - Last Modified: Tue Feb 18 16:25:55 GMT 2025
    - 2.1K bytes
    - Click Count (0)
  10. README.md

        controller.setDefaultIntervalTime(1000);
    });
    ```
    
    ### Sitemap Support
    
    ```java
    // Enable sitemap processing
    container.singleton("sitemapsRule", SitemapsRule.class, rule -> {
        rule.addRule("url", ".*sitemap.*");
    });
    
    // Add sitemap URL
    crawler.addUrl("https://example.com/sitemap.xml");
    ```
    
    ## Data Access and Storage
    
    ### Accessing Crawled Data
    
    ```java
    Created: Sat Dec 20 11:21:39 GMT 2025
    - Last Modified: Sun Aug 31 05:32:52 GMT 2025
    - 15.3K bytes
    - Click Count (0)
Back to Top