Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 12 for 0001 (0.01 sec)

  1. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

          <!--  the length of a child atom, or start of data -->
          <match value="moov\000" type="string" offset="4"/>
          <match value="mdat\000" type="string" offset="4"/>
          <match value="free\000" type="string" offset="4"/>
          <match value="skip\000" type="string" offset="4"/>
          <match value="pnot\000" type="string" offset="4"/>
          <!-- General Atom match, specific ftypXXX ones present for subtypes -->
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/http/HcHttpClientTest.java

            assertEquals("http://192.168.1.1/path/file", HcHttpClient.constructRedirectLocation("http://192.168.1.1/path/", "file"));
            assertEquals("http://[2001:db8::1]/path/file", HcHttpClient.constructRedirectLocation("http://[2001:db8::1]/path/", "file"));
            assertEquals("http://example.com:8080/path/file", HcHttpClient.constructRedirectLocation("http://example.com:8080/path/", "file"));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.7K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/EmlExtractorTest.java

                final String[] receivedDate = data.getValues("Received-Date");
                logger.info("Received-Date: {}", receivedDate[0]);
                assertEquals(receivedDate[0], "2012-11-11T02:39:59.000Z");
            }
        }
    
        public void test_getDecodeText() throws Exception {
            assertEquals("", emlExtractor.getDecodeText(null));
            assertEquals("", emlExtractor.getDecodeText(""));
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 4.6K bytes
    - Viewed (1)
  4. fess-crawler-lasta/pom.xml

    <?xml version="1.0"?>
    <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
    	<modelVersion>4.0.0</modelVersion>
    	<artifactId>fess-crawler-lasta</artifactId>
    	<packaging>jar</packaging>
    	<name>Fess Crawler for LastaFlute</name>
    	<description>This is LastaFlute support.</description>
    	<parent>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 2.9K bytes
    - Viewed (0)
  5. pom.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
    	<modelVersion>4.0.0</modelVersion>
    	<groupId>org.codelibs.fess</groupId>
    	<artifactId>fess-crawler-parent</artifactId>
    	<version>15.3.0-SNAPSHOT</version>
    	<packaging>pom</packaging>
    	<name>Fess Crawler Project</name>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 2.8K bytes
    - Viewed (0)
  6. fess-crawler-opensearch/pom.xml

    <?xml version="1.0"?>
    <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
    	<modelVersion>4.0.0</modelVersion>
    	<artifactId>fess-crawler-opensearch</artifactId>
    	<packaging>jar</packaging>
    	<name>Fess Crawler OpenSearch</name>
    	<parent>
    		<groupId>org.codelibs.fess</groupId>
    		<artifactId>fess-crawler-parent</artifactId>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/filter/UrlFilterTest.java

            urlFilter = container.getComponent("urlFilter");
        }
    
        /**
         * Test basic initialization with session ID
         */
        public void test_init_withSessionId() {
            String sessionId = "test-session-001";
            urlFilter.init(sessionId);
            // Initialization should complete without errors
            assertNotNull(urlFilter);
        }
    
        /**
         * Test initialization with null session ID
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 19K bytes
    - Viewed (0)
  8. pom.xml

    <?xml version="1.0" encoding="UTF-8"?>
    <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd">
    	<modelVersion>4.0.0</modelVersion>
    	<artifactId>fess-suggest</artifactId>
    	<version>15.3.0-SNAPSHOT</version>
    	<packaging>jar</packaging>
    	<name>fess-suggest</name>
    	<url>https://fess.codelibs.org/</url>
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sat Sep 06 03:14:57 UTC 2025
    - 4.3K bytes
    - Viewed (0)
  9. fess-crawler/pom.xml

    <?xml version="1.0"?>
    <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
    	<modelVersion>4.0.0</modelVersion>
    	<artifactId>fess-crawler</artifactId>
    	<packaging>jar</packaging>
    	<name>Fess Crawler</name>
    	<description>Fess Crawler is a crawler framework.</description>
    	<parent>
    		<groupId>org.codelibs.fess</groupId>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 11.3K bytes
    - Viewed (0)
  10. README.md

    crawler.crawlerContext.setNumOfThread(10);
    
    // Set maximum crawl depth
    crawler.crawlerContext.setMaxDepth(3);
    
    // Set request interval (politeness)
    crawler.crawlerContext.setDefaultIntervalTime(1000); // 1 second
    ```
    
    ### URL Filtering
    
    ```java
    // Include patterns
    crawler.urlFilter.addInclude("https://example.com/.*");
    crawler.urlFilter.addInclude(".*\\.pdf$");
    
    // Exclude patterns  
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
Back to top