Search Options

Results per page
Sort
Preferred Languages
Advance

Results 251 - 260 of 441 for CRAWLER (2.17 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.InputStreamUtil;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Abstract base class for XML extractors.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 8.6K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformerTest.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.util.Map;
    
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.entity.AccessResultDataImpl;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  3. fess-crawler/src/test/resources/extractor/json/test.json

    {
      "title": "Sample Document",
      "author": "John Doe",
      "version": "1.0",
      "published": "2025-01-15",
      "tags": ["crawler", "extractor", "json"],
      "content": {
        "summary": "This is a sample JSON document for testing",
        "body": "The extractor should handle nested objects and arrays properly"
      },
      "metadata": {
        "created_at": "2025-01-01T00:00:00Z",
        "updated_at": "2025-01-15T12:00:00Z"
      }
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 03:46:53 UTC 2025
    - 412 bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/ResponseDataTest.java

     */
    package org.codelibs.fess.crawler.entity;
    
    import java.io.File;
    import java.io.IOException;
    import java.io.InputStream;
    import java.nio.charset.StandardCharsets;
    import java.nio.file.Files;
    import java.util.Arrays;
    import java.util.Date;
    import java.util.Map;
    import java.util.Set;
    
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.RequestData.Method;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 13:29:22 UTC 2025
    - 14.3K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/TestEntity.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    import java.util.List;
    
    /**
     * @author shinsuke
     *
     */
    public class TestEntity {
        private String title;
    
        private String body;
    
        private List<String> list;
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/ftp/FtpClientTest.java

    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.client.ftp.FtpClient.FtpInfo;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Mon Nov 24 03:59:47 UTC 2025
    - 21.5K bytes
    - Viewed (0)
  7. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/ResponseDataUtilTest.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.util;
    
    import java.io.ByteArrayInputStream;
    import java.io.File;
    import java.io.FileInputStream;
    import java.io.IOException;
    import java.io.InputStream;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.dbflute.utflute.core.PlainTestCase;
    
    /**
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Nov 22 13:28:22 UTC 2025
    - 7.9K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlQueueService.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.service;
    
    import java.util.List;
    
    import org.codelibs.fess.crawler.entity.UrlQueue;
    
    /**
     * Service interface for managing URL queues.
     * Provides methods for adding, retrieving, and managing URLs within a crawling session.
     *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/RobotsTxtHelper.java

    import java.util.regex.Pattern;
    
    import org.apache.commons.io.input.BOMInputStream;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.RobotsTxt;
    import org.codelibs.fess.crawler.entity.RobotsTxt.Directive;
    import org.codelibs.fess.crawler.exception.RobotsTxtException;
    
    /**
     * Robots.txt Parser following RFC 9309 specification.
     *
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Fri Nov 14 12:52:01 UTC 2025
    - 11.4K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/service/impl/UrlQueueServiceImplTest.java

    import java.util.LinkedList;
    import java.util.List;
    import java.util.Map;
    import java.util.Queue;
    
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.AccessResultImpl;
    import org.codelibs.fess.crawler.entity.UrlQueueImpl;
    import org.codelibs.fess.crawler.helper.MemoryDataHelper;
    import org.dbflute.utflute.core.PlainTestCase;
    import org.mockito.InjectMocks;
    import org.mockito.Mock;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Nov 13 13:29:22 UTC 2025
    - 14.1K bytes
    - Viewed (0)
Back to top