Search Options

Results per page
Sort
Preferred Languages
Advance

Results 301 - 310 of 529 for crawlen (1.06 sec)

  1. src/main/java/org/codelibs/fess/opensearch/config/exentity/RequestHeader.java

        }
    
        public void setVersionNo(final Long version) {
            asDocMeta().version(version);
        }
    
        public org.codelibs.fess.crawler.client.http.RequestHeader getCrawlerRequestHeader() {
            return new org.codelibs.fess.crawler.client.http.RequestHeader(getName(), getValue());
        }
    
        public WebConfig getWebConfig() {
            if (webConfig == null) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Mar 15 06:53:53 UTC 2025
    - 2.5K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.util;
    
    import java.io.File;
    
    import org.codelibs.core.io.FileUtil;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.mortbay.jetty.Handler;
    import org.mortbay.jetty.Server;
    import org.mortbay.jetty.handler.DefaultHandler;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/TextUtilTest.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.util;
    
    import java.io.IOException;
    import java.io.Reader;
    import java.io.StringReader;
    
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.util.TextUtil.TextNormalizeContext;
    import org.dbflute.utflute.core.PlainTestCase;
    
    /**
     * @author shinsuke
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 8.2K bytes
    - Viewed (0)
  4. src/main/resources/crawler_opensearch+urlQueueService.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN" 
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<component name="urlQueueService"
    		class="org.codelibs.fess.crawler.service.FessUrlQueueService">
    		<arg>crawlerConfig</arg>
    	</component>
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Oct 30 05:29:49 UTC 2025
    - 336 bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/entity/ResultDataTest.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    import java.util.function.Function;
    
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.dbflute.utflute.core.PlainTestCase;
    
    public class ResultDataTest extends PlainTestCase {
    
        public void test_setRawData() {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.9K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/HtmlXpathExtractorTest.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.BufferedInputStream;
    import java.io.ByteArrayInputStream;
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.InputStreamUtil;
    import org.codelibs.core.lang.StringUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.ExtractData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Abstract base class for XML extractors.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 8.6K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/HtmlTransformerTest.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.util.Map;
    
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.entity.AccessResultDataImpl;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 13.8K bytes
    - Viewed (0)
  9. fess-crawler/src/test/resources/extractor/json/test.json

    {
      "title": "Sample Document",
      "author": "John Doe",
      "version": "1.0",
      "published": "2025-01-15",
      "tags": ["crawler", "extractor", "json"],
      "content": {
        "summary": "This is a sample JSON document for testing",
        "body": "The extractor should handle nested objects and arrays properly"
      },
      "metadata": {
        "created_at": "2025-01-01T00:00:00Z",
        "updated_at": "2025-01-15T12:00:00Z"
      }
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 03:46:53 UTC 2025
    - 412 bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/helper/CrawlingConfigHelper.java

    import com.google.common.cache.Cache;
    import com.google.common.cache.CacheBuilder;
    
    import jakarta.annotation.PostConstruct;
    
    /**
     * Helper class for managing crawling configurations.
     * Provides functionality to store, retrieve, and manage different types of crawling configurations
     * including web, file, and data configurations. Supports caching and session-based configuration management.
     */
    public class CrawlingConfigHelper {
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 19.5K bytes
    - Viewed (1)
Back to top