Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 71 - 80 of 529 for crawlen (1.25 sec)

  1. src/main/java/org/codelibs/fess/app/web/admin/failureurl/EditForm.java

        public String id;
    
        /**
         * The URL that failed during crawling.
         * This is a required field containing the actual URL that encountered an error.
         */
        @Required
        public String url;
    
        /**
         * The name of the crawler thread that encountered the failure.
         * This is a required field used for identifying which crawler process failed.
         */
        @Required
        public String threadName;
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/exception/MaxLengthExceededException.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.exception;
    
    /**
     * MaxLengthExceededException is thrown when the content length exceeds the maximum allowed length.
     * It extends CrawlingAccessException, indicating a crawling-related access issue.
     *
     */
    public class MaxLengthExceededException extends CrawlingAccessException {
    
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/app/web/api/admin/fileconfig/SearchBody.java

    /**
     * Search request body for file crawling configuration administration API.
     */
    public class SearchBody extends BaseSearchBody {
    
        /**
         * Default constructor.
         */
        public SearchBody() {
            super();
        }
    
        /** Name of the file crawling configuration */
        public String name;
    
        /** File paths to crawl */
        public String paths;
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.2K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/CrawlerClientCreator.java

     */
    package org.codelibs.fess.crawler.client;
    
    import java.util.LinkedHashMap;
    import java.util.LinkedList;
    import java.util.List;
    import java.util.Map;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.container.CrawlerContainer;
    
    import jakarta.annotation.Resource;
    
    /**
     * Creates and manages crawler clients for web crawling operations.
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/ExtractData.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    import java.io.Serializable;
    import java.util.HashMap;
    import java.util.Map;
    import java.util.Set;
    
    import org.apache.tika.metadata.ClimateForcast;
    import org.apache.tika.metadata.CreativeCommons;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RequestData.java

     */
    package org.codelibs.fess.crawler.entity;
    
    import java.util.Objects;
    
    import org.codelibs.fess.crawler.Constants;
    
    /**
     * Represents a request data for crawling.
     * This class encapsulates the HTTP method, URL, and weight associated with a crawling request.
     */
    public class RequestData {
        /**
         * HTTP methods supported for crawling requests.
         */
        public enum Method {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/fs/FileSystemClient.java

    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.builder.RequestDataBuilder;
    import org.codelibs.fess.crawler.client.AbstractCrawlerClient;
    import org.codelibs.fess.crawler.client.AccessTimeoutTarget;
    import org.codelibs.fess.crawler.entity.RequestData;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 15.1K bytes
    - Viewed (0)
  8. src/main/java/org/codelibs/fess/mylasta/direction/FessConfig.java

        /** The key of the configuration. e.g. \u002e\u06d4\u2e3c\u3002 */
        String CRAWLER_DOCUMENT_FULLSTOP_CHARS = "crawler.document.fullstop.chars";
    
        /** The key of the configuration. e.g. UTF-8 */
        String CRAWLER_CRAWLING_DATA_ENCODING = "crawler.crawling.data.encoding";
    
        /** The key of the configuration. e.g. http,https */
        String CRAWLER_WEB_PROTOCOLS = "crawler.web.protocols";
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 525.7K bytes
    - Viewed (2)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/UrlQueueService.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.service;
    
    import java.util.List;
    
    import org.codelibs.fess.crawler.entity.UrlQueue;
    
    /**
     * Service interface for managing URL queues.
     * Provides methods for adding, retrieving, and managing URLs within a crawling session.
     *
     * @param <QUEUE> the type of URL queue
     */
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.6K bytes
    - Viewed (0)
  10. src/main/java/org/codelibs/fess/app/web/api/admin/webconfig/SearchBody.java

    /**
     * Search request body for web crawling configuration administration API.
     */
    public class SearchBody extends BaseSearchBody {
    
        /**
         * Default constructor.
         */
        public SearchBody() {
            super();
        }
    
        /** Name of the web crawling configuration */
        public String name;
    
        /** URLs to crawl */
        public String urls;
    
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 1.2K bytes
    - Viewed (0)
Back to top