Crawling - Code Search

src/main/java/org/codelibs/fess/app/web/admin/fileconfig/CreateForm.java

    @CustomSize(maxKey = "form.admin.max.input.size")
    public String paths;

    /**
     * The paths to include during crawling (pattern-based).
     * NOTE(review): the maximum length is presumably taken from the
     * {@code form.admin.max.input.size} setting named by {@code @CustomSize} — confirm.
     */
    @CustomSize(maxKey = "form.admin.max.input.size")
    public String includedPaths;

    /**
     * The paths to exclude during crawling (pattern-based).
     * NOTE(review): the maximum length is presumably taken from the
     * {@code form.admin.max.input.size} setting named by {@code @CustomSize} — confirm.
     */
    @CustomSize(maxKey = "form.admin.max.input.size")
    public String excludedPaths;

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Thu Jul 17 08:28:31 UTC 2025

- 5.6K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/resources/fess_label_en.properties

labels.createdTime=Created Time
labels.depth=Depth
labels.excludedPaths=Excluded Paths for Crawling
labels.excludedUrls=Excluded URLs for Crawling
labels.excludedDocPaths=Excluded Paths for Searching
labels.excludedDocUrls=Excluded URLs for Searching
labels.hostname=Hostname
labels.id=ID
labels.includedPaths=Included Paths for Crawling
labels.includedUrls=Included URLs for Crawling
labels.includedDocPaths=Included Paths for Searching

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Sat Dec 13 02:21:17 UTC 2025

- 44K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/job/CrawlJob.java

    /**
     * The namespace identifier for the crawling session.
     * Used to organize and identify crawling activities in the system.
     * Defaults to the system crawling info name.
     */
    protected String namespace = Constants.CRAWLING_INFO_SYSTEM_NAME;

    /**
     * Array of web crawling configuration IDs to process.

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Fri Nov 28 16:29:12 UTC 2025

- 19.6K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/app/web/api/admin/crawlinginfo/SearchBody.java

import org.codelibs.fess.app.web.api.admin.BaseSearchBody;

/**
 * Search request body for crawling information administration.
 * Extends BaseSearchBody with crawling information-specific search parameters.
 */
public class SearchBody extends BaseSearchBody {

    /** The crawling session ID to search for. */
    public String sessionId;

    /**
     * Default constructor for SearchBody.
     */

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Thu Jul 17 08:28:31 UTC 2025

- 1.1K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/app/web/api/admin/webconfig/SearchBody.java

import org.codelibs.fess.app.web.api.admin.BaseSearchBody;

/**
 * Search request body for web crawling configuration administration API.
 */
public class SearchBody extends BaseSearchBody {

    /**
     * Default constructor.
     */
    public SearchBody() {
        super();
    }

    /** The name of the web crawling configuration. */
    public String name;

    /** The URLs to crawl. */
    public String urls;

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Thu Jul 17 08:28:31 UTC 2025

- 1.2K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/exec/Crawler.java

 * <ul>
 * <li>Web crawling - crawls web sites and web content</li>
 * <li>File system crawling - crawls file systems and documents</li>
 * <li>Data store crawling - crawls databases and other data sources</li>
 * <li>Combined crawling - runs multiple crawling types simultaneously</li>
 * </ul>
 *
 * <p>Command line usage:
 * <pre>
 * java org.codelibs.fess.exec.Crawler [options...]

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Fri Nov 28 16:29:12 UTC 2025

- 31.4K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/helper/CrawlingConfigHelper.java

import com.google.common.cache.Cache;
import com.google.common.cache.CacheBuilder;

import jakarta.annotation.PostConstruct;

/**
 * Helper class for managing crawling configurations.
 * Provides functionality to store, retrieve, and manage different types of crawling configurations
 * including web, file, and data configurations. Supports caching and session-based configuration management.
 */
public class CrawlingConfigHelper {

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Fri Nov 28 16:29:12 UTC 2025

- 19.5K bytes

- Viewed (1)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/app/web/admin/general/EditForm.java

    @Size(max = 10)
    public String thumbnail;

    /**
     * Types of crawling failures to ignore during crawling operations.
     * Specified failure types will not be logged or counted as errors.
     * Validated with {@code @Size(max = 1000)}, which presumably caps the value
     * at 1000 characters — confirm against the imported {@code Size} annotation.
     */
    @Size(max = 1000)
    public String ignoreFailureType;

    /**
     * Threshold for failure count before stopping crawling of a URL.
     * Set to -1 to disable the threshold check.
     */
    @Required

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Sat Dec 13 02:21:17 UTC 2025

- 10.6K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/helper/WebFsIndexHelper.java

            if (logger.isInfoEnabled()) {
                logger.info("No crawling target urls.");
            }
            return;
        }

        doCrawl(sessionId, webConfigList, fileConfigList);
    }

    /**
     * Performs the actual crawling operation for the provided configurations.
     *
     * @param sessionId The session ID for this crawling operation
     * @param webConfigList List of web configurations to crawl

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Fri Nov 28 16:29:12 UTC 2025

- 25K bytes

- Viewed (0)

github.com/codelibs/fess

src/main/java/org/codelibs/fess/app/web/admin/wizard/AdminWizardAction.java

        return redirectWith(getClass(), moreUrl("crawlingConfigForm"));
    }

    /**
     * Creates a crawling configuration and proceeds to the start crawling form.
     *
     * @param form the form containing crawling configuration data
     * @return HTML response redirecting to the start crawling form
     */
    @Execute
    @Secured({ ROLE })

Registered: Sat Dec 20 09:19:18 UTC 2025

- Last Modified: Thu Dec 11 09:47:03 UTC 2025

- 16.3K bytes

- Viewed (0)

Search Options