Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 11 - 20 of 23 for processUrl (0.08 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/impl/AbstractRule.java

        }
    
        @Override
        public ResponseProcessor getResponseProcessor() {
            return responseProcessor;
        }
    
        /**
         * Sets the response processor for this rule.
         *
         * @param responseProcessor the response processor to set
         */
        public void setResponseProcessor(final ResponseProcessor responseProcessor) {
            this.responseProcessor = responseProcessor;
        }
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Wed Sep 03 14:42:53 UTC 2025
    - 2.8K bytes
    - Viewed (0)
  2. fess-crawler/src/main/java/org/codelibs/fess/crawler/rule/Rule.java

    import org.codelibs.fess.crawler.processor.ResponseProcessor;
    
    /**
     * The Rule interface defines the contract for implementing rules that can be applied to
     * response data in a web crawler. Implementations of this interface should provide logic
     * to determine if a given response data matches the rule, retrieve the rule's identifier,
     * and obtain the associated response processor.
     */
    public interface Rule extends Serializable {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.7K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/ResponseProcessor.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.processor;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    
    /**
     * The ResponseProcessor interface defines a contract for processing response data.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 1.1K bytes
    - Viewed (0)
  4. fess-crawler-lasta/src/main/resources/crawler/rule.xml

    		<property name="ruleId">"sitemapsRule"</property>
    		<property name="responseProcessor">
    			<component
    				class="org.codelibs.fess.crawler.processor.impl.SitemapsResponseProcessor">
    			</component>
    		</property>
    		<postConstruct name="addRule">
    			<arg>"url"</arg>
    			<arg>".*sitemap.*"</arg>
    		</postConstruct>
    	</component>
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 1.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/NullResponseProcessor.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.processor.impl;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.processor.ResponseProcessor;
    
    /**
     * NullResponseProcessor is a class that implements the ResponseProcessor interface.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 1.5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/SitemapsResponseProcessor.java

    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    import org.codelibs.fess.crawler.helper.SitemapsHelper;
    import org.codelibs.fess.crawler.processor.ResponseProcessor;
    
    import jakarta.annotation.Resource;
    
    /**
     * A response processor implementation that handles sitemaps.
     * It parses the response body as a SitemapSet, extracts URLs from the sitemaps,
     * and adds them as child URLs to be crawled.
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/LogHelperImpl.java

     *   <li>Processing responses</li>
     *   <li>Handling exceptions during crawling and child URL processing</li>
     *   <li>Handling cases where no URL is in the queue</li>
     *   <li>Handling cases where no response processor or rule is found</li>
     *   <li>Handling system errors</li>
     * </ul>
     *
     * <p>
     * Each logging method checks the log level before logging the message.
     * The log level can be configured in the Log4j2 configuration file.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14K bytes
    - Viewed (0)
  8. fess-crawler/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

                    .<DefaultResponseProcessor> singleton("defaultResponseProcessor", DefaultResponseProcessor.class, processor -> {
                        processor.setTransformer(container.getComponent("fileTransformer"));
                        processor.setSuccessfulHttpCodes(new int[] { 200 });
                        processor.setNotModifiedHttpCodes(new int[] { 304 });
                    })//
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 19.1K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/processor/impl/DefaultResponseProcessor.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.processor.impl;
    
    import java.util.ArrayList;
    import java.util.HashSet;
    import java.util.List;
    import java.util.Set;
    import java.util.stream.Collectors;
    
    import org.apache.logging.log4j.LogManager;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/log/LogType.java

        NO_URL_IN_QUEUE,
        /** Indicates the start of a crawler thread. */
        START_THREAD,
        /** Indicates the finish of a crawler thread. */
        FINISHED_THREAD,
        /** Indicates no response processor is available. */
        NO_RESPONSE_PROCESSOR,
        /** Indicates no rule is available for processing. */
        NO_RULE,
        /** Indicates a system error occurred. */
        SYSTEM_ERROR
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.4K bytes
    - Viewed (0)
Back to top