Search Options

Results per page
Sort
Preferred Languages
Advance

Results 121 - 130 of 658 for crawler (0.05 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/MsPowerPointExtractor.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.IOException;
    import java.io.InputStream;
    import java.util.Map;
    
    import org.apache.poi.hslf.usermodel.HSLFShape;
    import org.apache.poi.hslf.usermodel.HSLFSlideShow;
    import org.apache.poi.hslf.usermodel.HSLFTextParagraph;
    import org.apache.poi.sl.extractor.SlideShowExtractor;
    import org.codelibs.fess.crawler.entity.ExtractData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.1K bytes
    - Viewed (0)
  2. src/test/java/org/codelibs/fess/it/CrawlTestBase.java

                ThreadUtil.sleep(500);
                count++;
                final Map<String, Object> scheduler = getSchedulerItem(namePrefix);
                assertTrue(scheduler.containsKey("running"));
                isRunning = (Boolean) scheduler.get("running");
            }
            if (300 <= count) {
                logger.info("Time out: Failed to start crawler)");
                fail(); // Time Out
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 10K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/AbstractCrawlerClientTest.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.client;
    
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.exception.MaxLengthExceededException;
    import org.dbflute.utflute.core.PlainTestCase;
    
    /**
     * @author shinsuke
     *
     */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3K bytes
    - Viewed (0)
  4. fess-crawler/src/test/java/org/codelibs/fess/crawler/transformer/impl/XpathTransformerTest.java

     */
    package org.codelibs.fess.crawler.transformer.impl;
    
    import java.util.ArrayList;
    import java.util.List;
    import java.util.Map;
    
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.Constants;
    import org.codelibs.fess.crawler.entity.AccessResultDataImpl;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.entity.ResultData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 12.5K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/service/impl/UrlFilterServiceImpl.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.service.impl;
    
    import java.util.List;
    import java.util.regex.Pattern;
    
    import org.codelibs.fess.crawler.helper.MemoryDataHelper;
    import org.codelibs.fess.crawler.service.UrlFilterService;
    
    import jakarta.annotation.Resource;
    
    /**
     * Implementation of the {@link UrlFilterService} interface.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.2K bytes
    - Viewed (0)
  6. fess-crawler-lasta/src/main/resources/crawler/rule.xml

    <!DOCTYPE components PUBLIC "-//DBFLUTE//DTD LastaDi 1.0//EN"
    	"http://dbflute.org/meta/lastadi10.dtd">
    <components namespace="fessCrawler">
    	<include path="crawler/container.xml" />
    	<include path="crawler/transformer.xml" />
    
    	<component name="ruleManager"
    		class="org.codelibs.fess.crawler.rule.impl.RuleManagerImpl" instance="prototype">
    		<postConstruct name="addRule">
    			<arg>sitemapsRule</arg>
    		</postConstruct>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Oct 11 02:16:55 UTC 2015
    - 1.5K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/app/web/admin/webconfig/AdminWebconfigAction.java

         */
        @Execute
        @Secured({ ROLE, ROLE + VIEW })
        public HtmlResponse index(final SearchForm form) {
            return asListHtml();
        }
    
        /**
         * Displays a paginated list of web crawler configurations.
         *
         * @param pageNumber the page number to display (optional)
         * @param form the search form containing filter criteria
         * @return HTML response with the web config list
         */
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Aug 07 03:06:29 UTC 2025
    - 21K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/AbstractIntervalController.java

     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.interval.impl;
    
    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.interval.IntervalController;
    
    /**
     * An abstract base class for implementing {@link IntervalController}.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.5K bytes
    - Viewed (0)
  9. src/main/java/org/codelibs/fess/crawler/transformer/FessStandardTransformer.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.transformer;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.fess.crawler.entity.ResponseData;
    import org.codelibs.fess.crawler.extractor.Extractor;
    import org.codelibs.fess.crawler.extractor.ExtractorFactory;
    import org.codelibs.fess.exception.FessSystemException;
    Registered: Thu Sep 04 12:52:25 UTC 2025
    - Last Modified: Thu Jul 17 08:28:31 UTC 2025
    - 3.8K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractorTest.java

     */
    package org.codelibs.fess.crawler.extractor.impl;
    
    import java.io.BufferedInputStream;
    import java.io.ByteArrayInputStream;
    import java.io.InputStream;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.io.CloseableUtil;
    import org.codelibs.core.io.ResourceUtil;
    import org.codelibs.fess.crawler.container.StandardCrawlerContainer;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.7K bytes
    - Viewed (0)
Back to top