Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 21 - 30 of 37 for internal (0.05 sec)

  1. README.md

    - **Flexible Configuration**: XML-based dependency injection with LastaFlute DI
    - **Extensible Architecture**: Plugin system for custom extractors, transformers, and clients
    - **Rate Limiting**: Politeness policies and interval controllers
    - **URL Filtering**: Regex-based inclusion/exclusion patterns
    - **Data Persistence**: Multiple backend options including OpenSearch integration
    
    ## Technology Stack
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  2. fess-crawler-opensearch/src/main/resources/crawler_opensearch.xml

    <components namespace="fessCrawler">
        <include path="crawler/container.xml"/>
        <include path="crawler/client.xml"/>
        <include path="crawler/rule.xml"/>
        <include path="crawler/filter.xml"/>
        <include path="crawler/interval.xml"/>
        <include path="crawler/extractor.xml"/>
        <include path="crawler/mimetype.xml"/>
        <include path="crawler/encoding.xml"/>
        <include path="crawler/urlconverter.xml"/>
        <include path="crawler/log.xml"/>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Nov 07 04:44:10 UTC 2024
    - 2.2K bytes
    - Viewed (0)
  3. fess-crawler/src/test/java/org/codelibs/fess/crawler/client/FaultTolerantClientTest.java

            final FaultTolerantClient client = new FaultTolerantClient();
            client.setRetryInterval(100);
            final TestClient testClient = new TestClient();
            testClient.exceptionCount = 4;
            testClient.interval = 100;
            final TestListener testListener = new TestListener();
            client.setCrawlerClient(testClient);
            client.setRequestListener(testListener);
            final String url = "http://test.com/";
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 15.1K bytes
    - Viewed (0)
  4. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        <sub-class-of type="text/plain"/>
        <alias type="text/x-dtd"/>
        <glob pattern="*.dtd"/>
      </mime-type>
    
      <mime-type type="application/xml-external-parsed-entity">
        <alias type="text/xml-external-parsed-entity"/>
      </mime-type>
    
      <mime-type type="application/xmpp+xml"/>
      <mime-type type="application/xop+xml">
        <glob pattern="*.xop"/>
      </mime-type>
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/interval/impl/DefaultIntervalController.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.interval.impl;
    
    import java.util.Map;
    
    import org.codelibs.core.lang.ThreadUtil;
    
    /**
     * Default implementation of the IntervalController.
     * This class provides a default way to manage delays between crawler operations.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.4K bytes
    - Viewed (0)
  6. fess-crawler/src/test/java/org/codelibs/fess/crawler/interval/impl/HostIntervalControllerTest.java

     * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND,
     * either express or implied. See the License for the specific language
     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.interval.impl;
    
    import java.util.ArrayList;
    import java.util.List;
    import java.util.concurrent.Callable;
    import java.util.concurrent.ExecutionException;
    import java.util.concurrent.ExecutorService;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 3.2K bytes
    - Viewed (0)
  7. fess-crawler-opensearch/src/main/java/org/codelibs/fess/crawler/client/FesenClient.java

         */
        public void setSizeForDelete(final int sizeForDelete) {
            this.sizeForDelete = sizeForDelete;
        }
    
        /**
         * Sets the retry interval in milliseconds.
         *
         * @param retryInterval The retry interval.
         */
        public void setRetryInterval(final long retryInterval) {
            this.retryInterval = retryInterval;
        }
    
        /**
         * Sets the maximum retry count.
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 25.3K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/SitemapsHelper.java

            } catch (final Exception e) {
                throw new SitemapsException("Could not parse XML Sitemaps.", e);
            }
            return handler.getSitemapSet();
        }
    
        /**
         * Disables external resources for the SAX parser to prevent XXE attacks.
         * @param parser the SAX parser to configure
         * @throws SAXNotRecognizedException if the parser doesn't recognize the feature
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 14.7K bytes
    - Viewed (0)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/CrawlerThread.java

    import org.codelibs.fess.crawler.exception.ChildUrlsException;
    import org.codelibs.fess.crawler.exception.CrawlingAccessException;
    import org.codelibs.fess.crawler.helper.LogHelper;
    import org.codelibs.fess.crawler.interval.IntervalController;
    import org.codelibs.fess.crawler.log.LogType;
    import org.codelibs.fess.crawler.processor.ResponseProcessor;
    import org.codelibs.fess.crawler.rule.Rule;
    import org.codelibs.fess.crawler.service.DataService;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 20.4K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

            this.authSchemeProviderMap = authSchemeProviderMap;
        }
    
        /**
         * Sets the connection check interval in seconds.
         *
         * @param connectionCheckInterval The connection check interval
         */
        public void setConnectionCheckInterval(final int connectionCheckInterval) {
            this.connectionCheckInterval = connectionCheckInterval;
        }
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 52.2K bytes
    - Viewed (0)
Back to top