Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 61 - 70 of 84 for mxml (0.03 sec)

  1. fess-crawler/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                FileUtil.writeBytes(robotTxtFile.getAbsolutePath(), buf.toString().getBytes("UTF-8"));
                robotTxtFile.deleteOnExit();
    
                // sitemaps.xml
                buf = new StringBuilder();
                buf.append("<?xml version=\"1.0\" encoding=\"UTF-8\"?>").append('\n');
                buf.append("<urlset ").append("xmlns=\"http://www.sitemaps.org/schemas/sitemap/0.9\">").append('\n');
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  2. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/util/CrawlerWebServer.java

                FileUtil.writeBytes(robotTxtFile.getAbsolutePath(), buf.toString().getBytes("UTF-8"));
                robotTxtFile.deleteOnExit();
    
                // sitemaps.xml
                buf = new StringBuilder();
                buf.append("<?xml version=\"1.0\" encoding=\"UTF-8\"?>").append('\n');
                buf.append("<urlset ").append("xmlns=\"http://www.sitemaps.org/schemas/sitemap/0.9\">").append('\n');
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 6.3K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/HtmlExtractor.java

    import java.util.HashMap;
    import java.util.List;
    import java.util.Map;
    import java.util.regex.Pattern;
    import java.util.stream.Collectors;
    
    import javax.xml.xpath.XPathEvaluationResult;
    import javax.xml.xpath.XPathException;
    import javax.xml.xpath.XPathNodes;
    
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.codelibs.core.lang.StringUtil;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 9.3K bytes
    - Viewed (0)
  4. fess-crawler-opensearch/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

        @Resource
        private FesenClient fesenClient;
    
        private OpenSearchRunner runner;
    
        @Override
        protected String prepareConfigFile() {
            return "app.xml";
        }
    
        @Override
        protected boolean isUseOneTimeContainer() {
            return true;
        }
    
        @Override
        public void setUp() throws Exception {
            // create runner instance
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 7.7K bytes
    - Viewed (0)
  5. fess-crawler/src/test/java/org/codelibs/fess/crawler/helper/RobotsTxtHelperTest.java

            String[] sitemaps = robotsTxt.getSitemaps();
            assertEquals(2, sitemaps.length);
            assertEquals("http://www.example.com/sitmap.xml", sitemaps[0]);
            assertEquals("http://www.example.net/sitmap.xml", sitemaps[1]);
    
        }
    
        public void testParse_disable() {
            final InputStream in = RobotsTxtHelperTest.class.getResourceAsStream("robots.txt");
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.9K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/helper/impl/MimeTypeHelperImpl.java

     *   <li>Configure whether to use the filename for MIME type detection when the stream is octet-stream.</li>
     * </ul>
     *
     * <p>
     * The MIME type detection is based on the {@code tika-mimetypes.xml} resource, which is loaded during initialization.
     * </p>
     *
     * <p>
     * Usage:
     * </p>
     * <pre>
     * MimeTypeHelperImpl mimeTypeHelper = new MimeTypeHelperImpl();
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  7. fess-crawler-lasta/src/test/java/org/codelibs/fess/crawler/CrawlerTest.java

        @Resource
        private FileTransformer fileTransformer;
    
        @Resource
        private CrawlerContainer crawlerContainer;
    
        @Override
        protected String prepareConfigFile() {
            return "crawler.xml";
        }
    
        public void test_execute_web() throws Exception {
            final CrawlerWebServer server = new CrawlerWebServer(7070);
            server.start();
    
            final String url = "http://localhost:7070/";
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Sep 06 04:15:37 UTC 2025
    - 12.8K bytes
    - Viewed (0)
  8. README.md

    ## Quick Start
    
    ### Prerequisites
    
    - Java 21 or higher
    - OpenSearch/Elasticsearch cluster (2.x+ recommended)
    - Maven 3.8+ for building from source
    
    ### Installation
    
    Add the dependency to your `pom.xml`:
    
    ```xml
    <dependency>
        <groupId>org.codelibs.fess</groupId>
        <artifactId>fess-suggest</artifactId>
        <version>15.2.0-SNAPSHOT</version>
    </dependency>
    ```
    
    ### Basic Usage
    
    Registered: Fri Sep 19 09:08:11 UTC 2025
    - Last Modified: Sun Aug 31 03:31:14 UTC 2025
    - 12.1K bytes
    - Viewed (1)
  9. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

    import org.codelibs.fess.crawler.exception.CrawlerSystemException;
    import org.codelibs.fess.crawler.exception.ExtractException;
    
    /**
     * Abstract base class for XML extractors.
     * Provides common functionality for extracting text content from XML-like documents.
     * It handles encoding detection, HTML entity unescaping, and tag-based content extraction.
     *
     */
    public abstract class AbstractXmlExtractor extends AbstractExtractor {
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  10. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapFile.java

     * governing permissions and limitations under the License.
     */
    package org.codelibs.fess.crawler.entity;
    
    import org.codelibs.core.lang.StringUtil;
    
    /**
     * Represents a Sitemap file entry, conforming to the Sitemap XML format.
     * This class holds information about a single Sitemap, including its location and last modification timestamp.
     * It implements the {@link Sitemap} interface.
     *
     * <p>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 4.4K bytes
    - Viewed (1)
Back to top