Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 6 of 6 for generic (0.04 sec)

  1. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"application/mikey",
    				"application/moss-keys",
    				"application/moss-signature",
    				"application/mosskey-data",
    				"application/mosskey-request",
    				"application/mp4",
    				"application/mpeg4-generic",
    				"application/mpeg4-iod",
    				"application/mpeg4-iod-xmt",
    				"application/msword",
    				"application/msword2",
    				"application/msword5",
    				"application/mxf",
    				"application/nasdata",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  2. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        <_comment>MP4 container format</_comment>
        <glob pattern="*.mp4s"/>
        <sub-class-of type="application/quicktime" />
      </mime-type>
    
      <mime-type type="application/mpeg4-generic"/>
      <mime-type type="application/mpeg4-iod"/>
      <mime-type type="application/mpeg4-iod-xmt"/>
    
      <!-- http://www.iana.org/assignments/media-types/application/msword -->
      <mime-type type="application/msword">
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/Constants.java

        /**
         * The feature for external general entities in XML.
         */
        public static final String FEATURE_EXTERNAL_GENERAL_ENTITIES = "http://xml.org/sax/features/external-general-entities";
    
        /**
         * Feature for external parameter entities in XML.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 3.6K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/log/LogType.java

        /** Indicates processing a child URL due to an exception. */
        PROCESS_CHILD_URL_BY_EXCEPTION,
        /** Indicates an access exception during crawling. */
        CRAWLING_ACCESS_EXCEPTION,
        /** Indicates a general exception during crawling. */
        CRAWLING_EXCEPTION,
        /** Indicates no URL is available in the queue. */
        NO_URL_IN_QUEUE,
        /** Indicates the start of a crawler thread. */
        START_THREAD,
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 2.4K bytes
    - Viewed (0)
  5. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * both sources differently.
         */
        private String lastmod;
    
        /**
         * How frequently the page is likely to change. This value provides general
         * information to search engines and may not correlate exactly to how often
         * they crawl the page. Valid values are:
         * <ul>
         * <li>always</li>
         * <li>hourly</li>
         * <li>daily</li>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  6. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/RobotsTxt.java

        }
    
        /**
         * Returns the most specific directive matching the given user agent.
         * The method finds the longest matching user agent pattern in the directives,
         * excluding the general "*" pattern which matches all bots.
         *
         * @param userAgent the user agent string to match against directives,
         *                 can be null (treated as empty string)
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 10K bytes
    - Viewed (0)
Back to top