Search Options

Results per page
Sort
Preferred Languages
Advance

Results 1 - 9 of 9 for extracted (1.28 sec)

  1. src/main/java/org/codelibs/fess/crawler/transformer/FessXpathTransformer.java

            }
            resultData.setEncoding(charsetName);
        }
    
        /**
         * Normalizes the extracted data, particularly handling title normalization.
         *
         * @param responseData the response data from crawling
         * @param dataMap the data map containing extracted field values
         */
        protected void normalizeData(final ResponseData responseData, final Map<String, Object> dataMap) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Dec 12 13:58:40 UTC 2025
    - 54.6K bytes
    - Viewed (0)
  2. src/test/java/jcifs/smb/SmbFileIntegrationTest.java

            assertEquals("file.txt", file.getName(), "Name should be extracted correctly");
            assertTrue(file.getPath().endsWith("/shared/path/file.txt"), "Path should end correctly");
            assertEquals("shared", file.getShare(), "Share should be extracted correctly");
            assertNotNull(file.getParent(), "Parent should not be null");
    Registered: Sat Dec 20 13:44:44 UTC 2025
    - Last Modified: Sat Aug 30 05:58:03 UTC 2025
    - 56K bytes
    - Viewed (0)
  3. src/main/java/org/codelibs/fess/ldap/LdapManager.java

                        }
                        consumer.accept(entryDn);
                    }
                }
            }
        }
    
        /**
         * Extracts the role name from an LDAP entry DN.
         *
         * @param entryDn the LDAP entry DN
         * @return the extracted role name, or null if not found
         */
        protected String getSearchRoleName(final String entryDn) {
            if (entryDn == null) {
                return null;
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 86.3K bytes
    - Viewed (0)
  4. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    		class="org.codelibs.fess.crawler.extractor.impl.MsPowerPointExtractor" />
    	<component name="msPublisherExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.MsPublisherExtractor" />
    	<component name="msVisioExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.MsVisioExtractor" />
    	<component name="pdfExtractor"
    		class="org.codelibs.fess.crawler.extractor.impl.PdfExtractor" />
    	<component name="lhaExtractor"
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 03:46:53 UTC 2025
    - 50.1K bytes
    - Viewed (0)
  5. src/main/resources/fess_config.properties

    dc:title=title:string\n\
    
    # html
    
    # XPath to extract main content from HTML documents.
    crawler.document.html.content.xpath=//BODY
    # XPath to extract language attribute from HTML documents.
    crawler.document.html.lang.xpath=//HTML/@lang
    # XPath to extract digest (description) from HTML documents.
    crawler.document.html.digest.xpath=//META[@name='description']/@content
    # XPath to extract canonical URL from HTML documents.
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Thu Dec 11 09:47:03 UTC 2025
    - 54.8K bytes
    - Viewed (0)
  6. src/main/resources/fess_label_fr.properties

    labels.disabled=Désactivé
    labels.pathmap_pt_crawling=Exploration
    labels.pathmap_pt_displaying=Affichage
    labels.pathmap_pt_both=Exploration/Affichage
    labels.pathmap_pt_stored=Conversion d'URL extraite
    labels.regular_name=Nom régulier
    labels.duplicate_name=Nom en double
    labels.duplicate_host_configuration=Hôte en double
    labels.duplicate_host_title_details=Hôte en double
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Sat Dec 13 02:21:17 UTC 2025
    - 49.2K bytes
    - Viewed (0)
  7. src/main/java/org/codelibs/fess/helper/ViewHelper.java

            }
            buf.append(segment);
            return buf.toString();
        }
    
        /**
         * Gets the site path for display purposes.
         * Extracts and formats the site path from document URL.
         *
         * @param docMap the document data map
         * @return the formatted site path
         */
        public Object getSitePath(final Map<String, Object> docMap) {
    Registered: Sat Dec 20 09:19:18 UTC 2025
    - Last Modified: Fri Nov 28 16:29:12 UTC 2025
    - 52.6K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/http/HcHttpClient.java

                httpClientPropertyMap.put(name, value);
            }
        }
    
        /**
         * Processes robots.txt for the given URL.
         * This method fetches and parses the robots.txt file to extract disallow/allow rules
         * and sitemap information.
         *
         * @param url The URL to process robots.txt for
         */
        protected void processRobotsTxt(final String url) {
            if (StringUtil.isBlank(url)) {
    Registered: Sat Dec 20 11:21:39 UTC 2025
    - Last Modified: Sun Nov 23 12:19:14 UTC 2025
    - 53.7K bytes
    - Viewed (0)
  9. src/main/java/jcifs/smb/SmbSessionImpl.java

            // Simple implementation - could be enhanced with proper cluster discovery
            String hostname = serverAddress.getHostName();
            if (hostname != null && hostname.contains(".")) {
                // Extract potential cluster name from hostname
                String[] parts = hostname.split("\\.");
                if (parts.length > 1) {
                    return parts[0]; // Use first part as cluster name
                }
            }
    Registered: Sat Dec 20 13:44:44 UTC 2025
    - Last Modified: Sun Aug 31 08:00:57 UTC 2025
    - 68.9K bytes
    - Viewed (0)
Back to top