Search Options

Results per page
Sort
Preferred Languages
Advanced

Results 1 - 10 of 83 for command (0.03 sec)

  1. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractor.java

            this.tempDir = tempDir;
        }
    
        /**
         * Sets the command to execute for text extraction.
         * @param command The command to set.
         */
        public void setCommand(final String command) {
            this.command = command;
        }
    
        /**
         * Sets the timeout for command execution.
         * @param executionTimeout The execution timeout in milliseconds.
         */
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 16K bytes
    - Viewed (0)
  2. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/CommandExtractorTest.java

            final String content = "TEST";
            final File contentFile = createContentFile(".txt", content.getBytes());
    
            final CommandExtractor extractor = new CommandExtractor();
            extractor.command = getCommand(scriptFile);
            final Map<String, String> params = new HashMap<String, String>();
            final ExtractData text = extractor.getText(new FileInputStream(contentFile), params);
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 9.8K bytes
    - Viewed (0)
  3. fess-crawler/src/main/java/org/codelibs/fess/crawler/entity/SitemapUrl.java

         * time they are accessed. The value "never" should be used to describe
         * archived URLs.
         *
         * Please note that the value of this tag is considered a hint and not a
         * command. Even though search engine crawlers may consider this information
         * when making decisions, they may crawl pages marked "hourly" less
         * frequently than that, and they may crawl pages marked "yearly" more
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 6.5K bytes
    - Viewed (0)
  4. fess-crawler/src/main/java/org/codelibs/fess/crawler/client/ftp/FtpClient.java

    import org.apache.commons.lang3.StringUtils;
    import org.apache.commons.net.ftp.FTP;
    import org.apache.commons.net.ftp.FTPClient;
    import org.apache.commons.net.ftp.FTPClient.NatServerResolverImpl;
    import org.apache.commons.net.ftp.FTPClientConfig;
    import org.apache.commons.net.ftp.FTPFile;
    import org.apache.commons.net.ftp.FTPFileFilters;
    import org.apache.commons.net.ftp.FTPSClient;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 39.5K bytes
    - Viewed (0)
  5. fess-crawler-lasta/src/main/resources/crawler/extractor.xml

    				"text/vnd.iptc.anpa",
    				"text/vnd.iptc.newsml",
    				"text/vnd.iptc.nitf",
    				"text/vnd.latex-z",
    				"text/vnd.motorola.reflex",
    				"text/vnd.ms-mediapackage",
    				"text/vnd.net2phone.commcenter.command",
    				"text/vnd.si.uricatalogue",
    				"text/vnd.sun.j2me.app-descriptor",
    				"text/vnd.trolltech.linguist",
    				"text/vnd.wap.si",
    				"text/vnd.wap.sl",
    				"text/vnd.wap.wml",
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Aug 01 21:40:30 UTC 2020
    - 49K bytes
    - Viewed (0)
  6. fess-crawler/src/main/resources/org/codelibs/fess/crawler/mime/tika-mimetypes.xml

        </magic>
        <!-- XML files can start with a comment but then must not contain processing instructions.
             This should be rare so we assign lower priority here. Priority is also lower than text/html magics
             for them to be preferred for HTML starting with comment.-->
        <magic priority="30">
          <match value="&lt;!--" type="string" offset="0"/>
        </magic>
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Mar 13 08:18:01 UTC 2025
    - 320.1K bytes
    - Viewed (1)
  7. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/AbstractXmlExtractor.java

    import java.util.regex.Pattern;
    
    import org.apache.commons.io.ByteOrderMark;
    import org.apache.commons.io.input.BOMInputStream;
    import org.apache.commons.text.translate.AggregateTranslator;
    import org.apache.commons.text.translate.CharSequenceTranslator;
    import org.apache.commons.text.translate.EntityArrays;
    import org.apache.commons.text.translate.LookupTranslator;
    import org.apache.commons.text.translate.NumericEntityUnescaper;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Jul 06 02:13:03 UTC 2025
    - 8.5K bytes
    - Viewed (0)
  8. fess-crawler/src/main/java/org/codelibs/fess/crawler/extractor/impl/TikaExtractor.java

    import java.util.Map;
    import java.util.Properties;
    import java.util.concurrent.ConcurrentHashMap;
    import java.util.function.BiConsumer;
    import java.util.stream.Collectors;
    
    import org.apache.commons.io.output.DeferredFileOutputStream;
    import org.apache.commons.lang3.SystemUtils;
    import org.apache.logging.log4j.LogManager;
    import org.apache.logging.log4j.Logger;
    import org.apache.tika.config.TikaConfig;
    import org.apache.tika.detect.Detector;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Thu Aug 07 02:55:08 UTC 2025
    - 30.7K bytes
    - Viewed (0)
  9. README.md

    - **Transformers**: Data transformation and enrichment
    - **Filters**: URL filtering with regex patterns
    - **Rules**: Content processing rules and validation
    
    ## Building and Testing
    
    ### Build Commands
    
    ```bash
    # Build all modules
    mvn clean install
    
    # Build without tests
    mvn clean install -DskipTests
    
    # Build specific module
    mvn clean install -pl fess-crawler
    
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sun Aug 31 05:32:52 UTC 2025
    - 15.3K bytes
    - Viewed (0)
  10. fess-crawler/src/test/java/org/codelibs/fess/crawler/extractor/impl/ApiExtractorTest.java

    import javax.servlet.http.HttpServletRequest;
    import javax.servlet.http.HttpServletResponse;
    
    import org.apache.commons.fileupload.FileItem;
    import org.apache.commons.fileupload.FileUploadException;
    import org.apache.commons.fileupload.disk.DiskFileItemFactory;
    import org.apache.commons.fileupload.servlet.ServletFileUpload;
    import org.codelibs.fess.crawler.entity.ExtractData;
    Registered: Sun Sep 21 03:50:09 UTC 2025
    - Last Modified: Sat Mar 15 06:52:00 UTC 2025
    - 5.4K bytes
    - Viewed (0)
Back to top