<?php 
/* 
 * htdig_setup_configuration.php 
 * 
 * Purpose: create a configuration file for use by Htdig programs. 
 * 
 * Run this script from the command line use PHP standalone CGI 
 * executable program. 
 * 
 * @(#) $Header: /home/mlemos/cvsroot/htdiginterface/htdig_setup_configuration.php,v 1.5 2005/02/08 06:09:48 mlemos Exp $ 
 * 
 */ 
 
    require("htdig.php"); 
    require("configuration.php"); 
 
    $htdig=new htdig_class; 
 
    /* 
     * Where are the executables of htsearch, htdig, htmerge, htfuzzy 
     * located? They should be in the same directory. It does not need 
     * to be in the original instalation directory. 
     */ 
    $htdig->htdig_path=$htdig_path; 
 
    /* 
     * Where this search engine configuration file should be stored? It 
     * does not need to be in the original htdig instalation directory. 
     * If you need to index more than one site in your server run this 
     * script as many times as need specifying different configuration file 
     * names. 
     */ 
    $htdig->configuration=$htdig_configuration_file; 
 
    /* 
     * Where this search engine database files hould be stored? It 
     * does not need to be in the original htdig instalation directory. 
     * If you need to index more than one site in your server run this 
     * script as many times as need specifying different database 
     * directories. 
     */ 
    $htdig->database_directory=$htdig_database_directory; 
 
    /* 
     * Additional options that should be added to the configuration file. 
     * Consult htdig manual to learn about all of them. 
     */ 
    $options=array( 
 
        /* 
         * List of one or more URLs that htdig should start digging. It 
         * will follow the links contained in these URL pages. 
         */ 
        "start_url"=>$site_url, 
 
        /* 
         * List of one or more URLs that htdig should restrict when 
         * following links. 
         */ 
        "limit_urls"=>$site_url, 
 
        /* 
         * List of search algoritms to use and the associated weights that will 
         * be used to compute the score of each match. 
         */ 
        "search_algorithm"=>"exact:1 endings:0.5", 
 
        /* 
         * List of patterns that is used to exclude URLs from being indexed. 
         */ 
        "exclude_urls"=>"? browse/ user_options.html search.html", 
 
        /* 
         * Wait a few seconds before proceeding to the next page of the site 
         * being crawled. 
         */ 
        "server_wait_time"=>5, 
 
        /* 
         * Where the special template files htdig_header.html 
         * htdig_nomatch.html htdig_syntaxerror.html htdig_template.html are 
         * located.  These are special template files used by the htdig_class 
         * to parse htsearch program results. Do not change the template files. 
         * Install them to the path specified by this option. 
         */ 
        "template_path"=>"templates" 
 
    ); 
 
    /* 
     * Generate and save the configuration file in path specified in 
     * $htdig->configuration variable. 
     */ 
    $error=$htdig->GenerateConfiguration($options); 
    if(strcmp($error,"")) 
        echo "Error: $error\n"; 
?>
 
 |