<?php
/*
* htdig_setup_configuration.php
*
* Purpose: create a configuration file for use by Htdig programs.
*
* Run this script from the command line using the PHP standalone CGI
* executable program.
*
* @(#) $Header: /home/mlemos/cvsroot/htdiginterface/htdig_setup_configuration.php,v 1.5 2005/02/08 06:09:48 mlemos Exp $
*
*/
/*
* Pull in htdig.php and configuration.php (presumably the htdig_class
* definition and the local site settings, respectively - verify in
* those files), then create the htdig_class object that the rest of
* this script configures.
*/
require 'htdig.php';
require 'configuration.php';
$htdig = new htdig_class();
/*
* Directory that holds the htsearch, htdig, htmerge and htfuzzy
* executables. They should all be in the same directory, which does
* not need to be the original installation directory.
*/
$htdig->htdig_path = $htdig_path;
/*
* Path of the configuration file for this search engine. It does not
* need to be in the original htdig installation directory. To index
* more than one site on the same server, run this script once per
* site, specifying a different configuration file name each time.
*/
$htdig->configuration = $htdig_configuration_file;
/*
* Directory where the database files of this search engine should be
* stored. It does not need to be in the original htdig installation
* directory. To index more than one site on the same server, run this
* script once per site, specifying a different database directory
* each time.
*/
$htdig->database_directory = $htdig_database_directory;
/*
* Extra options to be added to the configuration file. Consult the
* htdig manual to learn about all the available options.
*/
$options = array(
    /*
    * One or more URLs where htdig should start digging. It follows
    * the links contained in the pages at these URLs.
    */
    'start_url' => $site_url,

    /*
    * One or more URLs to which htdig should restrict itself when
    * following links.
    */
    'limit_urls' => $site_url,

    /*
    * Search algorithms to use, each with the weight used to compute
    * the score of a match.
    */
    'search_algorithm' => 'exact:1 endings:0.5',

    /*
    * Patterns used to exclude URLs from being indexed.
    */
    'exclude_urls' => '? browse/ user_options.html search.html',

    /*
    * Number of seconds to wait before proceeding to the next page of
    * the site being crawled.
    */
    'server_wait_time' => 5,

    /*
    * Location of the special template files htdig_header.html,
    * htdig_nomatch.html, htdig_syntaxerror.html and
    * htdig_template.html. The htdig_class uses these templates to
    * parse the results of the htsearch program. Do not change the
    * template files; install them in the path given by this option.
    */
    'template_path' => 'templates',
);
/*
* Generate and save the configuration file in the path specified in
* the $htdig->configuration variable. The value returned by
* GenerateConfiguration() is compared against the empty string;
* anything else is treated as an error message and reported.
*/
$error=$htdig->GenerateConfiguration($options);
if(strcmp($error,""))
{
    echo "Error: $error\n";
    /*
    * Finish with a non-zero exit status so that whatever ran this
    * script from the command line (shell script, cron job, Makefile)
    * can tell that the configuration file was not generated.
    */
    exit(1);
}
?>
|