Sample File Contents

# archive.cfg (Archive configuration, normally edited through the web interface)
#
# Archive Configuration file for Webglimpse
#
# title String = Title of search as placed in wgindex.html
#
# urlpath http://domain.com/path = URL to archive directory
# (unused in v1.6 & above)
#
# traverse_type n = 0 for Traversal of local links only
# = 1 for Traversal of remote and local links
# = 2 for Subdirectory-based archive
#
# explicit_only n = 0 for traversal of any link, explicit or non-explicit
# = 1 for traversal of only explicit links to remote sites
#
# numhops n = # of hops to traverse from starting page
#
# nhhops n = # of hops to allow for each neighborhood
#
# local_limit n = maximum # of local pages to index
#
# remote_limit n = maximum # of remote pages to index
#
# addboxes n = 0 to NOT add search boxes to all indexed pages
# = 1 to add search boxes to all indexed pages
#
# vhost Hostname = name of virtual host to use for this index
#
# usemaxmem n = 0 to NOT use maximum available memory
# = 1 to use maximum memory to speed up indexing
#
# urllist Url1,Url2,.. = List of starting URLs or Directories to index
#
#

title My Search Page
urlpath http://myserver.com/path/to/directory
traverse_type 0
explicit_only 1
numhops 2
nhhops 1
local_limit 99999
remote_limit 250
addboxes 0
vhost myserver.com
usemaxmem 0
urllist http://myserver.com/directory1,http://myserver.com/directory2


wgsites.conf

SERVER tucson.com
PORT 80
DOCUMENTROOT /home/WWW
USERDIR public_html
DIRECTORYINDEX index.html index.htm index.shtml
ALIAS /icons/ /home/httpd/icons/
ALIAS /msql/ /home/msql/docs/
SCRIPTALIAS /cgi-bin/ /home/httpd/cgi-bin/


wgfilter-index

Deny (^|/)JavaScript:
Deny \.gif$
Deny \.jpeg$
Deny \.mpeg$
Deny \.jpg$
Deny \.ppt$
Deny \.PPT$
Deny \.au$
Deny \.wav$
Deny \.mov$
Deny \.htm$
Deny \.html$
Deny \.gz$
Deny \.Z$
Deny \.tgz$
Deny \.txt$
Deny \.zip$
Deny \.ps$
Deny \.exe$
Deny (^|/)wgindex\.html$
Deny (^|/)wgall\.html$
Deny \.wg
Deny \.glimpse_
Deny (^|/)indexing-in-progress$
Deny (^|/)wgreindex$
Deny (^|/)archive\.cfg$
Deny (^|/)\.nh\.
Deny ~$
Deny (^|/)_vti
Deny (^|/)\.htpasswd$
Deny (^|/)\.htgroup$


wg_toindex

/var/www/html/document1.html   http://myserver.domain.com/document1.html  1
/var/www/html/document2.html   http://myserver.domain.com/document2.html  1
/var/www/html/document3.html   http://myserver.domain.com/document3.html  1
/var/www/html/document4.html   http://myserver.domain.com/document4.html  1
/var/www/html/document5.html   http://myserver.domain.com/document5.html  1