From: Adam Dickmeiss Date: Mon, 26 Feb 2001 22:51:51 +0000 (+0000) Subject: Added config for zebra/zmbol. X-Git-Tag: ZMBOT.0.1~27 X-Git-Url: http://lists.indexdata.dk/?a=commitdiff_plain;h=e80b5c034f20b43530880ba530a8e1de06646726;p=tclrobot.git Added config for zebra/zmbol. --- diff --git a/robot.tcl b/robot.tcl index 9b672cd..c7d85c4 100755 --- a/robot.tcl +++ b/robot.tcl @@ -1,5 +1,5 @@ #!/usr/bin/tclsh -# $Id: robot.tcl,v 1.12 2001/01/23 14:28:41 adam Exp $ +# $Id: robot.tcl,v 1.13 2001/02/26 22:51:51 adam Exp $ # proc RobotFileNext1 {area lead} { puts "RobotFileNext1 area=$area lead=$lead" @@ -264,6 +264,9 @@ proc RobotHref {url hrefx hostx pathx} { if {[string first { } $href] >= 0} { return 0 } + if {[string length $href] > 256} { + return 0 + } if {[string first {?} $url] >= 0 && [string first {?} $href] >= 0} { return 0 } @@ -757,7 +760,7 @@ set i 0 set l [llength $argv] if {$l < 2} { - puts {tclrobot: usage [-j jobs] [-c count] [-d domain] [url ..]} + puts {tclrobot: usage [-j jobs] [-i idle] [-c count] [-d domain] [url ..]} puts " Example: -c 3 -d '*.dk' http://www.indexdata.dk/" exit 1 } @@ -784,6 +787,12 @@ while {$i < $l} { } lappend domains $dom } + -i* { + set idleTime [string range $arg 2 end] + if {![string length $idleTime]} { + set idleTime [lindex $argv [incr i]] + } + } default { set href $arg if {[RobotHref http://www.indexdata.dk/ href host path]} { diff --git a/tab/zebra.cfg b/tab/zebra.cfg new file mode 100644 index 0000000..0f77308 --- /dev/null +++ b/tab/zebra.cfg @@ -0,0 +1,15 @@ +# Simple Zebra configuration file +# $Id: zebra.cfg,v 1.1 2001/02/26 22:51:51 adam Exp $ +# +# Where the schema files, attribute files, etc are located. +profilePath: .:../../zebra/tab:../../yaz/tab + +# Files that describe the attribute sets supported. +attset: bib1.att +attset: gils.att +attset: explain.att + +recordtype: grs.sgml + +storekeys: 1 +storedata: 1 diff --git a/tab/zmbot.abs b/tab/zmbot.abs new file mode 100644 index 0000000..9395b88 --- /dev/null +++ b/tab/zmbot.abs @@ -0,0 +1,30 @@ +# $Id: zmbot.abs,v 1.1 2001/02/26 22:51:51 adam Exp $ + +name gils +reference GILS-schema +attset gils.att +tagset tagsetm.tag +tagset tagsetg.tag + +esetname F @ + +#all Any + +elm (1,1) schemaIdentifier - +elm (1,10) rank - +elm (1,12) url - +elm (1,14) localControlNumber - +elm (2,1) title !:w,!:p,!:s +# + +elm distance distance - +elm si si - +elm si/date date - +elm si/format format - +elm publisher publisher - +elm publisher/identifier identifier Linkage:0 +elm publisher/type type Linkage-Type:0 +elm cr cr - +elm cr/identifier identifier - +elm cr/description description - +elm documentcontent content any:w