From: Adam Dickmeiss Date: Mon, 25 Mar 2002 16:11:08 +0000 (+0000) Subject: *** empty log message *** X-Git-Tag: ZMBOT.0.1~4 X-Git-Url: http://git.indexdata.com/?p=tclrobot.git;a=commitdiff_plain;h=bd463f7d1f1610a3c7a3d9e678f5c4ff27f9d546 *** empty log message *** --- diff --git a/robot.tcl b/robot.tcl index 56e33a4..bfe875f 100755 --- a/robot.tcl +++ b/robot.tcl @@ -1,5 +1,5 @@ #!/usr/bin/tclsh -# $Id: robot.tcl,v 1.31 2002/02/28 14:04:11 adam Exp $ +# $Id: robot.tcl,v 1.32 2002/03/25 16:11:08 adam Exp $ # proc RobotFileNext1 {area lead} { # puts "RobotFileNext1 area=$area lead=$lead" @@ -288,12 +288,12 @@ proc RobotHref {url hrefx hostx pathx} { if {[string length $href] > 256} { return 0 } - if {[string first {?} $href] >= 0} { - return 0 - } - if {[string first {?} $url] >= 0 && [string first {?} $href] >= 0} { - return 0 - } +# if {[string first {?} $href] >= 0} { +# return 0 +# } +# if {[string first {?} $url] >= 0 && [string first {?} $href] >= 0} { +# return 0 +# } # get method (if any) if {![regexp {^([^/:]+):(.*)} $href x method hpath]} { set hpath $href @@ -548,7 +548,7 @@ proc RobotTextHtml {url out} { # don't print title of document content if noindex is used if {!$noindex} { puts $out "$title" - regsub -all {} $body { } abody regsub -all -nocase {} $abody {} bbody regsub -all {<[^\>]+>} $bbody {} nbody puts $out ""