#!/usr/local/bin/tclsh8.3

# Copyright 2003 Jose Nazario <jose@monkey.org>
# All rights reserved.
#
# Redistribution and use in source and binary forms, with or without
# modification, are permitted provided that the following conditions
# are met:
# 1. Redistributions of source code must retain the above copyright
#    notice, this list of conditions and the following disclaimer.
# 2. Redistributions in binary form must reproduce the above copyright
#    notice, this list of conditions and the following disclaimer in the
#    documentation and/or other materials provided with the distribution.
# 3. All advertising materials mentioning features or use of this software
#    must display the following acknowledgement:
#       This product contains software developed by Jose Nazario.
#
# THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
# IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
# OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
# IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
# INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
# NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
# DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
# THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
# (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
# THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

package require Tnm
package require struct
package require cmdline
package require htmlparse

proc mycb {tag slash param text} {
	global todo
	global depth

	foreach data $param {
		if {[regexp -nocase "href=" $data]} {
			regsub -nocase {^href=} $data "" data
			regsub -nocase -all {\"} $data "" data
			if {$depth < 2} {
				lappend todo $data
			}
		}
	}
}

# implements a basic stack pop (no push needed here).

proc lpop {_L} {
	upvar 1 $_L L
	set res [lindex $L 0]	
	set L [lrange $L 1 end]
	set res
}

set depth 0
set todo $argv
lappend todo "ENDARGV"

while {[llength $todo]} {
	set page [lpop todo]
	if {$page == "ENDARGV"} {
		lappend todo "ALLDONE"
		continue
	}
	if {$page == "ALLDONE" } {
		incr depth
		break
	}
	if {$page == ""} {
		continue
	}
	puts "==> checking $page"
	if [catch {set page [http get $page "/tmp/http-out"]}] {
		puts "    link not found: $page"
		continue
	}

	set f [open "/tmp/http-out" "r"]
	set r [read $f]

	foreach line [split $r "\n"] {
		catch {::htmlparse::parse -cmd mycb -incvar err $line}
	}

	close $f
}

puts "linkcheck ending"
