#! /bin/sh
## special handler for altavista, since they only hand out chunks of 10 at
## a time.  Tries to isolate out results without the leading/trailing trash.
## multiword arguments are foo+bar, as usual.
## Second optional arg switches the "what" field, to e.g. "news"

# A search term is mandatory; complain on stderr and fail without one.
if test "${1}" = "" ; then
  echo 'Needs an argument to search for!' >&2
  exit 1
fi

# WHAT fills the "what" field of the query.  Give it an explicit default so
# the request never carries an empty what= (or a stray WHAT inherited from
# the environment); an optional second argument overrides it, e.g. "news".
WHAT="web"
test "${2}" && WHAT="${2}"

# convert multiple args: join every argument into one term, words separated
# by "+".  "$*" is quoted so glob characters in the arguments (*, ?, [...])
# are not expanded against the current directory, and printf is used because
# echo could swallow an argument such as -n.  Leading/trailing spaces are
# dropped and runs of spaces collapse to one "+", matching what the former
# unquoted word-splitting produced.
# NOTE: "$*" covers all arguments, so the optional second argument that the
# script also uses for the "what" field ends up in the search term as well.
PLUSARG="$(printf '%s\n' "$*" | sed -e 's/^ *//' -e 's/ *$//' -e 's/  */+/g')"

# Plug in arg.  only doing simple-q for now; pg=aq for advanced-query
# embedded quotes define phrases; otherwise it goes wild on multi-words
QB="GET /cgi-bin/query?pg=q&what=${WHAT}&fmt=c&q=\"${PLUSARG}\""

# ping 'em once, to get the routing warm
nc -z -w 8 www.altavista.digital.com 24015 2> /dev/null
echo "=== Altavista ==="

# Results come back ten per request, so step the stq= start offset from 0
# through 350 in tens, sending one request per offset and keeping only the
# lines that begin with a result link.
xx=0
while test "${xx}" -le 350 ; do
  # printf rather than echo: the request text must go out verbatim.
  printf '%s\n' "${QB}&stq=${xx}" | nc -w 15 www.altavista.digital.com 80 | \
  grep -E '^<a href="http://'
  xx=$((xx + 10))
done

exit 0

# old filter stuff
# Never executed: the script has already left via "exit 0" above.  Kept as a
# record of an earlier filter.  The sed program prints only the lines in the
# range that starts at a "Documents ... matching ... query " line and ends at
# a "query?...stq=... Document" line, and deletes everything else.
  sed -e '/Documents .* matching .* query /,/query?.*stq=.* Document/p' \
  -e d


Name Type Size Permission Actions
contrib Folder 0755
README File 239 B 0644
alta File 1.11 KB 0644
bsh File 487 B 0644
dist.sh File 883 B 0644
irc File 1.85 KB 0644
iscan File 1005 B 0644
ncp File 1.43 KB 0644
probe File 2.07 KB 0644
web.gz File 2.5 KB 0644
webproxy.gz File 2.69 KB 0644
webrelay File 1.52 KB 0644
websearch File 2.92 KB 0644