#! /bin/sh ## special handler for altavista, since they only hand out chunks of 10 at ## a time. Tries to isolate out results without the leading/trailing trash. ## multiword arguments are foo+bar, as usual. ## Second optional arg switches the "what" field, to e.g. "news" test "${1}" = "" && echo 'Needs an argument to search for!' && exit 1 WHAT="web" test "${2}" && WHAT="${2}" # convert multiple args PLUSARG="`echo $* | sed 's/ /+/g'`" # Plug in arg. only doing simple-q for now; pg=aq for advanced-query # embedded quotes define phrases; otherwise it goes wild on multi-words QB="GET /cgi-bin/query?pg=q&what=${WHAT}&fmt=c&q=\"${PLUSARG}\"" # ping 'em once, to get the routing warm nc -z -w 8 www.altavista.digital.com 24015 2> /dev/null echo "=== Altavista ===" for xx in 0 10 20 30 40 50 60 70 80 90 100 110 120 130 140 150 160 170 180 \ 190 200 210 220 230 240 250 260 270 280 290 300 310 320 330 340 350 ; do echo "${QB}&stq=${xx}" | nc -w 15 www.altavista.digital.com 80 | \ egrep '^<a href="http://' done exit 0 # old filter stuff sed -e '/Documents .* matching .* query /,/query?.*stq=.* Document/p' \ -e d
Name | Type | Size | Permission | Actions |
---|---|---|---|---|
contrib | Folder | 0755 |
|
|
README | File | 239 B | 0644 |
|
alta | File | 1.11 KB | 0644 |
|
bsh | File | 487 B | 0644 |
|
dist.sh | File | 883 B | 0644 |
|
irc | File | 1.85 KB | 0644 |
|
iscan | File | 1005 B | 0644 |
|
ncp | File | 1.43 KB | 0644 |
|
probe | File | 2.07 KB | 0644 |
|
web.gz | File | 2.5 KB | 0644 |
|
webproxy.gz | File | 2.69 KB | 0644 |
|
webrelay | File | 1.52 KB | 0644 |
|
websearch | File | 2.92 KB | 0644 |
|