#!/bin/bash
#
# Proxy list scraper (rmccurdy.com).
#
# Fetches proxy listings from several public web pages and appends the
# extracted entries to proxylist.txt in the current working directory.
#
# Requirements (all invoked below): curl, lynx, and a "js" command
# (SpiderMonkey shell, per the original note). A file named sakura.js must
# exist in the current directory; it is prepended to the scraped sakura data
# before that data is run through "js".
#
# Scratch files written in the current directory: tmp, sakura, proxylist.txt.

# Disabled alternative user agent, kept exactly as found:
#ort varagent='"msnbot/2.0b (+http://search.msn.com/msnbot.htm)"'
export varagent='Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.1; SV1)'
export outputdir=/srv/http/nginx/proxy

# rmccurdy.com
# need curl and spidermonkey
#echo "UPDATED: no multi connections support one at a time"
#echo "also no cookie needed for proxyies.my-proxy.com anymore !!?"
#echo "FIXED 04/15/2010 : nntime.com changed script"
#echo "UPDATE 11/09 : crontab the script so it should auto update"
#echo "UPDATE 4/20 : fixed my-proxy.com"
#echo killing cron snort snortsam
#killall snort snortsam cron

# Remove leftovers from a previous run. -f keeps a first run (where none of
# these files exist yet) from printing errors; -- guards the path arguments.
rm -f -- cookie sakura good.txt proxylist.txt
rm -f -- "${outputdir}/elite.txt" "${outputdir}/anony.txt" "${outputdir}/trans.txt"

# proxylist.txt was just removed above, so this guard normally succeeds and
# the download section always runs.
if [ ! -f "proxylist.txt" ]
then
  echo "proxylist.txt not found downloading list"
  sleep 5

  echo "ripping freeproxylists.com"
  sleep 1
  # Build one load_elite_<id>.html URL per matching line of the index page.
  # The command substitution is intentionally unquoted: each whitespace-
  # separated word is treated as one URL.
  for img in $(curl -A "$varagent" -s http://www.freeproxylists.com/elite.php \
    | grep "elite " \
    | sed -e 's/.*elite\///g' \
          -e 's/\.html.*//g' \
          -e 's/^/http:\/\/www.freeproxylists.com\/load_elite_/g' \
          -e 's/$/\.html/g')
  do
    # Turn table-row boundaries into newlines and cell boundaries into ":",
    # then drop everything from the first remaining "<" on each line.
    curl -A "$varagent" -s "$img" \
      | awk '{gsub("</td></tr><tr><td>","\n"); print}' \
      | awk '{gsub("</td><td>",":"); print}' \
      | sed 's/<.*//g' \
      | grep -v "<" >> proxylist.txt
  done

  echo "ripping proxylist.sakura.ne.jp"
  sleep 1
  # Pages 0..6: keep only the lines containing proxy(1..4 calls; the single
  # redirect on "done" truncates tmp once and collects all pages in order.
  for sakura_page in 0 1 2 3 4 5 6
  do
    curl -s -A "$varagent" "http://proxylist.sakura.ne.jp/index.htm?pages=${sakura_page}" \
      | grep 'proxy([1-4]'
  done > tmp
  mv tmp sakura
  # Prepend the local sakura.js to the scraped lines and run the result
  # through the js shell; its output is appended to the proxy list.
  cat sakura.js sakura > tmp
  js tmp >> proxylist.txt

  echo "ripping multiproxy.org"
  # Dump the page as text, remove all spaces, keep lines containing ":".
  lynx -connect_timeout=3 -width=999 -dump -nolist "http://www.multiproxy.org/cgi-bin/search-proxy.pl" \
    | sed 's/ //g' \
    | grep ':' >> proxylist.txt

  echo "ripping nntime.com"
  sleep 1
  rm -f -- tmp
  # NOTE(review): the loop below (and the enclosing "if") continue past this
  # section of the file; the final pipeline is left verbatim so that whatever
  # follows still joins onto it unchanged.
  for i in {01,02,03,04,05,06,07,08,09,10,11,12,13,14,15,16,17}
  do
    curl -A "$varagent" -s "http://nntime.com/proxy-list-$i.htm" -A "SAMSUNG-SGH-E250/1.0 Profile/MIDP-2.0 Configuration/CLDC-1.1 UP.Browser/6.2.3.3.c.1.101 (GUI) MMP/2.0 (compatible; Googlebot-Mobile/2.1; +http://www.google.com/bot.html)" | egrep "(document.write| = )|;<\/script>" |sed -e 's/.*/print("/g' -e 's/