Script to scan Alexa's top 1m websites

This commit is contained in:
Julien Vehent 2014-01-09 11:52:17 -05:00
parent af7b4ce18c
commit e4ea957c8d
2 changed files with 1000018 additions and 0 deletions

18
top1m/testtop1m.sh Executable file
View file

@ -0,0 +1,18 @@
#!/usr/bin/env bash
#
# Scan the sites listed in top-1m.csv with cipherscan, in batches.
#
# For every line of ./top-1m.csv the second comma-separated field is taken as
# a host name. Port 443 of the host is probed with tcping; when the probe
# succeeds, ../cipherscan is started in the background with its output
# written to results/<host>. After each batch of 50 lines the script sleeps
# for 10 seconds before starting the next batch.
#
# Run from the directory that contains top-1m.csv. Requires `tcping` on PATH
# and the `cipherscan` executable in the parent directory.

set -u

readonly sites_file="top-1m.csv"
readonly batch_size=50    # number of list lines handled between pauses
readonly batch_pause=10   # seconds to sleep after each full batch

# Fail early instead of looping over a list that cannot be read.
if [[ ! -r "$sites_file" ]]; then
  printf 'error: cannot read %s\n' "$sites_file" >&2
  exit 1
fi

mkdir -p results || exit 1

i=1          # 1-based line number of the first site in the current batch
in_batch=0   # lines consumed so far in the current batch

# The list is streamed exactly once, starting at line 1, so the first entry
# is included and the file length does not need to be known in advance.
# It is read on fd 3 so that the commands run inside the loop cannot consume
# list entries through their standard input.
while IFS= read -r -u 3 t || [[ -n "$t" ]]; do
  if (( in_batch == 0 )); then
    # Progress message text is kept unchanged from the earlier version.
    echo "processings sites $i to $((i + batch_size))"
  fi
  in_batch=$((in_batch + 1))

  # Skip empty fields and hosts that do not answer on 443 (tcping exits
  # non-zero); otherwise launch the scan without waiting for it.
  if [[ -n "$t" ]] && tcping -u 2000000 "$t" 443; then
    ../cipherscan "$t:443" > "results/$t" &
  fi

  if (( in_batch == batch_size )); then
    sleep "$batch_pause"
    i=$((i + batch_size))
    in_batch=0
  fi
done 3< <(cut -d ',' -f 2 "$sites_file")

# Let the scans that are still running finish writing their result files.
wait

1000000
top1m/top-1m.csv Normal file

File diff suppressed because it is too large Load diff