set a useragent
This commit is contained in:
parent
8c4421108b
commit
2b46e8899f
1 changed file with 9 additions and 3 deletions
12
urls.sh
12
urls.sh
|
@ -1,3 +1,9 @@
|
||||||
wget --spider --force-html -r -l1 -H $@ 2>&1 \
|
wget --spider --force-html -r -l1 -H -U 'searplbot/1.0' $@ 2>&1 | tee wg
|
||||||
| grep '^--' | awk '{ print $3 }' \
|
|
||||||
| grep -v '\.\(css\|js\|png\|gif\|jpg\|txt\|ico\|ttf\|svg\)$'
|
grep '^--' wg | awk '{ print $3 }' \
|
||||||
|
| grep -v '\.\(css\|js\|png\|gif\|jpg\|txt\|ico\|ttf\|svg\)$' \
|
||||||
|
| tee ur
|
||||||
|
|
||||||
|
sleep 10
|
||||||
|
|
||||||
|
php crawl.php $(cat ur)
|
||||||
|
|
Loading…
Reference in a new issue