- 論壇徽章:
- 0
|
爬糗事的一個小程序，很簡單
昨天開始在看py 爬蟲
但是tm 的 看不懂。
例子運(yùn)行也失敗了
想了想 用shell 寫了個入門的
VirtualBox_Ubuntu_06_01_2016_13_55_17.png (253.21 KB, 下載次數: 89)
下載附件
2016-01-06 14:00 上傳
- #!/bin/bash
- page=1  # number of the listing page used in the download URL; get_html sets it to its argument + 1 after showing a page
- # Download one listing page, extract the joke text and show it entry by entry.
- # Arguments: $1 - page number to fetch (defaults to the global $page)
- # Globals:   page (written: set to the fetched page number + 1 on success)
- # Files:     fun (raw HTML) and f (extracted text), both in the current directory
- # Returns:   0 on success, 1 if the download fails or no content was extracted
- function get_html() {
-   local n=${1:-$page}
-   # The user-agent previously contained mis-decoded full-width punctuation and
-   # the URL lacked a scheme and a complete host name, so curl could not resolve it.
-   # NOTE(review): host assumed to be www.qiushibaike.com - confirm.
-   local ua="Mozilla/4.0 (compatible; MSIE 6.0; Windows NT 5.0)"
-   local url="http://www.qiushibaike.com/8hr/page/${n}"
-
-   if ! curl -fsSL -A "$ua" "$url" >fun; then
-     echo "Failed to download page${n}" >&2
-     return 1
-   fi
-   echo "This is page${n}"
-
-   # Keep only the <div class="content"> ... </div> ranges, blank out lines that
-   # start with a tag, and drop lines that are empty or contain only spaces.
-   sed -n '/<div class="content">/,/<\/div>/{s/^<.*//;/^ *$/d;p;}' fun >f
-   if [[ ! -s f ]]; then
-     echo "No content found on page${n}" >&2
-     return 1
-   fi
-
-   read_by_line
-   page=$((n + 1))
- }
-
- # Main loop: show pages one after another, asking before each further page.
- # Iterates instead of recursing through get_html, so the call stack no longer
- # grows with every page and page 1 is fetched exactly once.
- # Globals:   page (read; advanced by get_html)
- # Returns:   0 when the user declines or stdin is closed, 1 if a page fails
- function have_fun() {
-   local answer
-   echo "have fun"
-   while true; do
-     get_html "$page" || return 1
-     echo "Continue? [y|N]"
-     # Stop on end-of-input; otherwise this loop would fetch pages forever.
-     read -r answer || return 0
-     if [[ $answer == [Nn] ]]; then
-       return 0
-     fi
-   done
- }
- # Show the extracted text in file "f" one line (one entry) at a time.
- # After each entry the user is asked on the terminal whether to continue;
- # answering N or n terminates the whole script.
- # Files:   f (read) - one entry per line, with "<br/>" marking line breaks
- # Input:   the answer is read from /dev/tty because stdin of the loop is "f"
- function read_by_line() {
-   local line reply
-   clear
-   # No "IFS=" here on purpose: leading/trailing whitespace of each line is
-   # trimmed. -r keeps backslashes in the text intact.
-   while read -r line; do
-     echo
-     # Quoted expansion: the text must not be glob-expanded or word-split.
-     # "<br/>" becomes a real newline without forking sed for every line.
-     printf '%s\n' "${line//<br\/>/$'\n'}"
-     echo
-     echo "Continue [y|N]"
-     read -r reply </dev/tty
-     if [[ $reply == [Nn] ]]; then
-       exit
-     fi
-   done <f
- }
- # Remove the scratch files on every exit path. The functions above leave via
- # "exit" when the user declines, so a plain "rm" placed after have_fun would
- # not be reached in that case.
- trap 'rm -f -- f fun' EXIT
- have_fun
複製代碼 |
|