Python 從實際網頁得到 HTML 的兩種方法
1
import urllib
2
3
def downloadhtml1():
    """Fetch http://www.baidu.com with ``urlopen`` and save the body to disk.

    The whole response body is read into memory and then written to the
    hard-coded Windows path used below, replacing any previous download.

    Returns:
        None.

    Raises:
        Network and file-system errors raised by ``urlopen``, ``read`` or
        ``open`` propagate to the caller unchanged.
    """
    # Function-local imports keep this block self-contained. The fallback
    # covers Python 2, where urlopen lives directly in the ``urllib`` module.
    from contextlib import closing
    try:
        from urllib.request import urlopen  # Python 3
    except ImportError:
        from urllib import urlopen  # Python 2

    # closing() releases the connection even if read() raises, and works
    # whether or not the response object supports ``with`` by itself.
    with closing(urlopen("http://www.baidu.com")) as sock:
        htmlContent = sock.read()

    # Binary mode stores the downloaded bytes untouched (no newline
    # translation on Windows, and bytes are what read() returns on Python 3).
    # 'w' instead of 'a' so repeated runs do not stack several copies of the
    # page in one file.
    with open('D:\\baidu1.html', 'wb') as dirInfo:
        dirInfo.write(htmlContent)
10
11
def cbk(a, b, c):
    """Print download progress; intended as a ``urlretrieve`` report hook.

    Args:
        a: Number of blocks transferred so far.
        b: Size of one block, in bytes.
        c: Total size of the download in bytes. A value of zero or less
            means the size is not known.

    Returns:
        None. One line is printed to standard output per call: a percentage
        with two decimals when the total is known, otherwise the number of
        bytes transferred so far.
    """
    if c <= 0:
        # No usable total: a percentage would be negative (c == -1) or
        # divide by zero (c == 0), so report the raw byte count instead.
        print('%d bytes' % (a * b))
        return

    # The final block is usually only partly filled, so a * b can overshoot
    # the real size; clamp the figure at 100.
    per = min(100.0, 100.0 * a * b / c)
    print('%.2f%%' % per)
16
17
def downloadhtml2():
    """Download http://www.baidu.com straight to a file with ``urlretrieve``.

    The page is saved to the hard-coded Windows path used below, and ``cbk``
    is passed as the report hook so progress is printed during the transfer.

    Returns:
        None.

    Raises:
        Network and file-system errors raised by ``urlretrieve`` propagate
        to the caller unchanged.
    """
    # Function-local import with a fallback: urlretrieve lives in
    # ``urllib.request`` on Python 3 and directly in ``urllib`` on Python 2.
    try:
        from urllib.request import urlretrieve  # Python 3
    except ImportError:
        from urllib import urlretrieve  # Python 2

    url = 'http://www.baidu.com'
    local = 'd:\\baidu2.html'
    urlretrieve(url, local, cbk)
21
22
# Script entry point: run both download approaches, one after the other,
# only when this file is executed directly (not when it is imported).
if __name__ == '__main__':
    for fetch in (downloadhtml1, downloadhtml2):
        fetch()

2

3

4

5

6

7

8

9

10

11

12

13

14

15

16

17

18

19

20

21

22

23

24
