今天得了一批域名,需要把域名解析成ip
因為量比較大,所以采用了多進程和隊列的方式。
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
|
from multiprocessing import Process, Queue, Pool
import multiprocessing
import os
import queue
import socket


def write(q, lock, filename):
    """Resolve every hostname taken from ``q`` and append the results to a file.

    Each result is written as one ``"<hostname> <ip>"`` line. A hostname that
    cannot be resolved is recorded with the placeholder ``"unknow"``.

    Args:
        q: Queue of hostname strings shared by all workers.
        lock: Lock (context manager) shared by all workers; serializes
            access to the output file.
        filename: Path of the result file, opened in append mode.
    """
    while True:
        # get_nowait() instead of "while not q.empty(): q.get()": another
        # worker may take the last item between the check and the blocking
        # get(), which would leave this worker waiting forever.
        try:
            url = q.get_nowait()
        except queue.Empty:
            break
        print(url)
        try:
            ip = socket.gethostbyname(url)
        except (OSError, ValueError):
            # Resolution failures (socket.gaierror is an OSError) and names
            # that cannot be IDNA-encoded (UnicodeError is a ValueError).
            ip = "unknow"
        print(ip)
        # Hold the lock across open/write/close so the buffered data is
        # flushed to disk before another process may write.
        with lock:
            with open(filename, 'a+') as f:
                f.write(url + " " + ip + "\n")


def readurl(q, n):
    """Put every non-blank line of the chunk file ``<n>.txt`` on the queue.

    Args:
        q: Queue that receives the stripped lines.
        n: Index of the chunk file to read.

    Returns:
        The same queue object ``q``.
    """
    with open(str(n) + '.txt', 'r') as f:
        for line in f:
            host = line.strip()
            if host:  # a blank line is not a hostname
                q.put(host)
    return q


def multi(urllist, n):
    """Split the file ``urllist`` into ``n`` chunk files ``0.txt`` .. ``<n-1>.txt``.

    Lines are distributed in order. When the line count is not a multiple of
    ``n``, the first ``len(lines) % n`` chunk files receive one extra line so
    that no input line is dropped.

    Args:
        urllist: Path of the input file, one entry per line.
        n: Number of chunk files to create in the current directory.
    """
    with open(urllist, 'r') as f:
        lines = f.readlines()
    line, extra = divmod(len(lines), n)
    print(line)
    start = 0
    for m in range(n):
        end = start + line + (1 if m < extra else 0)
        # 'w' rather than 'a+': a chunk file left over from an earlier run
        # must be replaced, not appended to.
        with open(str(m) + '.txt', 'w') as f1:
            f1.writelines(lines[start:end])
        start = end


def remove(n):
    """Delete the chunk files ``0.txt`` .. ``<n-1>.txt`` and print a notice."""
    for i in range(n):
        os.remove(str(i) + '.txt')
    print("######清除臨時文件######")


def main():
    """Split ``url.txt``, resolve all entries with a process pool, write ``test.txt``."""
    manager = multiprocessing.Manager()
    q = manager.Queue()
    lock = manager.Lock()
    m = 5                  # number of worker processes
    urllist = "url.txt"    # input file with the names to resolve
    filename = "test.txt"  # file the results are appended to
    multi(urllist, m)
    try:
        # Fill the queue completely before starting workers so that none of
        # them sees a temporarily empty queue and exits early.
        for i in range(m):
            readurl(q, i)
        p = Pool(m)
        results = [p.apply_async(write, args=(q, lock, filename))
                   for _ in range(m)]
        p.close()
        p.join()
        for r in results:
            r.get()  # re-raise any exception that occurred in a worker
    finally:
        remove(m)
    print("#######全部文件采集完成########")


if __name__ == "__main__":
    main()
以上這篇Python 實現域名解析為ip的方法就是小編分享給大家的全部內容了,希望能給大家一個參考,也希望大家多多支持服務器之家。
原文鏈接:https://blog.csdn.net/qq1124794084/article/details/80534678