-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathMain_all.py
54 lines (43 loc) · 1.06 KB
/
Main_all.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
#from general import *
from queue import Queue
import threading
from spider import Spider
from parsing import *
#Project_name='Anime'
def append_file(data, name):
    """Append every entry of ``data`` to the text file ``<name>.txt``.

    Each entry is written followed by two newline characters, so entries are
    separated by a blank line. The file is opened in append mode: existing
    content is kept.

    Args:
        data: Iterable of strings to write.
        name: Target path without the ``.txt`` suffix.

    Returns:
        None. Any failure is reported on stdout instead of being raised.
    """
    try:
        # The context manager closes the handle even when a write fails
        # part-way through; a plain open()/close() pair would skip close()
        # in that case and leak the handle.
        with open(name + '.txt', 'a') as f:
            f.writelines(entry + '\n\n' for entry in data)
    except Exception:
        # Deliberately best-effort: report the failure and carry on.
        print("file not appended")
def create_w():
    """Launch the background crawler threads.

    Starts ``N`` threads, each running ``work``. Every thread is flagged as a
    daemon before it is started.
    """
    for _ in range(N):
        worker = threading.Thread(target=work, daemon=True)
        worker.start()
def work():
    """Worker loop: take URLs off the shared ``queue`` and crawl them.

    Runs forever. For each URL it prints a short progress message, calls
    ``s.crawl(url)`` and then marks the queue item as done.

    Returns:
        Never returns.
    """
    while True:
        url = queue.get()
        try:
            print("current Page")
            print(url)
            s.crawl(url)
        except Exception as exc:
            # Keep this worker alive: one failing page must not kill the
            # thread, or the remaining queue items may never be consumed.
            print("crawl failed for {}: {}".format(url, exc))
        finally:
            # Always acknowledge the item. Without this, a crawl that raises
            # leaves the queue's unfinished-task count above zero and
            # queue.join() in the producer blocks forever.
            queue.task_done()
def crawl_t():
    """Feed pending links to the workers until none remain.

    Each round puts every link currently in ``Spider.que`` on the shared
    ``queue``, waits until the workers have marked all of them done, and then
    checks ``Spider.que`` again.

    Returns:
        None, once ``Spider.que`` is empty.
    """
    # A loop instead of self-recursion: recursing once per round adds a stack
    # frame per round and can hit the interpreter's recursion limit on a
    # long crawl.
    while len(Spider.que) > 0:
        # Iterate over a snapshot, because workers start consuming as soon as
        # the first link is queued.
        # NOTE(review): presumably s.crawl() mutates Spider.que from the
        # worker threads, which would break a live iteration -- confirm
        # against spider.py.
        for link in list(Spider.que):
            queue.put(link)
        queue.join()
# Script body: read the settings, start the workers, crawl, then save.
# The names N, queue and s defined here are module-level globals read by
# create_w(), work() and crawl_t(), so they must exist before create_w() runs.

# Start URL, read from stdin.
Home =input("Enter a valid URL:\n")
# Output file name without extension; append_file() adds '.txt'.
name =input("Enter a Name of file :\n")
# get_d is not defined in this file; presumably it comes from the star-import
# of `parsing` and extracts the domain of the URL -- TODO confirm.
Domain=get_d(Home)
N=5 ## number of worker threads started by create_w()
# Shared work queue: crawl_t() puts links on it, work() takes them off.
queue = Queue()
# Single Spider instance; every worker thread calls s.crawl() on it.
s=Spider(Home,Home,Domain)
create_w()
# Returns only once Spider.que is empty.
crawl_t()
# Write the entries of Spider.craw to <name>.txt.
append_file(Spider.craw,name)
# Printed unconditionally: append_file() reports its own failures on stdout
# and does not raise.
print("File Saved")