-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathMain.py
More file actions
60 lines (50 loc) · 2.15 KB
/
Main.py
File metadata and controls
60 lines (50 loc) · 2.15 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
from Audit import *
import threading
from queue import Queue
from CrawlerBot.main import create_workers
from CrawlerBot.main import crawl
from CrawlerBot.main import *
from CrawlerBot.domain import *
from CrawlerBot.general import *
from CrawlerBot.linkfinder import *
from CrawlerBot import spider
from general2 import *
from Scrap_Webpage import scrape
from multiprocessing import Pool
import time
def load_and_write_workbook(workbook_name, name_of_audit_sheet, result):
Newbook = load_workbook(workbook_name + ".xlsx")
Newbook.create_sheet(name_of_audit_sheet)
worksheet = Newbook[name_of_audit_sheet]
if any(isinstance(el, list) for el in result):
result_in = [item for sublist in result for item in sublist]
else:
result_in = result
m = len(result_in)
for i in range(1, m + 1):
worksheet.cell(row=i, column=1, value=(result_in[i - 1]))
Newbook.save(filename=PROJECT_NAME + '.xlsx')
create_workers()
crawl()
time.sleep(6)
print("Auditing")
scrapped_data = get_scrapped_data(PROJECT_NAME + '\crawled.txt')
duplicate_titles = scrapped_data.duplicate_titles()
duplicate_descriptions = scrapped_data.duplicate_meta_descriptions()
missing_descriptions = scrapped_data.get_missing_descriptions()
missing_titles = scrapped_data.get_missing_titles()
missing_h1 = scrapped_data.get_missing_h1()
duplicate_h1 = scrapped_data.get_duplicate_h1()
missing_canonicals = scrapped_data.get_missing_canonicals()
wrong_canonicals = scrapped_data.improper_canonicals()
missing_viewports = scrapped_data.missing_viewports()
low_titles = scrapped_data.get_titles_with_less_content()
low_meta = scrapped_data.get_meta_des_with_less_content()
print("Preparing Results")
create_workbook(PROJECT_NAME)
load_and_write_workbook(PROJECT_NAME, 'DuplicateTitles', duplicate_titles)
load_and_write_workbook(PROJECT_NAME, 'DuplicateMetaDescriptions', duplicate_descriptions)
load_and_write_workbook(PROJECT_NAME, 'missingDescriptions', missing_descriptions)
load_and_write_workbook(PROJECT_NAME, 'Thin Meta', low_meta)
load_and_write_workbook(PROJECT_NAME, 'thin titles', low_titles)
load_and_write_workbook(PROJECT_NAME, 'Missing Viewports', missing_viewports)