1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67
| import requests from lxml import etree
# Interactive lookup script for https://www.beianx.cn/search/.
#
# Mode "1": the user enters a website domain; the script prints the link text
#           found in the 2nd column of the result table (presumably the
#           registrant/company name -- verify against the live page).
# Mode "2": the user enters a company name; the script collects the link text
#           found in the 6th column of every result row (presumably the
#           registered site hosts) and prints them in one of three formats.


def _strip_first_label(host):
    """Return *host* with its left-most dot-separated label removed.

    ``"www.example.com"`` becomes ``"example.com"``. A value without any dot
    becomes the empty string, and a bare registrable domain such as
    ``"example.com"`` becomes ``"com"`` -- the same result the original
    split/del/join sequence produced.
    """
    return host.partition(".")[2]


method = input("不知道公司名字选1输入官网,知道公司名字选2输入名字")
url = "https://www.beianx.cn/search/"
handers = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/97.0.4692.99 Safari/537.36 Edg/97.0.1072.69'}

if method == "1":
    website = input("请输入公司的官网的域名,不要子域名不要根域名,直接域名即可可")
    # Fix: the User-Agent dict above was built but never attached to the
    # request, so the default python-requests agent was being sent instead.
    res = requests.get(f"{url}{website}", headers=handers)
    tree = etree.HTML(res.text)
    result = tree.xpath("/html/body/div[2]/table/tbody/tr/td[2]/a/text()")
    print(str(result))
elif method == "2":
    company = input("请输入公司的名字")
    print("加载中...")
    res = requests.get(f"{url}{company}", headers=handers)
    tree = etree.HTML(res.text)

    # Walk the table one row at a time (XPath positions are 1-based) and stop
    # at the first row that yields no link text in column 6.
    result_list = []
    index = 1
    while True:
        try:
            result = tree.xpath(
                f"/html/body/div[2]/table/tbody/tr[{index}]/td[6]/div/a/text()")
        except Exception:
            # Still best-effort (keep whatever was collected so far), but no
            # longer a bare ``except`` that would also swallow Ctrl-C.
            print("出错了")
            break
        if not result:
            break
        result_list += result
        index += 1

    mod = input("请选择:1.直接获取所有的url 2.获取所有非子域名 3.根据hunter domain语法来输出所有的痱子域名")
    if mod == "1":
        # Every collected value, one per line.
        print('\n'.join(result_list))
    elif mod == "2":
        # Each value with its first label dropped, one per line.
        print('\n'.join([_strip_first_label(item) for item in result_list]))
    elif mod == "3":
        # Same stripped values, rendered as domain="..." terms joined by "||".
        stripped = [_strip_first_label(item) for item in result_list]
        print('||'.join([f'domain="{item}"' for item in stripped]))
    else:
        print("都说了不要乱输东西了,你看是不是又要重新来了嘛")
else:
    print("给你说了输什么还要乱输是吧?")
|