Python查询工信部网站备案信息

 6119

Python查询工信部网站备案信息,通过 https://beian.miit.gov.cn/ 查询信息,确保与管局实际信息一致;

支持自动完成图片拖动验证,存在极低的失败率;支持循环翻页查询,获取企业名下的所有备案信息;查询完毕后按任意键继续查询;非常方便,哈哈~~


看代码:

  1. # -*- coding: utf-8 -*-
  2. import requests,hashlib,time,base64,cv2,os
  3. while True:
  4.     #提前获取要查询的对象信息,以免Token失效(Token有效时间为3分钟)
  5.     print("项目地址:https://github.com/wongzeon/ICP-Checker\n")
  6.     print("版本:V1.1 可用测试:2021-7-27\n")
  7.     print("以企业名称查询的,需要输入企业全称\n")
  8.     print("以域名查询的,请不要输入“http/www”等域名外的字符\n")
  9.     info = input("请输入要查询的备案信息,可以为公司名或域名:")
  10.     info_data = {
  11.         'pageNum':'',
  12.         'pageSize':'',
  13.         'unitName':info
  14.     }
  15.     #构造AuthKey
  16.     timeStamp = int(round(time.time()*1000))
  17.     authSecret = 'testtest' + str(timeStamp)
  18.     authKey = hashlib.md5(authSecret.encode(encoding='UTF-8')).hexdigest()
  19.     #获取Cookie
  20.     cookie_headers = {
  21.     'accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9',
  22.     'accept-encoding': 'gzip, deflate, br',
  23.     'accept-language': 'zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6',
  24.     'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.72 Safari/537.36 Edg/90.0.818.42'
  25.     }
  26.     cookie = requests.utils.dict_from_cookiejar(requests.get('https://beian.miit.gov.cn/',headers=cookie_headers).cookies)['__jsluid_s']
  27.     #请求获取Token
  28.     t_url = 'https://hlwicpfwc.miit.gov.cn/icpproject_query/api/auth'
  29.     t_headers = {
  30.         'Host': 'hlwicpfwc.miit.gov.cn',
  31.         'Connection': 'keep-alive',
  32.         'sec-ch-ua': '" Not A;Brand";v="99", "Chromium";v="90", "Microsoft Edge";v="90"',
  33.         'Accept': '*/*',
  34.         'DNT': '1',
  35.         'sec-ch-ua-mobile': '?0',
  36.         'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.85 Safari/537.36 Edg/90.0.818.46',
  37.         'Origin': 'https://beian.miit.gov.cn',
  38.         'Sec-Fetch-Site': 'same-site',
  39.         'Sec-Fetch-Mode': 'cors',
  40.         'Sec-Fetch-Dest': 'empty',
  41.         'Referer': 'https://beian.miit.gov.cn/',
  42.         'Accept-Encoding': 'gzip, deflate, br',
  43.         'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6',
  44.         'Cookie': '__jsluid_s=' + cookie
  45.     }
  46.     data = {
  47.         'authKey': authKey,
  48.         'timeStamp': timeStamp
  49.     }
  50.     t_response = requests.post(t_url,data=data,headers=t_headers)
  51.     try:
  52.         get_token = t_response.json()['params']['bussiness']
  53.     except:
  54.         print('\n'"请求被禁止,请稍后或更换头部与IP后再试,状态码:",t_response.status_code)
  55.         break
  56.     #获取验证图像、UUID
  57.     p_url = 'https://hlwicpfwc.miit.gov.cn/icpproject_query/api/image/getCheckImage'
  58.     p_headers = {
  59.         'Host': 'hlwicpfwc.miit.gov.cn',
  60.         'Connection': 'keep-alive',
  61.         'Content-Length': '0',
  62.         'sec-ch-ua': '" Not A;Brand";v="99", "Chromium";v="90", "Microsoft Edge";v="90"',
  63.         'Accept': 'application/json, text/plain, */*',
  64.         'DNT': '1',
  65.         'sec-ch-ua-mobile': '?0',
  66.         'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.85 Safari/537.36 Edg/90.0.818.46',
  67.         'token': get_token,
  68.         'Origin': 'https://beian.miit.gov.cn',
  69.         'Sec-Fetch-Site': 'same-site',
  70.         'Sec-Fetch-Mode': 'cors',
  71.         'Sec-Fetch-Dest': 'empty',
  72.         'Referer': 'https://beian.miit.gov.cn/',
  73.         'Accept-Encoding': 'gzip, deflate, br',
  74.         'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6',
  75.         'Cookie': '__jsluid_s=' + cookie
  76.     }
  77.     p_request = requests.post(p_url,data='',headers=p_headers)
  78.     try:
  79.         p_uuid = p_request.json()['params']['uuid']
  80.         big_image = p_request.json()['params']['bigImage']
  81.         small_image = p_request.json()['params']['smallImage']
  82.     except KeyError:
  83.         print("请重试,请求状态码:",p_request.status_code)
  84.     #解码图片,写入并计算图片缺口位置
  85.     with open('bigImage.jpg','wb') as f:
  86.         f.write(base64.b64decode(big_image))
  87.         f.close()
  88.     with open('smallImage.jpg','wb') as f:
  89.         f.write(base64.b64decode(small_image))
  90.         f.close()
  91.     background_image = cv2.imread('bigImage.jpg',cv2.COLOR_GRAY2RGB)
  92.     fill_image = cv2.imread('smallImage.jpg',cv2.COLOR_GRAY2RGB)
  93.     background_image_canny = cv2.Canny(background_image, 100, 200)
  94.     fill_image_canny = cv2.Canny(fill_image, 100, 300)
  95.     position_match = cv2.matchTemplate(background_image, fill_image, cv2.TM_CCOEFF_NORMED)
  96.     min_val,max_val,min_loc,max_loc = cv2.minMaxLoc(position_match)
  97.     position = max_loc
  98.     mouse_length = position[0]+1
  99.     os.remove('bigImage.jpg')
  100.     os.remove('smallImage.jpg')
  101.     #通过拼图验证,获取sign
  102.     check_url = 'https://hlwicpfwc.miit.gov.cn/icpproject_query/api/image/checkImage'
  103.     check_headers = {
  104.         'Host': 'hlwicpfwc.miit.gov.cn',
  105.         'Accept': 'application/json, text/plain, */*',
  106.         'Connection': 'keep-alive',
  107.         'Content-Length': '60',
  108.         'sec-ch-ua': '" Not A;Brand";v="99", "Chromium";v="90", "Microsoft Edge";v="90"',
  109.         'DNT': '1',
  110.         'sec-ch-ua-mobile': '?0',
  111.         'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.72 Safari/537.36 Edg/90.0.818.42',
  112.         'token': get_token,
  113.         'Content-Type': 'application/json',
  114.         'Origin': 'https://beian.miit.gov.cn',
  115.         'Sec-Fetch-Site': 'same-site',
  116.         'Sec-Fetch-Mode': 'cors',
  117.         'Sec-Fetch-Dest': 'empty',
  118.         'Referer': 'https://beian.miit.gov.cn/',
  119.         'Accept-Encoding': 'gzip, deflate, br',
  120.         'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6',
  121.         'Cookie': '__jsluid_s=' + cookie
  122.     }
  123.     check_data = {
  124.         'key':p_uuid,
  125.         'value':mouse_length
  126.     }
  127.     check_request = requests.post(check_url,json=check_data,headers=check_headers)
  128.     try:
  129.         sign = check_request.json()['params']
  130.     except Exception:
  131.         print('\n'"请求被禁止,请稍后或更换头部与IP后再试,状态码:",check_request.status_code)
  132.         break
  133.     #获取备案信息
  134.     info_url = 'https://hlwicpfwc.miit.gov.cn/icpproject_query/api/icpAbbreviateInfo/queryByCondition'
  135.     info_headers = {
  136.         'Host': 'hlwicpfwc.miit.gov.cn',
  137.         'Connection': 'keep-alive',
  138.         'Content-Length': '78',
  139.         'sec-ch-ua': '" Not A;Brand";v="99", "Chromium";v="90", "Microsoft Edge";v="90"',
  140.         'DNT': '1',
  141.         'sec-ch-ua-mobile': '?0',
  142.         'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.72 Safari/537.36 Edg/90.0.818.42',
  143.         'Content-Type': 'application/json',
  144.         'Accept': 'application/json, text/plain, */*',
  145.         'uuid': p_uuid,
  146.         'token': get_token,
  147.         'sign': sign,
  148.         'Origin': 'https://beian.miit.gov.cn',
  149.         'Sec-Fetch-Site': 'same-site',
  150.         'Sec-Fetch-Mode': 'cors',
  151.         'Sec-Fetch-Dest': 'empty',
  152.         'Referer': 'https://beian.miit.gov.cn/',
  153.         'Accept-Encoding': 'gzip, deflate, br',
  154.         'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6',
  155.         'Cookie': '__jsluid_s=' + cookie
  156.     }
  157.     info_request = requests.post(info_url,json=info_data,headers=info_headers)
  158.     domain_total = info_request.json()['params']['total']
  159.     page_total = info_request.json()['params']['lastPage']
  160.     page_size = info_request.json()['params']['pageSize']
  161.     start_row = info_request.json()['params']['startRow']
  162.     end_row = info_request.json()['params']['endRow']
  163.     os.system('cls')
  164.     print("\n查询对象",info,"共有",domain_total,"个备案域名",'\n')
  165.     print("域名具体信息如下:")
  166.     for i in range(1,page_total+1):
  167.         for k in range(start_row,end_row+1):
  168.             info_base = info_request.json()['params']['list'][k]
  169.             domain_name = info_base['domain']
  170.             domain_type = info_base['natureName']
  171.             domain_licence = info_base['mainLicence']
  172.             domain_web_licence = info_base['serviceLicence']
  173.             domain_site_name = info_base['serviceName']
  174.             domain_status = info_base['limitAccess']
  175.             domain_approve_date = info_base['updateRecordTime']
  176.             domain_owner = info_base['unitName']
  177.             try:
  178.                 domain_content_approved = info_base['contentTypeName']
  179.                 if not bool(domain_content_approved):
  180.                     domain_content_approved = "无"
  181.             except KeyError:
  182.                 domain_content_approved = "无"
  183.             print("\n域名主办方:",domain_owner,'\n')
  184.             print("域名:",domain_name,'\n')
  185.             print("网站名称:",domain_site_name,'\n')
  186.             print("备案许可证号:",domain_licence,'\n')
  187.             print("网站备案号:",domain_web_licence,'\n')
  188.             print("域名类型:",domain_type,'\n')
  189.             print("网站前置审批项:",domain_content_approved,'\n')
  190.             print("是否限制接入:",domain_status,'\n')
  191.             print("审核通过日期:",domain_approve_date,'\n')
  192.         info_data_page = {
  193.             'pageNum':i+1,
  194.             'pageSize':'10',
  195.             'unitName':info
  196.         }
  197.         if info_data_page['pageNum'] > page_total:
  198.             print("查询完毕",'\n')
  199.             break
  200.         else:
  201.             info_request = requests.post(info_url,json=info_data_page,headers=info_headers)
  202.             start_row = info_request.json()['params']['startRow']
  203.             end_row = info_request.json()['params']['endRow']
  204.             time.sleep(3)
  205.     os.system('pause')


本文网址:https://www.zztuku.com/detail-9814.html
站长图库 - Python查询工信部网站备案信息
申明:如有侵犯,请 联系我们 删除。

评论(0)条

您还没有登录,请 登录 后发表评论!

提示:请勿发布广告垃圾评论,否则封号处理!!

    编辑推荐