使用场景
对手机号码进行地域分析,需要查询归属地;
问题描述
针对数据集比较大的情况,通过脚本来处理,使用多进程(multiprocessing 进程池)的方法来加快查询速度:
# Fan the chunks out to a pool of worker processes: one async task per chunk.
pool = multiprocessing.Pool(processes=pool_count)
for chunk in data_cut(data, pool_count):
    pending = pool.apply_async(main, (chunk,))
    # Keep the AsyncResult handle so the results can be collected later.
    data_log_list.append(pending)
# No more tasks will be submitted; block until every worker has finished.
pool.close()
pool.join()
解决方案
创建一个 pool 进程池,设置好 pool_count(进程数量),然后通过 data_cut 将已读取的数据大致等分成若干数据组;每个数据组由一个进程独立查询,最后将各组结果汇总交给 push_log 进行最终处理,保存为 csv 文件。
# 电话号码归属地查询
import os
import sys
import time
import json
import warnings
import pandas as pd
import multiprocessing
from phone import Phone
# Suppress every warning category for the whole run of this script.
warnings.filterwarnings(action="ignore")
# Absolute path of the current working directory; the input file is read
# from here and the result CSV is written here.
path = os.path.abspath(os.curdir)
def data_cut(data_list, data_cut=4):
    """Split ``data_list`` into consecutive, near-equal chunks.

    The chunks preserve the original order and together contain every
    element exactly once. Chunk sizes differ by at most one, so parallel
    workers receive a balanced share of the work.

    Args:
        data_list: Sliceable sequence of items to distribute.
        data_cut: Desired number of chunks (the CPU core count is a sensible
            choice; defaults to 4). When it exceeds ``len(data_list)`` it is
            reduced so that no chunk is empty.

    Returns:
        A list of slices of ``data_list``; an empty list when ``data_list``
        is empty.

    Raises:
        ValueError: If ``data_cut`` is smaller than 1.
    """
    if data_cut < 1:
        raise ValueError("data_cut must be a positive integer")

    total = len(data_list)
    if total == 0:
        # Nothing to distribute; avoids dividing by a zero chunk count.
        return []

    chunk_count = min(data_cut, total)
    # The first `remainder` chunks take one extra item each, so the leftover
    # is spread out instead of being piled onto the last chunk.
    base_size, remainder = divmod(total, chunk_count)

    chunks = []
    start = 0
    for index in range(chunk_count):
        stop = start + base_size + (1 if index < remainder else 0)
        chunks.append(data_list[start:stop])
        start = stop
    return chunks
def push_log(data_log_list, file_name):
    """Collect the workers' results and save them as one CSV file.

    Args:
        data_log_list: Handles whose ``get()`` returns an iterable of result
            rows (the ``AsyncResult`` objects produced by the process pool).
        file_name: Name embedded in the output file, which is written to
            ``<path>/phone_<file_name>.csv`` with GBK encoding.
    """
    # Wait for every task first, then flatten the per-task row lists.
    finished = [task.get() for task in data_log_list]
    rows = [row for batch in finished for row in batch]

    frame = pd.DataFrame(rows)
    target = path + "/phone_{}.csv".format(file_name)
    frame.to_csv(target, index=False, encoding='gbk')
    print('成功查询:', frame.shape[0])
def main(data):
    """Look up the attribution record for every phone number in ``data``.

    Runs inside a worker process. Numbers for which the lookup raises, or for
    which it returns something other than a dict, are skipped, so one bad
    entry does not abort the whole chunk.

    Args:
        data: Iterable of phone numbers.

    Returns:
        A list of the dict records returned by ``Phone.find``, in input order.
    """
    # One lookup object serves the whole chunk instead of two new ones per
    # number. NOTE(review): a failure while constructing Phone() now
    # propagates rather than silently producing an empty result; the
    # constructor presumably loads the lookup database - confirm against
    # the `phone` package.
    finder = Phone()
    resp = []
    for number in data:
        try:
            record = finder.find(number)
        except Exception:
            # Best-effort: skip numbers the library rejects, but let
            # KeyboardInterrupt / SystemExit through.
            continue
        if isinstance(record, dict):
            resp.append(record)
    return resp
if __name__ == '__main__':
    # Batch entry point: read one phone number per line from the file named
    # on the command line (relative to the working directory), look the
    # numbers up in parallel, and write the merged result as a CSV file.
    if len(sys.argv) < 2:
        # Exit with a usage hint instead of an IndexError traceback.
        sys.exit('用法: python {} <号码文件名>'.format(sys.argv[0]))

    start_time = time.time()
    file_name = sys.argv[1]
    data = pd.read_table(path + "/{}".format(file_name), header=None)
    # Only the first column holds the phone numbers.
    data = list(data[0])

    pool_count = 12
    data_log_list = []
    pool = multiprocessing.Pool(processes=pool_count)
    try:
        for i in data_cut(data, pool_count):
            data_log_list.append(pool.apply_async(main, (i,)))
    finally:
        # Always shut the pool down, even if submitting a task failed.
        pool.close()
        pool.join()

    push_log(data_log_list, file_name)
    # Elapsed wall-clock time in seconds.
    print(time.time() - start_time)
方法补充
除了上文的方法,小编还为大家整理了一些其他Python号码归属地查询的方法,需要的可以参考一下
方法一:
import requests
def get_callerloc(phone):
    """Query the qvdv.com web API for a phone number's attribution.

    Args:
        phone: The phone number to look up.

    Returns:
        The value stored under ``"message"`` in the JSON response.

    Raises:
        requests.RequestException: On connection failure, timeout, or an
            HTTP error status.
        KeyError: If the response JSON has no ``"message"`` entry.
    """
    url = "https://www.qvdv.com/tools/qvdv-api-mobile.html"
    headers = {
        'user-agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.75 Safari/537.36',
    }
    # Passing the query through `params` URL-encodes the user-supplied
    # number; the timeout keeps an unresponsive server from hanging the call.
    response = requests.get(
        url,
        params={"f": "json", "mobile": phone},
        headers=headers,
        timeout=10,
    )
    # Report HTTP errors as such instead of as a JSON decoding failure.
    response.raise_for_status()
    return response.json()["message"]
if __name__ == '__main__':
    # Interactive entry point: ask for a number, look it up, and print the
    # number, its province, and its carrier, one labelled line each.
    phone = input("请输入手机号(查询归属地):")
    res = get_callerloc(phone)
    for label, key in (
        ("手机号码:", "mobile"),
        ("归属地:", "province"),
        ("运营商:", "supplier"),
    ):
        print(label + res[key])
截图
方法二
GUI
from tkinter import *
from tkinter import ttk
from tkinter import messagebox
from Get_Attr import Get_Infos
import re
import threading
class App:
    """Tkinter window for looking up a mobile number's attribution.

    The window has an input row (label, entry, search button) and a result
    frame with six label/entry pairs: number, province, city, area code,
    zip code and carrier type. Constructing the class builds the window and
    enters the Tk main loop, so ``App()`` only returns after the window is
    closed.
    """

    def __init__(self):
        self.root = Tk()
        self.root.title('手机号码归属地查询-v1.0')
        self.root.resizable(0, 0)
        # Centre the fixed-size window on the screen.
        width = 410
        height = 390
        left = (self.root.winfo_screenwidth() - width) / 2
        top = (self.root.winfo_screenheight() - height) / 2
        self.root.geometry('%dx%d+%d+%d' % (width, height, left, top))
        self.create_widet()
        self.set_widget()
        self.place_widget()
        self.root.mainloop()

    def create_widet(self):
        """Create all widgets and wire the search button to a lookup."""
        self.l1 = ttk.Label(self.root)
        self.e1 = ttk.Entry(self.root)
        self.b1 = ttk.Button(self.root)
        self.lf = ttk.LabelFrame(self.root)
        self.l2 = ttk.Label(self.lf)
        self.e2 = ttk.Entry(self.lf)
        self.l3 = ttk.Label(self.lf)
        self.e3 = ttk.Entry(self.lf)
        self.l4 = ttk.Label(self.lf)
        self.e4 = ttk.Entry(self.lf)
        self.l5 = ttk.Label(self.lf)
        self.e5 = ttk.Entry(self.lf)
        self.l6 = ttk.Label(self.lf)
        self.e6 = ttk.Entry(self.lf)
        self.l7 = ttk.Label(self.lf)
        self.e7 = ttk.Entry(self.lf)
        self.b1.config(command=lambda: self.thread_it(self.search_infos))

    def set_widget(self):
        """Set widget texts, bind result variables and keyboard shortcuts."""
        self.e2_var = StringVar()
        self.e3_var = StringVar()
        self.e4_var = StringVar()
        self.e5_var = StringVar()
        self.e6_var = StringVar()
        self.e7_var = StringVar()
        self.l1.config(text='请输入手机号:')
        self.b1.config(text='查询')
        self.lf.config(text='查询结果')
        self.l2.config(text='手机号码:')
        self.l3.config(text='所属省份:')
        self.l4.config(text='所属城市:')
        self.l5.config(text='区 号:')
        self.l6.config(text='邮 编:')
        self.l7.config(text='类 型:')
        # Bind each string variable to its result Entry widget.
        self.e2.config(textvariable=self.e2_var)
        self.e3.config(textvariable=self.e3_var)
        self.e4.config(textvariable=self.e4_var)
        self.e5.config(textvariable=self.e5_var)
        self.e6.config(textvariable=self.e6_var)
        self.e7.config(textvariable=self.e7_var)
        # Escape closes the window; Return starts a lookup.
        self.root.bind('<Escape>', self.escape)
        self.root.bind('<Return>', self.do_search)

    def place_widget(self):
        """Position every widget with absolute coordinates."""
        self.l1.place(x=30, y=20)
        self.e1.place(x=130, y=20)
        self.b1.place(x=290, y=20)
        self.lf.place(x=30, y=60, width=350, height=300)
        self.l2.place(x=60, y=10)
        self.e2.place(x=150, y=10)
        self.l3.place(x=60, y=50)
        self.e3.place(x=150, y=50)
        self.l4.place(x=60, y=90)
        self.e4.place(x=150, y=90)
        self.l5.place(x=60, y=130)
        self.e5.place(x=150, y=130)
        self.l6.place(x=60, y=170)
        self.e6.place(x=150, y=170)
        self.l7.place(x=60, y=210)
        self.e7.place(x=150, y=210)

    def search_infos(self):
        """Validate the entered number, query it, and show the result.

        Shows a warning dialog when the input is not exactly 11 digits or
        when the lookup reports failure.

        NOTE(review): this runs on a worker thread when started through
        ``thread_it`` and touches Tk variables and message boxes from there;
        confirm that is safe on the target Tk build.
        """
        pn = self.e1.get()
        # The input must be exactly 11 digits; fullmatch also rejects
        # longer strings that merely start with 11 digits.
        if not re.fullmatch(r'\d{11}', pn):
            messagebox.showwarning('警告', '输入有误,请检查!')
            return
        result = Get_Infos().get_infos(pn)
        if not result:
            # get_infos returns False on failure; subscripting it would
            # raise TypeError.
            messagebox.showwarning('警告', '查询失败,请稍后重试!')
            return
        self.e2_var.set(pn)
        self.e3_var.set(result['province'])
        self.e4_var.set(result['city'])
        self.e5_var.set(result['areacode'])
        self.e6_var.set(result['zip'])
        self.e7_var.set(result['company'])

    def thread_it(self, func, *args):
        """Run ``func(*args)`` on a daemon thread so the UI stays responsive."""
        t = threading.Thread(target=func, args=args, daemon=True)
        t.start()

    def escape(self, event):
        """Close the window (handler for the Escape key)."""
        self.root.destroy()

    def do_search(self, event):
        """Start a lookup in the background (handler for the Return key)."""
        # Pass the method itself; calling it here would run the lookup on
        # the UI thread and hand its None result to the worker thread.
        self.thread_it(self.search_infos)
if __name__ == '__main__':
    # Launch the GUI; the constructor enters the Tk main loop and only
    # returns once the window has been closed.
    app = App()
Get_Attr
import json
import requests
from urllib.parse import urlencode
class Get_Infos():
    """Client for the juhe.cn mobile-number attribution API.

    Args:
        key: API key sent with every request. The default is the key that
            was previously hard-coded here.
            NOTE(review): a credential embedded in source code is visible to
            anyone with the file; prefer passing your own key.
        timeout: Seconds to wait for the HTTP request before giving up.
    """

    def __init__(self, key='7a2b367a62fa24108b1f27ed4c84c97a', timeout=10):
        self.url = 'http://apis.juhe.cn/mobile/get?'
        self.headers = {
            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/81.0.4044.138 Safari/537.36'
        }
        self.key = key
        self.timeout = timeout

    def get_infos(self, phone_num):
        """Look up ``phone_num`` and return its attribution details.

        Args:
            phone_num: The phone number to query.

        Returns:
            A dict with the keys ``province``, ``city``, ``areacode``,
            ``zip`` and ``company`` taken from the response's ``result``
            object, or ``False`` when the request fails, the response is
            not valid JSON, ``resultcode`` is not ``'200'``, or ``result``
            is missing.
        """
        params = {
            'phone': phone_num,
            'key': self.key,
            'dtype': ''
        }
        try:
            r = requests.get(
                self.url + urlencode(params),
                headers=self.headers,
                timeout=self.timeout,
            )
            _json = json.loads(r.text)
        except (requests.RequestException, ValueError):
            # Network errors and undecodable bodies follow the same
            # "return False on failure" contract as an error result code.
            return False

        if not isinstance(_json, dict) or _json.get('resultcode') != '200':
            return False
        result = _json.get('result')
        if not isinstance(result, dict):
            return False

        fields = ('province', 'city', 'areacode', 'zip', 'company')
        return {field: result.get(field) for field in fields}
到此这篇关于Python实现号码归属地查询功能的文章就介绍到这了。更多相关Python号码归属地查询内容,请搜索编程网以前的文章或继续浏览下面的相关文章,希望大家以后多多支持编程网!