首页 编程教程正文

【Python爬虫原创代码】利用python爬取全国各地天气预报

piaodoo 编程教程 2020-02-22 22:07:31 1007 0 python教程

本文来源吾爱破解论坛

本帖最后由 袅袅系秋风 于 2019-3-23 18:20 编辑

最近在学习python爬虫,写了这个程序练手,有谁想参考的可以看一下,大家共同学习。



程序利用的是python的requests模块以及re模块


主要通过requests.get()获取网页代码保存到response中,然后通过正则从html代码中提取自己想要的数据。


最后将这些数据封装为图形化界面


程序运行截图如下:

1.png (185.57 KB, 下载次数: 3)

下载附件  保存到相册

2019-3-22 21:20 上传


(tip: 也可以通过字符查询,默认显示查询的第一个,如果想要显示准确的地方天气建议填完整城市名或完整城市拼音)




下面是代码:



[Python] 纯文本查看 复制代码
from tkinter import *
import tkinter as tk
import requests
from PIL import ImageTk as itk


class MyFrame(Frame):
    def __init__(self):
        self.root=Tk()

        self.root.title("天气查询")
        self.root.geometry('1200x700+400+220')

        bg = tk.Canvas(self.root, width=1200, height=600, bg='white')
        self.img = itk.PhotoImage(file="bg.gif")
        bg.place(x=100, y=40)
        bg.create_image(0, 0, anchor=NW, image=self.img)

        self.city = Entry(self.root, width=16, font=("仿宋", 18, "normal"))
        self.city.place(x=200, y=60)

        citylabel=Label(self.root,text='查询城市',font=("仿宋", 18, "normal"))
        citylabel.place(x=80,y=60)

        [i]#查询按钮
[/i][i]        [/i]chaxun = Button(self.root, width=10, height=3, text="查询", bg='#00CCFF', bd=5, font="bold")
        chaxun.bind("<Button-1>", self.search)
        chaxun.place(x=800, y=50)

        self.result=Listbox(self.root,heigh=18,width=65,font=("仿宋", 20, "normal"))[i]#显示天气框
[/i][i]        [/i]self.result.place(x=125,y=120)

    def tianqiforecast(self,searchcity):
        print('请输入所要查询天气的城市:')
        city = searchcity
        [i]# city='minquan'
[/i][i]        [/i]url = 'http://toy1.weather.com.cn/search?cityname=' + city + '&callback=success_jsonpCallback&_=1548048506469'
[i]# print(url)
[/i][i]        [/i]headers = {
            'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/71.0.3578.98 Safari/537.36',
            'Cookie': '__guid=182823328.3322839646442213000.1543932524694.901; vjuids=1858d43b6.167798cbdb7.0.8c4d7463d5c5d; vjlast=1543932526.1543932526.30; userNewsPort0=1; f_city=%E5%B9%B3%E9%A1%B6%E5%B1%B1%7C101180501%7C; Hm_lvt_080dabacb001ad3dc8b9b9049b36d43b=1543932526,1543932551,1543932579; Wa_lvt_1=1547464114,1547464115,1547880054,1547983123; defaultCty=101181001; defaultCtyName=%u5546%u4E18; monitor_count=6; Wa_lpvt_1=1547983809'
}
        response = requests.get(url, headers=headers)
        html1 = response.content.decode('utf-8')
        [i]# print(html)
[/i][i]
[/i][i]        [/i]citys = re.findall('"ref":"(.*?)~.*?~(.*?)~.*?~(.*?)~.*?~.*?~.*?~.*?~(.*?)"', html1, re.S)
        if (len(citys) == 0):
            print('未查找到该城市')
            exit(-5)
        for i in range(0, len(citys)):
            print(i + 1, ':%14s%14s%14s%14s ' % (citys[i][0], citys[i][3], citys[i][2], citys[i][1]))
        [i]#choose = int(input('请选择城市编号:[1~' + str(len(citys)) + ']\n'))
[/i][i]        [/i]choose=1
        if (len(citys[choose - 1][0]) == 9):
            if (citys[choose - 1][0][0] != '1' or citys[choose - 1][0][1] != '0' or citys[choose - 1][0][2] != '1'):
                print('暂时无法查询国外天气,程序已退出')
                exit(404)
            else:
                url2 = 'http://www.weather.com.cn/weathern/' + citys[choose - 1][0] + '.shtml'
responseweather = requests.get(url2, headers=headers)
            html2 = responseweather.content.decode('utf-8')

            weather = re.findall('<li class="date-.*?".*?".*?">(.*?)</.*?"date-i.*?">(.*?)<.*?', html2, re.S)
            weather.append(re.findall(
                '<p class="weather-in.*?" title="(.*?)".*?title="(.*?)".*?title="(.*?)".*?<p class="wind-i.*?">(.*?)</p>',
                html2, re.S))
            Hightempture = re.findall(
                '<script>var eventDay =\["(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)"\];', html2,
                re.S)
            Lowtempture = re.findall(
                'var eventNight =\["(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)"\];',
                html2, re.S)
            [i]# print(Hightempture,Lowtempture)
[/i][i]            [/i]b='查询城市为:'+ str(citys[choose - 1][3])+'    '+str(citys[choose - 1][1])
            self.result.insert(END, b)
            for i in range(0, 8):
                [i]# print(weather[i])
[/i][i]                [/i]'''print("%4s%4s%10s\t\t\t%s℃ ~ %s℃\t\t\t%s%s%-s" % (
                    weather[i][0], weather[i][1], weather[8][i][0], Lowtempture[0][i], Hightempture[0][i],
                    weather[8][i][1],
                    weather[8][i][3], weather[8][i][2]))'''
a = weather[i][0] + '    ' + weather[i][1] + '    ' + weather[8][i][0] + '    ' + Lowtempture[0][i] + '℃  ~  ' + \
                    Hightempture[0][i] + '℃   ' + weather[8][i][1]  + weather[8][i][3]+ weather[8][i][2]
                self.result.insert(END, a)

        if (len(citys[choose - 1][0]) == 12):
            url2 = 'http://forecast.weather.com.cn/town/weathern/' + citys[choose - 1][0] + '.shtml'
responseweather = requests.get(url2, headers=headers)
            html2 = responseweather.content.decode('utf-8')

            weather = re.findall('<li class="date-.*?".*?"da.*?">(.*?)</.*?"date-i.*?">(.*?)<.*?', html2, re.S)

            html2 = re.sub('lt;', '<', html2)
            weather.append(re.findall(
                '<p class="weather-in.*?" title="(.*?)".*?title="(.*?)".*?title="(.*?)".*?<p class="wind-i.*?">\\r\\n(.*?)\\r\\n',
                html2, re.S))

            Hightempture = re.findall(
                'var eventDay = \["(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)"\];', html2, re.S)

            Lowtempture = re.findall(
                'var eventNight = \["(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)","(.*?)"\];',
                html2, re.S)
            [i]# print(Hightempture,Lowtempture)
[/i][i]            [/i]b='查询城市为:'+str(citys[choose - 1][3])+'   '+str( citys[choose - 1][2])+ '    ' +str(citys[choose - 1][1])
            self.result.insert(0,b)
            [i]#print(weather[8][2])
[/i][i]            #print(weather)
[/i][i]            [/i]for i in range(0, 8):
                [i]# print(weather[i])
[/i][i]                [/i]'''print("%4s%4s%10s\t\t\t%s℃ ~ %s℃\t\t\t%s%s%-s" % (
                    weather[i][0], weather[i][1], weather[8][i][0], Lowtempture[0][i], Hightempture[0][i],
                    weather[8][i][1],
                    weather[8][i][3], weather[8][i][2]))'''
a = weather[i][0] + '    ' + weather[i][1] + '    ' + weather[8][i][0] + '    ' + Lowtempture[0][i] + '℃  ~  ' + \
                    Hightempture[0][i] + '℃   ' + weather[8][i][1]  + weather[8][i][3]+ weather[8][i][2]
                self.result.insert(END, a)
    def search(self,event):
        mycity=self.city.get()
        if(mycity!=''):
            self.result.delete(0,END)
            self.city.delete(0,END)
            self.tianqiforecast(mycity)

if __name__=='__main__':
    myframe=MyFrame()
    myframe.root.mainloop()


想下载的也可以在这里下载源代码
嗨学网

天气预报带ui界面.rar

2019-3-22 21:27 上传

点击文件名下载附件

下载积分: 吾爱币 -1 CB

2.12 KB, 下载次数: 144, 下载积分: 吾爱币 -1 CB

本帖被以下淘专辑推荐: · 爬虫专栏|主题: 38, 订阅: 39

版权声明:

本站所有资源均为站长或网友整理自互联网或站长购买自互联网,站长无法分辨资源版权出自何处,所以不承担任何版权以及其他问题带来的法律责任,如有侵权或者其他问题请联系站长删除!站长QQ754403226 谢谢。

有关影视版权:本站只供百度云网盘资源,版权均属于影片公司所有,请在下载后24小时删除,切勿用于商业用途。本站所有资源信息均从互联网搜索而来,本站不对显示的内容承担责任,如您认为本站页面信息侵犯了您的权益,请附上版权证明邮件告知【754403226@qq.com】,在收到邮件后72小时内删除。本文链接:https://www.piaodoo.com/7612.html

搜索