思路:
一、根據city.txt文檔來獲取不一樣城市code
二、獲取中國天氣網7d和15d不一樣城市url
三、利用requests庫請求url獲取html內容
四、利用beautifulsoup獲取7d和15d指定天氣數據
五、將獲取的天氣數據保存到csv文件中html
# -*- coding: utf-8 -*- import requests from bs4 import BeautifulSoup import csv ''' 獲取不一樣城市code ''' def get_citycode(city_name): with open('city.txt', 'r', encoding='UTF-8') as fs: lines = fs.readlines()#一次讀取整個文件內容,且自動分紅一行列表,readline()每次只讀取一行 for line in lines: if(city_name in line): code = line.split('=')[0].strip()#每行去掉頭尾空格,且用「=」分隔出code和cityname,返回字符串列表 return code raise ValueError('invalid city name')#拋出異常 ''' 獲取不一樣城市7天url ''' def get_7d_url(city_name): url = 'http://www.weather.com.cn/weather/' code = get_citycode(city_name) return url + code + '.shtml' ''' 獲取不一樣城市15天url ''' def get_15d_url(city_name): url = 'http://www.weather.com.cn/weather15d/' code = get_citycode(city_name) return url + code + '.shtml' '''' 獲取html內容 ''' def get_content(url, data=None): rep = requests.get(url, timeout=60) rep.encoding = 'utf-8' return rep.text ''' 獲取7天指定數據 ''' def get_7d_data(htmltext, city): content = [] bs = BeautifulSoup(htmltext, "html.parser") body = bs.body data = body.find('div', {'id': '7d'}) ul = data.find('ul') li = ul.find_all('li') for day in li: line = [city] date = day.find('h1').string p = day.find_all('p') text = p[0].string if p[1].find('span') is None: temperature_H = None else: temperature_H = p[1].find('span').string temperature_L = p[1].find('i').string wind_force = p[2].find('i').string line.append(date) line.append(text) line.append(temperature_H) line.append(temperature_L) line.append(wind_force) content.append(line) return content ''' 獲取15天指定數據 ''' def get_15d_data(htmltext, city): content = [] bs = BeautifulSoup(htmltext, "html.parser") body = bs.body data = body.find('div', {'id': '15d'}) ul = data.find('ul') li = ul.find_all('li') for day in li: line = [city] span = day.find_all('span') date = span[0].string text = span[1].string if span[2].find('em') is None: temperature_H = None else: temperature_H = span[2].find('em').string temperature_L = span[2].string wind_direction = span[3].string wind_force = span[4].string line.append(date) line.append(text) line.append(temperature_H) line.append(temperature_L) line.append(wind_direction) line.append(wind_force) content.append(line) return content ''' 保存獲取到的天氣數據 csv文件 ''' def save_data(data, filename): with open(filename, 'a', errors='ignore', newline='') as f: #newline=" "是爲了不寫入以後有空行 f_csv = csv.writer(f) f_csv.writerows(data)#數據整行寫入csv文件中 ''' 爬取7每天氣數據 ''' def _7d(city): url = get_7d_url(city) html = get_content(url) result = get_7d_data(html,city) save_data(result, 'E:\weather.csv') ''' 爬取15每天氣數據 ''' def _15d(city): url = get_15d_url(city) html = get_content(url) result = get_15d_data(html,city) save_data(result, 'E:\weather.csv') if __name__ == '__main__': cities = input('city name: ').split(' ') # 鍵盤輸入城市,用空格分隔開 for city in cities: _7d(city) _15d(city)
附:city.txt 獲取地址:https://pan.baidu.com/s/1VNW8AJi6_zo7mP_90lTkiA 提取碼:red5 python