python/shell代碼片斷

查看某模塊路徑

Bash
# Show selenium's package metadata together with the list of files it installed.
pip show -f selenium

文件編碼轉換

Bash
# Recursively convert the file *names* under ydcz_1/ from GBK to UTF-8.
# --notest performs the renames for real; without it convmv only does a dry run.
convmv -r --notest -f GBK -t UTF-8 ydcz_1/

查找當前目錄下,結尾爲.php的文件中,包含字符串「zfb_box」的文件

Bash
# Search every *.php file below the current directory for the string "zfb_box".
# Fix: the opening quote had been mangled into a CJK bracket, leaving the
# string unterminated. -print0 / -0 keep file names containing spaces intact.
find ./ -name "*.php" -print0 | xargs -0 grep "zfb_box"

百度搜索結果URL提取主域名

Bash
# Take column 3 (the URL) of the comma-separated file, keep the scheme+host
# part, isolate the host name, then keep only its trailing ".name.tld" part.
# Fix: the closing double quote of the last pattern had been mangled into a
# CJK bracket, leaving the pattern unterminated.
cat xinxi_jieguo|awk -F"," '{print $3}'|egrep -o 'http://[^/]*?/' |egrep -o '([a-z0-9_-]{1,32}\.)+([a-z0-9_-]{1,32})((\.[a-z]{2,4})(.[a-z]{1,2})?)'|egrep -o "\.[^\.]*?\.(com\.cn|com|cn|net|org|cc|hk|tv|info|de|tw|wang|kr)$"

 

統計每一個域名流量分發

Bash
# For URLs (column 3) on *.1688.com hosts, count occurrences of each
# "http://host/first-path-segment/" prefix, most frequent first.
# Fix: the dot before "com" was unescaped and therefore matched any character.
cat xinxi_jieguo|awk -F"," '{print $3}'|egrep '\.1688\.com'|egrep -o 'http://[^/]*?/[^/]*?/' | sort|uniq -c|sort -nr

201904172109394211332.jpg

 

兩文件按列合併

Bash
# Join 4+.txt and out.txt line by line, separated by one space, into hebing.txt.
paste -d ' ' 4+.txt out.txt >hebing.txt

awk計算重複次數

Bash
# Count how many times each distinct value of column 1 occurs in urldata.
awk '{ count[$1]++ } END { for (key in count) print key, count[key] }' urldata

按列求和

Bash
# Sum column 2 over the lines of "test" that contain "aaa".
# Fix: the closing single quote had been mangled into a typographic quote,
# which left the awk program unterminated.
awk '/aaa/ {sum += $2} END {print sum}' test

按列求和2

Bash
# Sum column 2 of test.txt grouped by the value of column 1.
awk '{ total[$1] += $2 } END { for (key in total) print key, total[key] }' test.txt

按行數將一個文件分割成多個,sitemap使用

Bash
# Cut "file" into pieces of 8142 lines each; output names start with "outfile".
split -l 8142 file outfile

查找目錄下包含某個字符的文件

Bash
# Print every line below the current directory that contains "IBM" (case-insensitive).
# Fix: `find . | xargs grep -r` handed "." itself to a recursive grep and then
# every file again, so matches were reported twice and file names containing
# spaces were split. A recursive grep on "." is sufficient.
grep -ri "IBM" .

python下載圖片

Python
#! /usr/bin/env python
# coding=utf-8
"""Download the images listed in logo_url.txt into the current directory.

Every line of logo_url.txt is comma separated: the second field becomes the
file name stem and the third field is the image URL.
"""
import os

try:
    from urllib import urlretrieve  # Python 2
except ImportError:
    from urllib.request import urlretrieve  # Python 3

filepath = os.getcwd()
if not os.path.exists(filepath):
    os.mkdir(filepath)

x = 1  # ordinal of the image currently being fetched; advances on success only
print(u'爬蟲準備就緒...')
with open('logo_url.txt') as url_file:
    for line in url_file:
        fields = line.strip().split(',')
        if len(fields) < 3:
            # Malformed row: there is no id/URL pair to download.
            continue
        image_id, imgurl = fields[1], fields[2]
        temp = '%s.jpg' % image_id
        print(u'正在下載第%s張圖片' % x)
        print(imgurl)
        try:
            urlretrieve(imgurl, temp)
        except Exception:
            # Best effort: one failed download must not stop the batch.
            continue
        x += 1
print(u'圖片下載完畢,保存路徑爲' + filepath)

MD5生成

Python
import hashlib

# Hex MD5 digest of `src`, which the surrounding code must define.
m2 = hashlib.md5(src)
print(m2.hexdigest())

讀取CSV

Python
# coding: utf-8
"""Print every row of csv_test.csv."""
import csv

# 'rb' is the mode the Python 2 csv module expects; on Python 3 open the file
# with mode 'r' and newline='' instead.
# The with-block closes the file even when reading fails.
with open('csv_test.csv', 'rb') as csvfile:
    for line in csv.reader(csvfile):
        print(line)

寫入CSV

Python
# coding: utf-8
"""Write a header row and two sample records to csv_test.csv."""
import csv

data = [
    ('小河', '25', '1234567'),
    ('小芳', '18', '789456'),
]

# 'wb' is the mode the Python 2 csv module expects; on Python 3 open the file
# with mode 'w' and newline='' instead.
# The with-block flushes and closes the file even when writing fails.
with open('csv_test.csv', 'wb') as csvfile:
    writer = csv.writer(csvfile)
    writer.writerow(['姓名', '年齡', '電話'])
    writer.writerows(data)

刪除中文字符串

Python
# coding: utf-8
"""Locate non-ASCII / CJK runs with regular expressions.

The sample text is searched once as UTF-8 bytes and then as unicode text.
The script runs on Python 2 and Python 3, so it no longer needs the
reload(sys) / sys.setdefaultencoding('utf8') hack.
"""
import re

s = u"""
en: Regular expression is a powerful tool for manipulating text.
zh: 漢語是世界上最優美的語言,正則表達式是一個頗有用的工具
jp: 正規表現は很是に役に立つツールテキストを操做することです。
jp-char: あアいイうウえエおオ
kr:정규 표현식은 매우 유용한 도구 텍스트를 조작하는 것입니다.
"""


def show_match(title, pattern, text, list_all=False):
    """Print the first match of *pattern* in *text* under *title* and return it.

    When nothing matches, only the ``None`` match object is printed instead
    of failing on ``None.group()``. With *list_all* every match is listed too.
    """
    m = re.search(pattern, text)
    print(title)
    print("--------")
    print(m)
    if m is not None:
        print(m.group())
    if list_all:
        res = re.findall(pattern, text)
        if res:
            print("There are %d parts:\n" % len(res))
            for r in res:
                print("\t" + r)
            print("")
    print("--------\n")
    return m


# The sample text as UTF-8 encoded bytes.
raw = s.encode("utf-8")
print("原始utf8字符")
print("--------")
print(repr(raw))
print("--------\n")

# Every byte of a multi-byte UTF-8 sequence is >= 0x80, so this finds
# non-ASCII runs in the encoded text.
show_match("非ansi字符", b"[\x80-\xff]+", raw)

print("原始unicode字符")
print("--------")
print(repr(s))
print("--------\n")

# Chinese: additionally list every run found.
show_match("unicode 中文", u"[\u4e00-\u9fa5]+", s, list_all=True)

# Remaining code-point ranges searched in the unicode text.
for title, pattern in (
    ("unicode 韓文", u"[\uac00-\ud7ff]+"),
    ("unicode 日文 片假名", u"[\u30a0-\u30ff]+"),
    ("unicode 日文 平假名", u"[\u3040-\u309f]+"),
    ("unicode 標點符號", u"[\u3000-\u303f\ufb00-\ufffd]+"),
):
    show_match(title, pattern, s)

經過scrapinghub提取代理ip,抓取海外網頁

Python
import requests
from requests.auth import HTTPProxyAuth

# Fetch a page through the Crawlera proxy and print which slave served it.
url = "http://m.baidu.com/s?word=seo"
headers = {}
# NOTE(review): proxy_host was never used. The original called .format(proxy_host)
# on a URL without any placeholder, so the proxy has always been
# proxy.crawlera.com. Confirm which host is intended before wiring this in.
proxy_host = "paygo.crawlera.com"
# NOTE(review): API key committed in source; move it to configuration.
proxy_auth = HTTPProxyAuth("88aa8b802a7f4626b659dae926ee445b", "")
proxies = {"http": "http://proxy.crawlera.com:8010/"}

if url.startswith("https:"):
    # Send the request as plain http and set the X-Crawlera-Use-HTTPS header.
    url = "http://" + url[len("https://"):]
    headers["X-Crawlera-Use-HTTPS"] = "1"

r = requests.get(url, headers=headers, proxies=proxies, auth=proxy_auth)
print(r.headers['x-crawlera-slave'])

mysql查詢數據

Python
def sql_r_num(sql):
    """Run *sql* on the module-level connection ``con`` and return the first
    column of the first row, or None when the query yields no row."""
    cur = con.cursor()
    try:
        cur.execute(sql)
        row = cur.fetchone()
    finally:
        # Release the cursor even when execute() raises.
        cur.close()
    return row[0] if row is not None else None


user_nums = sql_r_num("select max(id) from ask_users")

兩個時間點之間,隨機生成日期

Python
import random
import time


def random_date(start=(2018, 1, 1, 0, 0, 0, 0, 0, 0),
                end=(2019, 4, 14, 0, 0, 0, 0, 0, 0)):
    """Return a random local date-time between *start* and *end*, inclusive.

    Both bounds are 9-item time tuples as accepted by ``time.mktime``; the
    defaults are 2018-01-01 00:00:00 and 2019-04-14 00:00:00. The result is
    formatted as ``YYYY-MM-DD HH:MM:SS``.
    """
    # mktime() returns a float; randint() needs integers (a float argument is
    # a TypeError on current Python versions).
    start_ts = int(time.mktime(start))
    end_ts = int(time.mktime(end))
    t = random.randint(start_ts, end_ts)
    return time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(t))

寫入mysql

Python
import sys,time,os,smtplib
import MySQLdb as mdb

# Insert today's statistics rows into the five SEO tables.
# The sql_* value lists are expected to be defined by the surrounding code.
mysql_time = time.strftime('%Y-%m-%d', time.localtime(time.time()))
# Fix: the quotes around the password, database name and charset had been
# mangled into CJK brackets, which made this call a syntax error.
# NOTE(review): host, root account and password are hard-coded; move them to
# configuration.
con = mdb.connect("23.236.79.228", "root", "123456", "seo_data", charset="utf8", unix_socket='/tmp/mysql.sock')
cur = con.cursor()

# NOTE(review): the statements are built by string interpolation; this is only
# acceptable while the sql_* lists hold trusted values.
mysql_haosou_uv = '''INSERT INTO haosou_pc_uv VALUES ("%s",%s)''' % (mysql_time,','.join(sql_haosou_uv))
mysql_bd_pc_spider = '''INSERT INTO bd_pc_spider VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_pc_spider))
mysql_bd_m_spider = '''INSERT INTO bd_m_spider VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_m_spider))
mysql_bd_pc_uv = '''INSERT INTO bd_pc_uv VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_pc_uv))
mysql_bd_m_uv = '''INSERT INTO bd_m_uv VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_m_uv))

sql_list = [mysql_haosou_uv,mysql_bd_pc_spider,mysql_bd_m_spider,mysql_bd_pc_uv,mysql_bd_m_uv]
for sql in sql_list:
    print('Import:%s' % sql)
    try:
        cur.execute(sql)
        con.commit()
        print('done')
    except mdb.Error as exc:
        # Undo the failed statement and report it instead of hiding the error.
        con.rollback()
        print('failed, rolled back: %s' % exc)

判斷字符串是否所有爲中文

Python
# coding:utf-8
import sys


def check_contain_chinese(check_str):
    """Return 1 when every character of *check_str* is a CJK ideograph, else 0.

    *check_str* may be unicode text or UTF-8 encoded bytes. A character counts
    as Chinese when it lies in U+4E00..U+9FFF. An empty string yields 1, as
    it did before.
    """
    if isinstance(check_str, bytes):
        # Decode explicitly rather than relying on sys.setdefaultencoding().
        check_str = check_str.decode('utf-8')
    for ch in check_str:
        if not (u'\u4e00' <= ch <= u'\u9fff'):
            # One foreign character settles the answer.
            return 0
    return 1

文本格式化

Python
# Remove every tag whose name does not start with "p", "img" or "/p", then
# trim leading/trailing whitespace. Quotes are left untouched.
# NOTE(review): the look-ahead also keeps other tags starting with "p", such as <pre>.
a = re.sub(r'<(?!p|img|/p)[^<>]*?>','',content).strip()
# Reduce every opening p tag to a bare <p>.
b = re.sub(r'<p[^>]*?>','<p>',a)
# Fix: this assignment had been fused into the comment on the previous line and
# never ran. A callable replacement keeps backslashes in `title` literal.
newcontent = re.sub(r'alt="[^"]*?"', lambda _match: 'alt="%s"' % title, b).lower()

提取字符串中文並計算字數

Python
# Strip whitespace plus Chinese and English punctuation from the formatted HTML.
# A unicode literal replaces the Python 2 only str.decode("utf8") calls.
text = re.sub(u"[\\s+\\.\\!\\/_,$%^*(+\"']+|[+——!,::。?、~@#¥%……&*()「」《》]+", u"", newcontent)
# Fix: the two statements below had been fused into the trailing comment of the
# line above and never ran.
# Drop every remaining tag.
text2 = re.sub('<[^>]*?>','',text)
# Number of characters left after stripping.
words_number = len(text2)

unicode字符串轉義(Python中,如何將反斜槓u類型(\uXXXX)的字符串,轉換爲對應的unicode的字符)

Python
import codecs

# Text holding literal \uXXXX escape sequences (backslash, "u", four hex digits).
slashUStr = "\\u0063\\u0072\\u0069\\u0066\\u0061\\u006E\\u0020\\u5728\\u8DEF\\u4E0A"
# codecs.decode works on both Python 2 and Python 3; str.decode() exists on
# Python 2 only.
decodedUniChars = codecs.decode(slashUStr, "unicode-escape")
print("decodedUniChars= " + decodedUniChars)

json與dict轉化

Python
import simplejson

# Parse the JSON text held in `user` (defined by the surrounding code).
json_2_dict = simplejson.loads(user)
print(json_2_dict)

# Serialise the parsed object back into a JSON string.
dict_2_jsonstr = simplejson.dumps(json_2_dict)
print(dict_2_jsonstr)

識別客戶端類型

Python
import re

# Substrings that mark a mobile browser anywhere in the user-agent string.
# Fix: the patterns are raw strings, so the doubled backslashes ("\\d", "\\/",
# "\\.") matched a literal backslash instead of a digit, "/" or ".".
_MOBILE_UA_RE = re.compile(
    r"(android|bb\d+|meego).+mobile|avantgo|bada\/|blackberry|blazer|compal|"
    r"elaine|fennec|hiptop|iemobile|ip(hone|od)|iris|kindle|lge |maemo|midp|"
    r"mmp|mobile.+firefox|netfront|opera m(ob|in)i|palm( os)?|phone|"
    r"p(ixi|re)\/|plucker|pocket|psp|series(4|6)0|symbian|treo|"
    r"up\.(browser|link)|vodafone|wap|windows ce|xda|xiino",
    re.I | re.M)

# Vendor/model codes looked for in the first four characters of the user agent.
_MOBILE_PREFIX_RE = re.compile(
    r"1207|6310|6590|3gso|4thp|50[1-6]i|770s|802s|a wa|abac|ac(er|oo|s\-)|"
    r"ai(ko|rn)|al(av|ca|co)|amoi|an(ex|ny|yw)|aptu|ar(ch|go)|as(te|us)|attw|"
    r"au(di|\-m|r |s )|avan|be(ck|ll|nq)|bi(lb|rd)|bl(ac|az)|br(e|v)w|bumb|"
    r"bw\-(n|u)|c55\/|capi|ccwa|cdm\-|cell|chtm|cldc|cmd\-|co(mp|nd)|craw|"
    r"da(it|ll|ng)|dbte|dc\-s|devi|dica|dmob|do(c|p)o|ds(12|\-d)|el(49|ai)|"
    r"em(l2|ul)|er(ic|k0)|esl8|ez([4-7]0|os|wa|ze)|fetc|fly(\-|_)|g1 u|g560|"
    r"gene|gf\-5|g\-mo|go(\.w|od)|gr(ad|un)|haie|hcit|hd\-(m|p|t)|hei\-|"
    r"hi(pt|ta)|hp( i|ip)|hs\-c|ht(c(\-| |_|a|g|p|s|t)|tp)|hu(aw|tc)|"
    r"i\-(20|go|ma)|i230|iac( |\-|\/)|ibro|idea|ig01|ikom|im1k|inno|ipaq|iris|"
    r"ja(t|v)a|jbro|jemu|jigs|kddi|keji|kgt( |\/)|klon|kpt |kwc\-|kyo(c|k)|"
    r"le(no|xi)|lg( g|\/(k|l|u)|50|54|\-[a-w])|libw|lynx|m1\-w|m3ga|m50\/|"
    r"ma(te|ui|xo)|mc(01|21|ca)|m\-cr|me(rc|ri)|mi(o8|oa|ts)|mmef|"
    r"mo(01|02|bi|de|do|t(\-| |o|v)|zz)|mt(50|p1|v )|mwbp|mywa|n10[0-2]|"
    r"n20[2-3]|n30(0|2)|n50(0|2|5)|n7(0(0|1)|10)|ne((c|m)\-|on|tf|wf|wg|wt)|"
    r"nok(6|i)|nzph|o2im|op(ti|wv)|oran|owg1|p800|pan(a|d|t)|pdxg|"
    r"pg(13|\-([1-8]|c))|phil|pire|pl(ay|uc)|pn\-2|po(ck|rt|se)|prox|psio|"
    r"pt\-g|qa\-a|qc(07|12|21|32|60|\-[2-7]|i\-)|qtek|r380|r600|raks|rim9|"
    r"ro(ve|zo)|s55\/|sa(ge|ma|mm|ms|ny|va)|sc(01|h\-|oo|p\-)|sdk\/|"
    r"se(c(\-|0|1)|47|mc|nd|ri)|sgh\-|shar|sie(\-|m)|sk\-0|sl(45|id)|"
    r"sm(al|ar|b3|it|t5)|so(ft|ny)|sp(01|h\-|v\-|v )|sy(01|mb)|t2(18|50)|"
    r"t6(00|10|18)|ta(gt|lk)|tcl\-|tdg\-|tel(i|m)|tim\-|t\-mo|to(pl|sh)|"
    r"ts(70|m\-|m3|m5)|tx\-9|up(\.b|g1|si)|utst|v400|v750|veri|vi(rg|te)|"
    r"vk(40|5[0-3]|\-v)|vm40|voda|vulc|vx(52|53|60|61|70|80|81|83|85|98)|"
    r"w3c(\-| )|webc|whit|wi(g |nc|nw)|wmlb|wonu|x700|yas\-|your|zeto|zte\-",
    re.I | re.M)


def getUA(ua):
    """Classify the user-agent string *ua*: 'wap' for mobile clients, else 'pc'.

    A client is mobile when a known marker occurs anywhere in *ua* or a known
    vendor/model code occurs within its first four characters.
    """
    if _MOBILE_UA_RE.search(ua) or _MOBILE_PREFIX_RE.search(ua[0:4]):
        return 'wap'
    return 'pc'

日期遍歷

Python
import datetime
import time


def date_range(start, end, only_monday=False, input_format='%y%m%d', output_format='%y%m%d'):
    """Return every day from *start* to *end* (both inclusive) as formatted strings.

    *start* and *end* are converted with ``str()`` and parsed with
    *input_format*; each day is rendered with *output_format*. With
    *only_monday* only Mondays are kept. The list is empty when *start* is
    later than *end*.

    Example: ``date_range(140130, 140202)`` returns
    ``['140130', '140131', '140201', '140202']``.
    """
    first = datetime.datetime.strptime(str(start), input_format)
    last = datetime.datetime.strptime(str(end), input_format)
    one_day = datetime.timedelta(days=1)
    range_ = []
    d = first
    while d <= last:
        # '%w' numbers the weekdays from Sunday = 0, so Monday is '1'.
        if not only_monday or d.strftime('%w') == '1':
            range_.append(d.strftime(output_format))
        d += one_day
    return range_

查看某模塊路徑

Bash
# Show selenium's package metadata together with the list of files it installed.
pip show -f selenium

文件編碼轉換

Bash
# Recursively convert the file *names* under ydcz_1/ from GBK to UTF-8.
# --notest performs the renames for real; without it convmv only does a dry run.
convmv -r --notest -f GBK -t UTF-8 ydcz_1/

查找當前目錄下,結尾爲.php的文件中,包含字符串「zfb_box」的文件

Bash
# Search every *.php file below the current directory for the string "zfb_box".
# Fix: the opening quote had been mangled into a CJK bracket, leaving the
# string unterminated. -print0 / -0 keep file names containing spaces intact.
find ./ -name "*.php" -print0 | xargs -0 grep "zfb_box"

百度搜索結果URL提取主域名

Bash
# Take column 3 (the URL) of the comma-separated file, keep the scheme+host
# part, isolate the host name, then keep only its trailing ".name.tld" part.
# Fix: the closing double quote of the last pattern had been mangled into a
# CJK bracket, leaving the pattern unterminated.
cat xinxi_jieguo|awk -F"," '{print $3}'|egrep -o 'http://[^/]*?/' |egrep -o '([a-z0-9_-]{1,32}\.)+([a-z0-9_-]{1,32})((\.[a-z]{2,4})(.[a-z]{1,2})?)'|egrep -o "\.[^\.]*?\.(com\.cn|com|cn|net|org|cc|hk|tv|info|de|tw|wang|kr)$"

 

統計每一個域名流量分發

Bash
# For URLs (column 3) on *.1688.com hosts, count occurrences of each
# "http://host/first-path-segment/" prefix, most frequent first.
# Fix: the dot before "com" was unescaped and therefore matched any character.
cat xinxi_jieguo|awk -F"," '{print $3}'|egrep '\.1688\.com'|egrep -o 'http://[^/]*?/[^/]*?/' | sort|uniq -c|sort -nr

201904172109394211332.jpg

 

兩文件按列合併

Bash
# Join 4+.txt and out.txt line by line, separated by one space, into hebing.txt.
paste -d ' ' 4+.txt out.txt >hebing.txt

awk計算重複次數

Bash
# Count how many times each distinct value of column 1 occurs in urldata.
awk '{ count[$1]++ } END { for (key in count) print key, count[key] }' urldata

按列求和

Bash
# Sum column 2 over the lines of "test" that contain "aaa".
# Fix: the closing single quote had been mangled into a typographic quote,
# which left the awk program unterminated.
awk '/aaa/ {sum += $2} END {print sum}' test

按列求和2

Bash
# Sum column 2 of test.txt grouped by the value of column 1.
awk '{ total[$1] += $2 } END { for (key in total) print key, total[key] }' test.txt

按行數將一個文件分割成多個,sitemap使用

Bash
# Cut "file" into pieces of 8142 lines each; output names start with "outfile".
split -l 8142 file outfile

查找目錄下包含某個字符的文件

Bash
# Print every line below the current directory that contains "IBM" (case-insensitive).
# Fix: `find . | xargs grep -r` handed "." itself to a recursive grep and then
# every file again, so matches were reported twice and file names containing
# spaces were split. A recursive grep on "." is sufficient.
grep -ri "IBM" .

python下載圖片

Python
#! /usr/bin/env python
# coding=utf-8
"""Download the images listed in logo_url.txt into the current directory.

Every line of logo_url.txt is comma separated: the second field becomes the
file name stem and the third field is the image URL.
"""
import os

try:
    from urllib import urlretrieve  # Python 2
except ImportError:
    from urllib.request import urlretrieve  # Python 3

filepath = os.getcwd()
if not os.path.exists(filepath):
    os.mkdir(filepath)

x = 1  # ordinal of the image currently being fetched; advances on success only
print(u'爬蟲準備就緒...')
with open('logo_url.txt') as url_file:
    for line in url_file:
        fields = line.strip().split(',')
        if len(fields) < 3:
            # Malformed row: there is no id/URL pair to download.
            continue
        image_id, imgurl = fields[1], fields[2]
        temp = '%s.jpg' % image_id
        print(u'正在下載第%s張圖片' % x)
        print(imgurl)
        try:
            urlretrieve(imgurl, temp)
        except Exception:
            # Best effort: one failed download must not stop the batch.
            continue
        x += 1
print(u'圖片下載完畢,保存路徑爲' + filepath)

MD5生成

Python
import hashlib

# Hex MD5 digest of `src`, which the surrounding code must define.
m2 = hashlib.md5(src)
print(m2.hexdigest())

讀取CSV

Python
# coding: utf-8
"""Print every row of csv_test.csv."""
import csv

# 'rb' is the mode the Python 2 csv module expects; on Python 3 open the file
# with mode 'r' and newline='' instead.
# The with-block closes the file even when reading fails.
with open('csv_test.csv', 'rb') as csvfile:
    for line in csv.reader(csvfile):
        print(line)

寫入CSV

Python
# coding: utf-8
"""Write a header row and two sample records to csv_test.csv."""
import csv

data = [
    ('小河', '25', '1234567'),
    ('小芳', '18', '789456'),
]

# 'wb' is the mode the Python 2 csv module expects; on Python 3 open the file
# with mode 'w' and newline='' instead.
# The with-block flushes and closes the file even when writing fails.
with open('csv_test.csv', 'wb') as csvfile:
    writer = csv.writer(csvfile)
    writer.writerow(['姓名', '年齡', '電話'])
    writer.writerows(data)

刪除中文字符串

Python
# coding: utf-8
"""Locate non-ASCII / CJK runs with regular expressions.

The sample text is searched once as UTF-8 bytes and then as unicode text.
The script runs on Python 2 and Python 3, so it no longer needs the
reload(sys) / sys.setdefaultencoding('utf8') hack.
"""
import re

s = u"""
en: Regular expression is a powerful tool for manipulating text.
zh: 漢語是世界上最優美的語言,正則表達式是一個頗有用的工具
jp: 正規表現は很是に役に立つツールテキストを操做することです。
jp-char: あアいイうウえエおオ
kr:정규 표현식은 매우 유용한 도구 텍스트를 조작하는 것입니다.
"""


def show_match(title, pattern, text, list_all=False):
    """Print the first match of *pattern* in *text* under *title* and return it.

    When nothing matches, only the ``None`` match object is printed instead
    of failing on ``None.group()``. With *list_all* every match is listed too.
    """
    m = re.search(pattern, text)
    print(title)
    print("--------")
    print(m)
    if m is not None:
        print(m.group())
    if list_all:
        res = re.findall(pattern, text)
        if res:
            print("There are %d parts:\n" % len(res))
            for r in res:
                print("\t" + r)
            print("")
    print("--------\n")
    return m


# The sample text as UTF-8 encoded bytes.
raw = s.encode("utf-8")
print("原始utf8字符")
print("--------")
print(repr(raw))
print("--------\n")

# Every byte of a multi-byte UTF-8 sequence is >= 0x80, so this finds
# non-ASCII runs in the encoded text.
show_match("非ansi字符", b"[\x80-\xff]+", raw)

print("原始unicode字符")
print("--------")
print(repr(s))
print("--------\n")

# Chinese: additionally list every run found.
show_match("unicode 中文", u"[\u4e00-\u9fa5]+", s, list_all=True)

# Remaining code-point ranges searched in the unicode text.
for title, pattern in (
    ("unicode 韓文", u"[\uac00-\ud7ff]+"),
    ("unicode 日文 片假名", u"[\u30a0-\u30ff]+"),
    ("unicode 日文 平假名", u"[\u3040-\u309f]+"),
    ("unicode 標點符號", u"[\u3000-\u303f\ufb00-\ufffd]+"),
):
    show_match(title, pattern, s)

經過scrapinghub提取代理ip,抓取海外網頁

Python
import requests
from requests.auth import HTTPProxyAuth

# Fetch a page through the Crawlera proxy and print which slave served it.
url = "http://m.baidu.com/s?word=seo"
headers = {}
# NOTE(review): proxy_host was never used. The original called .format(proxy_host)
# on a URL without any placeholder, so the proxy has always been
# proxy.crawlera.com. Confirm which host is intended before wiring this in.
proxy_host = "paygo.crawlera.com"
# NOTE(review): API key committed in source; move it to configuration.
proxy_auth = HTTPProxyAuth("88aa8b802a7f4626b659dae926ee445b", "")
proxies = {"http": "http://proxy.crawlera.com:8010/"}

if url.startswith("https:"):
    # Send the request as plain http and set the X-Crawlera-Use-HTTPS header.
    url = "http://" + url[len("https://"):]
    headers["X-Crawlera-Use-HTTPS"] = "1"

r = requests.get(url, headers=headers, proxies=proxies, auth=proxy_auth)
print(r.headers['x-crawlera-slave'])

mysql查詢數據

Python
def sql_r_num(sql):
    """Run *sql* on the module-level connection ``con`` and return the first
    column of the first row, or None when the query yields no row."""
    cur = con.cursor()
    try:
        cur.execute(sql)
        row = cur.fetchone()
    finally:
        # Release the cursor even when execute() raises.
        cur.close()
    return row[0] if row is not None else None


user_nums = sql_r_num("select max(id) from ask_users")

兩個時間點之間,隨機生成日期

Python
import random
import time


def random_date(start=(2018, 1, 1, 0, 0, 0, 0, 0, 0),
                end=(2019, 4, 14, 0, 0, 0, 0, 0, 0)):
    """Return a random local date-time between *start* and *end*, inclusive.

    Both bounds are 9-item time tuples as accepted by ``time.mktime``; the
    defaults are 2018-01-01 00:00:00 and 2019-04-14 00:00:00. The result is
    formatted as ``YYYY-MM-DD HH:MM:SS``.
    """
    # mktime() returns a float; randint() needs integers (a float argument is
    # a TypeError on current Python versions).
    start_ts = int(time.mktime(start))
    end_ts = int(time.mktime(end))
    t = random.randint(start_ts, end_ts)
    return time.strftime("%Y-%m-%d %H:%M:%S", time.localtime(t))

寫入mysql

Python
import sys,time,os,smtplib
import MySQLdb as mdb

# Insert today's statistics rows into the five SEO tables.
# The sql_* value lists are expected to be defined by the surrounding code.
mysql_time = time.strftime('%Y-%m-%d', time.localtime(time.time()))
# Fix: the quotes around the password, database name and charset had been
# mangled into CJK brackets, which made this call a syntax error.
# NOTE(review): host, root account and password are hard-coded; move them to
# configuration.
con = mdb.connect("23.236.79.228", "root", "123456", "seo_data", charset="utf8", unix_socket='/tmp/mysql.sock')
cur = con.cursor()

# NOTE(review): the statements are built by string interpolation; this is only
# acceptable while the sql_* lists hold trusted values.
mysql_haosou_uv = '''INSERT INTO haosou_pc_uv VALUES ("%s",%s)''' % (mysql_time,','.join(sql_haosou_uv))
mysql_bd_pc_spider = '''INSERT INTO bd_pc_spider VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_pc_spider))
mysql_bd_m_spider = '''INSERT INTO bd_m_spider VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_m_spider))
mysql_bd_pc_uv = '''INSERT INTO bd_pc_uv VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_pc_uv))
mysql_bd_m_uv = '''INSERT INTO bd_m_uv VALUES ("%s",%s)''' % (mysql_time,','.join(sql_bd_m_uv))

sql_list = [mysql_haosou_uv,mysql_bd_pc_spider,mysql_bd_m_spider,mysql_bd_pc_uv,mysql_bd_m_uv]
for sql in sql_list:
    print('Import:%s' % sql)
    try:
        cur.execute(sql)
        con.commit()
        print('done')
    except mdb.Error as exc:
        # Undo the failed statement and report it instead of hiding the error.
        con.rollback()
        print('failed, rolled back: %s' % exc)

判斷字符串是否所有爲中文

Python
# coding:utf-8
import sys


def check_contain_chinese(check_str):
    """Return 1 when every character of *check_str* is a CJK ideograph, else 0.

    *check_str* may be unicode text or UTF-8 encoded bytes. A character counts
    as Chinese when it lies in U+4E00..U+9FFF. An empty string yields 1, as
    it did before.
    """
    if isinstance(check_str, bytes):
        # Decode explicitly rather than relying on sys.setdefaultencoding().
        check_str = check_str.decode('utf-8')
    for ch in check_str:
        if not (u'\u4e00' <= ch <= u'\u9fff'):
            # One foreign character settles the answer.
            return 0
    return 1

文本格式化

Python
# Remove every tag whose name does not start with "p", "img" or "/p", then
# trim leading/trailing whitespace. Quotes are left untouched.
# NOTE(review): the look-ahead also keeps other tags starting with "p", such as <pre>.
a = re.sub(r'<(?!p|img|/p)[^<>]*?>','',content).strip()
# Reduce every opening p tag to a bare <p>.
b = re.sub(r'<p[^>]*?>','<p>',a)
# Fix: this assignment had been fused into the comment on the previous line and
# never ran. A callable replacement keeps backslashes in `title` literal.
newcontent = re.sub(r'alt="[^"]*?"', lambda _match: 'alt="%s"' % title, b).lower()

提取字符串中文並計算字數

Python
# Strip whitespace plus Chinese and English punctuation from the formatted HTML.
# A unicode literal replaces the Python 2 only str.decode("utf8") calls.
text = re.sub(u"[\\s+\\.\\!\\/_,$%^*(+\"']+|[+——!,::。?、~@#¥%……&*()「」《》]+", u"", newcontent)
# Fix: the two statements below had been fused into the trailing comment of the
# line above and never ran.
# Drop every remaining tag.
text2 = re.sub('<[^>]*?>','',text)
# Number of characters left after stripping.
words_number = len(text2)

unicode字符串轉義(Python中,如何將反斜槓u類型(\uXXXX)的字符串,轉換爲對應的unicode的字符)

Python
import codecs

# Text holding literal \uXXXX escape sequences (backslash, "u", four hex digits).
slashUStr = "\\u0063\\u0072\\u0069\\u0066\\u0061\\u006E\\u0020\\u5728\\u8DEF\\u4E0A"
# codecs.decode works on both Python 2 and Python 3; str.decode() exists on
# Python 2 only.
decodedUniChars = codecs.decode(slashUStr, "unicode-escape")
print("decodedUniChars= " + decodedUniChars)

json與dict轉化

Python
import simplejson

# Parse the JSON text held in `user` (defined by the surrounding code).
json_2_dict = simplejson.loads(user)
print(json_2_dict)

# Serialise the parsed object back into a JSON string.
dict_2_jsonstr = simplejson.dumps(json_2_dict)
print(dict_2_jsonstr)

識別客戶端類型

Python
import re

# Substrings that mark a mobile browser anywhere in the user-agent string.
# Fix: the patterns are raw strings, so the doubled backslashes ("\\d", "\\/",
# "\\.") matched a literal backslash instead of a digit, "/" or ".".
_MOBILE_UA_RE = re.compile(
    r"(android|bb\d+|meego).+mobile|avantgo|bada\/|blackberry|blazer|compal|"
    r"elaine|fennec|hiptop|iemobile|ip(hone|od)|iris|kindle|lge |maemo|midp|"
    r"mmp|mobile.+firefox|netfront|opera m(ob|in)i|palm( os)?|phone|"
    r"p(ixi|re)\/|plucker|pocket|psp|series(4|6)0|symbian|treo|"
    r"up\.(browser|link)|vodafone|wap|windows ce|xda|xiino",
    re.I | re.M)

# Vendor/model codes looked for in the first four characters of the user agent.
_MOBILE_PREFIX_RE = re.compile(
    r"1207|6310|6590|3gso|4thp|50[1-6]i|770s|802s|a wa|abac|ac(er|oo|s\-)|"
    r"ai(ko|rn)|al(av|ca|co)|amoi|an(ex|ny|yw)|aptu|ar(ch|go)|as(te|us)|attw|"
    r"au(di|\-m|r |s )|avan|be(ck|ll|nq)|bi(lb|rd)|bl(ac|az)|br(e|v)w|bumb|"
    r"bw\-(n|u)|c55\/|capi|ccwa|cdm\-|cell|chtm|cldc|cmd\-|co(mp|nd)|craw|"
    r"da(it|ll|ng)|dbte|dc\-s|devi|dica|dmob|do(c|p)o|ds(12|\-d)|el(49|ai)|"
    r"em(l2|ul)|er(ic|k0)|esl8|ez([4-7]0|os|wa|ze)|fetc|fly(\-|_)|g1 u|g560|"
    r"gene|gf\-5|g\-mo|go(\.w|od)|gr(ad|un)|haie|hcit|hd\-(m|p|t)|hei\-|"
    r"hi(pt|ta)|hp( i|ip)|hs\-c|ht(c(\-| |_|a|g|p|s|t)|tp)|hu(aw|tc)|"
    r"i\-(20|go|ma)|i230|iac( |\-|\/)|ibro|idea|ig01|ikom|im1k|inno|ipaq|iris|"
    r"ja(t|v)a|jbro|jemu|jigs|kddi|keji|kgt( |\/)|klon|kpt |kwc\-|kyo(c|k)|"
    r"le(no|xi)|lg( g|\/(k|l|u)|50|54|\-[a-w])|libw|lynx|m1\-w|m3ga|m50\/|"
    r"ma(te|ui|xo)|mc(01|21|ca)|m\-cr|me(rc|ri)|mi(o8|oa|ts)|mmef|"
    r"mo(01|02|bi|de|do|t(\-| |o|v)|zz)|mt(50|p1|v )|mwbp|mywa|n10[0-2]|"
    r"n20[2-3]|n30(0|2)|n50(0|2|5)|n7(0(0|1)|10)|ne((c|m)\-|on|tf|wf|wg|wt)|"
    r"nok(6|i)|nzph|o2im|op(ti|wv)|oran|owg1|p800|pan(a|d|t)|pdxg|"
    r"pg(13|\-([1-8]|c))|phil|pire|pl(ay|uc)|pn\-2|po(ck|rt|se)|prox|psio|"
    r"pt\-g|qa\-a|qc(07|12|21|32|60|\-[2-7]|i\-)|qtek|r380|r600|raks|rim9|"
    r"ro(ve|zo)|s55\/|sa(ge|ma|mm|ms|ny|va)|sc(01|h\-|oo|p\-)|sdk\/|"
    r"se(c(\-|0|1)|47|mc|nd|ri)|sgh\-|shar|sie(\-|m)|sk\-0|sl(45|id)|"
    r"sm(al|ar|b3|it|t5)|so(ft|ny)|sp(01|h\-|v\-|v )|sy(01|mb)|t2(18|50)|"
    r"t6(00|10|18)|ta(gt|lk)|tcl\-|tdg\-|tel(i|m)|tim\-|t\-mo|to(pl|sh)|"
    r"ts(70|m\-|m3|m5)|tx\-9|up(\.b|g1|si)|utst|v400|v750|veri|vi(rg|te)|"
    r"vk(40|5[0-3]|\-v)|vm40|voda|vulc|vx(52|53|60|61|70|80|81|83|85|98)|"
    r"w3c(\-| )|webc|whit|wi(g |nc|nw)|wmlb|wonu|x700|yas\-|your|zeto|zte\-",
    re.I | re.M)


def getUA(ua):
    """Classify the user-agent string *ua*: 'wap' for mobile clients, else 'pc'.

    A client is mobile when a known marker occurs anywhere in *ua* or a known
    vendor/model code occurs within its first four characters.
    """
    if _MOBILE_UA_RE.search(ua) or _MOBILE_PREFIX_RE.search(ua[0:4]):
        return 'wap'
    return 'pc'

日期遍歷

Python
import datetime
import time


def date_range(start, end, only_monday=False, input_format='%y%m%d', output_format='%y%m%d'):
    """Return every day from *start* to *end* (both inclusive) as formatted strings.

    *start* and *end* are converted with ``str()`` and parsed with
    *input_format*; each day is rendered with *output_format*. With
    *only_monday* only Mondays are kept. The list is empty when *start* is
    later than *end*.

    Example: ``date_range(140130, 140202)`` returns
    ``['140130', '140131', '140201', '140202']``.
    """
    first = datetime.datetime.strptime(str(start), input_format)
    last = datetime.datetime.strptime(str(end), input_format)
    one_day = datetime.timedelta(days=1)
    range_ = []
    d = first
    while d <= last:
        # '%w' numbers the weekdays from Sunday = 0, so Monday is '1'.
        if not only_monday or d.strftime('%w') == '1':
            range_.append(d.strftime(output_format))
        d += one_day
    return range_

轉載自:https://www.gogochuang.com/post/58.html

相關文章
相關標籤/搜索