python统计最近几天访问的网站次数

时间：2014-03-28 19:05:20 阅读：703 评论：0 收藏：0 [点我收藏+]

数据来自 Chrome 的 History 文件：它是一个 SQLite 数据库，Python 自带的 sqlite3 模块可以直接读取。

import sqlite3
import thread
import time
import datetime
import re
# Default location of the Chrome History file; replace it with the path on
# your own machine.  A raw string keeps the Windows backslashes literal.
DEFAULT_HISTORY_PATH = (
    r'C:\Users\Administrator\AppData\Local\Google\Chrome'
    r'\User Data\Default\History'
)


def getHistoryDB(path=DEFAULT_HISTORY_PATH):
    """Read every row of the ``urls`` table from a Chrome History database.

    Args:
        path: Location of the SQLite History file.  Defaults to the
            hard-coded Windows profile path above.

    Returns:
        A list of ``(url, title, visit_time)`` tuples, where ``visit_time``
        is the first 11 characters of ``last_visit_time`` minus 11644473600.
        NOTE(review): this presumably turns Chrome's microseconds-since-1601
        timestamp into Unix seconds -- confirm against the Chrome schema.

    Raises:
        sqlite3.Error: If the file cannot be opened or queried.
    """
    db = sqlite3.connect(path)
    try:
        cu = db.cursor()
        try:
            cu.execute("select url,title,(substr(last_visit_time,1,11)-11644473600) from urls")
            return cu.fetchall()
        finally:
            cu.close()
    finally:
        # Always release the database handle, even when the query fails.
        db.close()
        
def getWebsite(result):
    """Count how many history rows belong to each website.

    Args:
        result: Iterable of rows whose first element is the URL string
            (for example the rows returned by ``getHistoryDB``).

    Returns:
        A dict mapping the host returned by ``getUrl`` to the number of rows
        with that host.  Hosts that contain no dot are all counted under the
        single key ``'others'``.
    """
    AllWebsite = {}
    for row in result:
        # Reduce the full URL to its host part.
        host = getUrl(row[0])
        # A host without any dot is not treated as a real website name.
        key = host if '.' in host else 'others'
        AllWebsite[key] = AllWebsite.get(key, 0) + 1
    return AllWebsite

def displayWebsite():
    """Print each visited website and its visit count, one per line.

    Loads the rows with ``getHistoryDB``, aggregates them with
    ``getWebsite`` and writes ``<host> <count>`` lines to standard output.
    """
    AllWebsite = getWebsite(getHistoryDB())
    for site, visits in AllWebsite.items():
        # One pre-formatted string prints the same "host count" line under
        # both the Python 2 print statement and the Python 3 print function.
        print('%s %s' % (site, visits))
        
# Extract the key part of a URL, e.g. http://www.baidu.com/xxxxxxx yields www.baidu.com
# Captures everything after the first "//" up to the next "/", "?" or "#"
# (or the end of the string).  Compiled once because getUrl runs per row.
_HOST_PATTERN = re.compile(r'//([^/?#]*)')


def getUrl(urls):
    """Return the host part of a URL string.

    For ``http://www.baidu.com/xxxxxxx`` this returns ``www.baidu.com``.
    A URL with no path after the host (``http://www.baidu.com``) is handled
    too; it does not need a trailing slash.

    Args:
        urls: The URL string to inspect.

    Returns:
        The text between the first ``//`` and the following ``/``, ``?``,
        ``#`` or end of string (possibly empty), or the string ``'nothing'``
        when the URL contains no ``//`` at all.
    """
    match = _HOST_PATTERN.search(urls)
    if match is None:
        return 'nothing'
    return match.group(1)
    
# Formats a visit time for display; currently not used by the script
def getTime(vtime):
    """Format a timestamp as a local-time ``YYYY-MM-DD HH:MM:SS`` string.

    Args:
        vtime: Seconds since the Unix epoch, as a number or anything
            ``float()`` accepts (e.g. a numeric string).

    Returns:
        The timestamp rendered in the machine's local time zone.
    """
    return time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(float(vtime)))
    
# Run the report only when the file is executed as a script, not on import.
if __name__ == '__main__':
    displayWebsite()

去看看你最近常浏览的网站吧，看看是否有什么有趣的发现？

python统计最近几天访问的网站次数,布布扣,bubuko.com

python统计最近几天访问的网站次数

原文：http://blog.csdn.net/iloster/article/details/22323891

踩

(0)

评论一句话评论（0）

分享档案

更多>

2021年09月23日 (328)
2021年09月24日 (313)
2021年09月17日 (191)
2021年09月15日 (369)
2021年09月16日 (411)
2021年09月13日 (439)
2021年09月11日 (398)
2021年09月12日 (393)
2021年09月10日 (160)
2021年09月08日 (222)