44 lines
1.2 KiB
Python
44 lines
1.2 KiB
Python
|
import time
|
||
|
import re
|
||
|
|
||
|
from iwla import IWLA
|
||
|
from iplugin import IPlugin
|
||
|
|
||
|
class IWLAPostAnalysisTopPages(IPlugin):
|
||
|
def __init__(self, iwla):
|
||
|
super(IWLAPostAnalysisTopPages, self).__init__(iwla)
|
||
|
self.API_VERSION = 1
|
||
|
|
||
|
def load(self):
|
||
|
self.index_re = re.compile(r'/index.*')
|
||
|
return True
|
||
|
|
||
|
def hook(self):
|
||
|
start_time = self.iwla.getStartAnalysisTime()
|
||
|
start_time = time.mktime(start_time)
|
||
|
|
||
|
stats = self.iwla.getCurrentVisists()
|
||
|
month_stats = self.iwla.getMonthStats()
|
||
|
|
||
|
top_pages = month_stats.get('top_pages', {})
|
||
|
|
||
|
for (k, super_hit) in stats.items():
|
||
|
if super_hit['robot']: continue
|
||
|
for r in super_hit['requests']:
|
||
|
if not r['is_page']: continue
|
||
|
|
||
|
if time.mktime(r['time_decoded']) < start_time: continue
|
||
|
|
||
|
uri = r['extract_request']['extract_uri']
|
||
|
if self.index_re.match(uri):
|
||
|
uri = '/'
|
||
|
|
||
|
uri = "%s%s" % (r.get('server_name', ''), uri)
|
||
|
|
||
|
if not uri in top_pages.keys():
|
||
|
top_pages[uri] = 1
|
||
|
else:
|
||
|
top_pages[uri] += 1
|
||
|
|
||
|
month_stats['top_pages'] = top_pages
|