iwla

iwla Commit Details

Date:2014-11-27 13:47:31 (6 years 9 months ago)
Author:Grégory Soutadé
Branch:dev, master
Commit:f7bf2e11bad5981f72f9680198e88d7abaa99d23
Parents: c87ddfb1aabdbbefd6dca0f01bd0aee3a6fd208a
Message:Add top_hits plugin

Changes:
Cplugins/post_analysis/top_pages.py → plugins/post_analysis/top_hits.py
Aplugins/display/top_hits.py (full)

File differences

plugins/display/top_hits.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
import time
from iwla import IWLA
from iplugin import IPlugin
from display import *
class IWLADisplayTopHits(IPlugin):
def __init__(self, iwla):
super(IWLADisplayTopHits, self).__init__(iwla)
self.API_VERSION = 1
self.requires = ['IWLAPostAnalysisTopHits']
def hook(self):
top_hits = self.iwla.getMonthStats()['top_hits']
top_hits = sorted(top_hits.items(), key=lambda t: t[1], reverse=True)
index = self.iwla.getDisplayIndex()
table = DisplayHTMLBlockTable('Top Hits', ['URI', 'Entrance'])
for (uri, entrance) in top_hits[:10]:
table.appendRow([uri, entrance])
index.appendBlock(table)
cur_time = self.iwla.getCurTime()
title = time.strftime('All Hits - %B %Y', cur_time)
filename = 'top_hits_%d.html' % (cur_time.tm_mon)
path = '%d/%s' % (cur_time.tm_year, filename)
page = DisplayHTMLPage(title, path)
table = DisplayHTMLBlockTable('Top Hits', ['URI', 'Entrance'])
for (uri, entrance) in top_hits:
table.appendRow([uri, entrance])
page.appendBlock(table)
display = self.iwla.getDisplay()
display.addPage(page)
block = DisplayHTMLRawBlock()
block.setRawHTML('<a href=\'%s\'>All hits</a>' % (filename))
index.appendBlock(block)
plugins/post_analysis/top_hits.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
from iwla import IWLA
from iplugin import IPlugin
class IWLAPostAnalysisTopHits(IPlugin):
def __init__(self, iwla):
super(IWLAPostAnalysisTopHits, self).__init__(iwla)
self.API_VERSION = 1
def hook(self):
stats = self.iwla.getCurrentVisists()
month_stats = self.iwla.getMonthStats()
top_hits = month_stats.get('top_hits', {})
for (k, super_hit) in stats.items():
if super_hit['robot']: continue
for r in super_hit['requests']:
if r['is_page']: continue
if not self.iwla.isValidForCurrentAnalysis(r) or\
not self.iwla.hasBeenViewed(r):
continue
uri = r['extract_request']['extract_uri']
uri = "%s%s" % (r.get('server_name', ''), uri)
if not uri in top_hits.keys():
top_hits[uri] = 1
else:
top_hits[uri] += 1
month_stats['top_hits'] = top_hits

Archive Download the corresponding diff file

Branches

Tags