Commit
This commit is contained in:
19
plugins/pre_analysis/H002_soutade.py
Normal file
19
plugins/pre_analysis/H002_soutade.py
Normal file
@@ -0,0 +1,19 @@
|
||||
import re
|
||||
|
||||
# Matches request URIs that end in "/logo/" (the indefero logo, per the
# original note on this plugin).  ".+" requires at least one character in
# front of "/logo/", so a bare "/logo/" URI is not matched.
logo_re = re.compile(r'^.+/logo/$')


def hook(hits):
    """Reclassify logo requests from viewed pages to plain hits.

    For every entry of ``hits`` that is not flagged as a robot, each page
    still marked ``is_page`` whose ``extract_request['extract_uri']``
    matches ``logo_re`` is demoted: its ``is_page`` flag is cleared and the
    entry's ``viewed_pages`` / ``viewed_hits`` counters are adjusted by one
    so their sum stays the same.

    Args:
        hits: mapping whose values are dicts providing the keys ``robot``,
            ``pages``, ``viewed_pages`` and ``viewed_hits``.  Each element
            of ``pages`` is a dict with ``is_page`` and a nested
            ``extract_request['extract_uri']`` string.

    Returns:
        None.  ``hits`` is modified in place.

    Raises:
        KeyError: if one of the keys listed above is missing.
    """
    # Only the values are needed; the mapping keys are never used.
    for super_hit in hits.values():
        # Entries already classified as robots are left untouched.
        if super_hit['robot']:
            continue

        for page in super_hit['pages']:
            # Requests that are not counted as pages need no correction.
            if not page['is_page']:
                continue
            if logo_re.match(page['extract_request']['extract_uri']):
                page['is_page'] = False
                # Move one unit from the page counter to the hit counter.
                super_hit['viewed_pages'] -= 1
                super_hit['viewed_hits'] += 1
|
||||
Reference in New Issue
Block a user