forked from EFForg/badger-sett
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathaudit.py
39 lines (32 loc) · 1.13 KB
/
audit.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
from collections import Counter
import git
import json
import re
def get_old_maps():
repo = git.Repo('./')
old_maps = {}
# load old map data
for c in repo.iter_commits('master'):
if re.match(r'Update seed data: \d+\.\d+\.\d+', c.message):
repo.git.checkout(c.hexsha)
with open('results.json', encoding='utf-8') as f:
js = json.load(f)
if 'version' in js:
old_maps[js['version']] = js
return old_maps
def count_domain_blocks():
old_maps = get_old_maps()
# count number of times each domain has been blocked
ctr = Counter()
for m in old_maps.values():
for domain, data in m['action_map'].items():
if data['heuristicAction'] in ['block', 'cookieblock']:
ctr[domain] += 1
return ctr
# Find domains that are blocked now but have never been blocked before
def count_new_blocks(data):
blocked = [d for d, v in data['action_map'].items()
if v['heuristicAction'] in ['block', 'cookieblock']]
ctr = count_domain_blocks()
new = [d for d in blocked if d not in ctr]
return new