-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathutils.py
90 lines (71 loc) · 2.35 KB
/
utils.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
import json
import datetime
import ipaddress
from w3lib.url import canonicalize_url
def normalise_uri(uri):
uri = uri.replace("//", "/")
return canonicalize_url(uri, keep_fragments=True)
def anonymise_ip(ip):
"""Zero out the last bits of an IP address"""
ip = ipaddress.ip_address(ip)
if ip.version == 4:
shift = 8
else:
shift = 80
ip = int(ip) >> shift << shift
return str(ipaddress.ip_address(ip))
class JSONEncoder(json.JSONEncoder):
def default(self, obj):
if isinstance(obj, datetime.datetime):
return obj.isoformat()
return super().default(obj)
DEFAULT_ALPHABET = 'mn6j2c4rv8bpygw95z7hsdaetxuk3fq'
DEFAULT_BLOCK_SIZE = 24
# Author: Michael Fogleman
# License: MIT
# Link: http://code.activestate.com/recipes/576918/
class IntEncoder(object):
def __init__(self, alphabet=DEFAULT_ALPHABET,
block_size=DEFAULT_BLOCK_SIZE,
min_length=4):
self.alphabet = alphabet
self.block_size = block_size
self.min_length = min_length
self.mask = (1 << block_size) - 1
self.mapping = list(range(block_size))
self.mapping.reverse()
def encode_url(self, n):
return self.enbase(self.encode(n))
def decode_url(self, n):
return self.decode(self.debase(n))
def encode(self, n):
return (n & ~self.mask) | self._encode(n & self.mask)
def _encode(self, n):
result = 0
for i, b in enumerate(self.mapping):
if n & (1 << i):
result |= (1 << b)
return result
def decode(self, n):
return (n & ~self.mask) | self._decode(n & self.mask)
def _decode(self, n):
result = 0
for i, b in enumerate(self.mapping):
if n & (1 << b):
result |= (1 << i)
return result
def enbase(self, x):
result = self._enbase(x)
padding = self.alphabet[0] * (self.min_length - len(result))
return '%s%s' % (padding, result)
def _enbase(self, x):
n = len(self.alphabet)
if x < n:
return self.alphabet[x]
return self._enbase(x // n) + self.alphabet[x % n]
def debase(self, x):
n = len(self.alphabet)
result = 0
for i, c in enumerate(reversed(x)):
result += self.alphabet.index(c) * (n ** i)
return result