-
Notifications
You must be signed in to change notification settings - Fork 496
/
Copy pathbase.py
130 lines (104 loc) · 4.13 KB
/
base.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
from abc import ABCMeta
from abc import abstractmethod
from abc import abstractproperty
from detect_secrets.core.potential_secret import PotentialSecret
from detect_secrets.plugins.core.constants import WHITELIST_REGEXES
class BasePlugin(object):
"""This is an abstract class to define Plugins API"""
__metaclass__ = ABCMeta
secret_type = None
def __init__(self, **kwargs):
if not self.secret_type:
raise ValueError('Plugins need to declare a secret_type.')
def analyze(self, file, filename):
"""
:param file: The File object itself.
:param filename: string; filename of File object, used for creating
PotentialSecret objects
:returns dictionary representation of set (for random access by hash)
{ detect_secrets.core.potential_secret.__hash__:
detect_secrets.core.potential_secret }
"""
potential_secrets = {}
for line_num, line in enumerate(file.readlines(), start=1):
if any(regex.search(line) for regex in WHITELIST_REGEXES):
continue
secrets = self.analyze_string(line, line_num, filename)
potential_secrets.update(secrets)
return potential_secrets
@abstractmethod
def analyze_string(self, string, line_num, filename):
"""
:param string: string; the line to analyze
:param line_num: integer; line number that is currently being analyzed
:param filename: string; name of file being analyzed
:returns: dictionary
NOTE: line_num and filename are used for PotentialSecret creation only.
"""
raise NotImplementedError
@abstractmethod
def secret_generator(self, string):
"""Flags secrets in a given string, and yields the raw secret value.
Used in self.analyze_string for PotentialSecret creation.
:type string: str
:param string: the secret to scan
"""
raise NotImplementedError
def adhoc_scan(self, string):
"""To support faster discovery, we want the ability to conveniently
check what different plugins say regarding a single line/secret. This
supports that.
This is very similar to self.analyze_string, but allows the flexibility
for subclasses to add any other notable info (rather than just a
PotentialSecret type). e.g. HighEntropyStrings adds their Shannon
entropy in which they made their decision.
:type string: str
:param string: the string to analyze
:rtype: str
:returns: descriptive string that fits the format
<classname>: <returned-value>
"""
# TODO: Handle multiple secrets on single line.
results = self.analyze_string(string, 0, 'does_not_matter')
if not results:
return 'False'
else:
return 'True'
@property
def __dict__(self):
return {
'name': self.__class__.__name__,
}
class RegexBasedDetector(BasePlugin):
"""Base class for regular-expressed based detectors.
To create a new regex-based detector, subclass this and set
`secret_type` with a description and `blacklist`
with a sequence of regular expressions, like:
class FooDetector(RegexBasedDetector):
secret_type = "foo"
blacklist = (
re.compile(r'foo'),
)
"""
__metaclass__ = ABCMeta
@abstractproperty
def secret_type(self):
raise NotImplementedError
@abstractproperty
def blacklist(self):
raise NotImplementedError
def analyze_string(self, string, line_num, filename):
output = {}
for identifier in self.secret_generator(string):
secret = PotentialSecret(
self.secret_type,
filename,
identifier,
line_num,
)
output[secret] = secret
return output
def secret_generator(self, string):
for regex in self.blacklist:
for match in regex.findall(string):
yield match