mirror of https://github.com/CIRCL/AIL-framework
fix: [module_extractor] don't extract onion from crawled items
parent
f4fca05524
commit
f77c9268bb
|
@ -56,6 +56,9 @@ class Onion(AbstractModule):
|
||||||
|
|
||||||
def extract(self, obj, content, tag):
|
def extract(self, obj, content, tag):
|
||||||
extracted = []
|
extracted = []
|
||||||
|
if self.obj.type == 'item':
|
||||||
|
if 'infoleak:submission="crawler"' in obj.get_tags():
|
||||||
|
return extracted
|
||||||
onions = self.regex_finditer(self.onion_regex, obj.get_global_id(), content)
|
onions = self.regex_finditer(self.onion_regex, obj.get_global_id(), content)
|
||||||
for onion in onions:
|
for onion in onions:
|
||||||
start, end, value = onion
|
start, end, value = onion
|
||||||
|
|
Loading…
Reference in New Issue