mirror of https://github.com/CIRCL/AIL-framework
fix: [module_extractor] don't extract onion from crawled items
parent
f4fca05524
commit
f77c9268bb
|
@ -56,6 +56,9 @@ class Onion(AbstractModule):
|
|||
|
||||
def extract(self, obj, content, tag):
|
||||
extracted = []
|
||||
if self.obj.type == 'item':
|
||||
if 'infoleak:submission="crawler"' in obj.get_tags():
|
||||
return extracted
|
||||
onions = self.regex_finditer(self.onion_regex, obj.get_global_id(), content)
|
||||
for onion in onions:
|
||||
start, end, value = onion
|
||||
|
|
Loading…
Reference in New Issue