mirror of https://github.com/CIRCL/AIL-framework
chg: [tools] add reprocess title + CEDetector
parent
1112615ec3
commit
3f78457dff
|
@ -341,6 +341,8 @@ def obj_iterator(obj_type, filters):
|
||||||
return Pgps.get_all_pgps_objects(filters=filters)
|
return Pgps.get_all_pgps_objects(filters=filters)
|
||||||
elif obj_type == 'message':
|
elif obj_type == 'message':
|
||||||
return chats_viewer.get_messages_iterator(filters=filters)
|
return chats_viewer.get_messages_iterator(filters=filters)
|
||||||
|
elif obj_type == 'title':
|
||||||
|
return Titles.Titles().get_iterator()
|
||||||
|
|
||||||
|
|
||||||
def card_objs_iterators(filters):
|
def card_objs_iterators(filters):
|
||||||
|
|
|
@ -111,17 +111,28 @@ def test_detection():
|
||||||
if not is_detected:
|
if not is_detected:
|
||||||
not_detected.add(domain)
|
not_detected.add(domain)
|
||||||
|
|
||||||
print()
|
|
||||||
print()
|
|
||||||
print()
|
|
||||||
print()
|
|
||||||
for domain in not_detected:
|
for domain in not_detected:
|
||||||
dom = Domain(domain)
|
dom = Domain(domain)
|
||||||
print('-----------', domain)
|
# print('-----------', domain)
|
||||||
for h in dom.get_correlation('title').get('title', []):
|
for h in dom.get_correlation('title').get('title', []):
|
||||||
print(Title(h[1:]).get_content().lower())
|
c = Title(h[1:]).get_content().lower()
|
||||||
print()
|
if c == '404 not found':
|
||||||
print()
|
lt = []
|
||||||
|
dom = Domain(domain)
|
||||||
|
print('-----------', domain)
|
||||||
|
for hi in dom.get_correlation('title').get('title', []):
|
||||||
|
print(Title(hi[1:]).get_content().lower())
|
||||||
|
ci = Title(hi[1:]).get_content().lower()
|
||||||
|
if ci != '404 not found' and ci not in []:
|
||||||
|
lt.append(ci)
|
||||||
|
if lt:
|
||||||
|
print('-----------', domain)
|
||||||
|
for ti in lt:
|
||||||
|
print(ti)
|
||||||
|
print()
|
||||||
|
print()
|
||||||
|
|
||||||
|
# Tag.delete_object_tag(tag, 'domain', domain)
|
||||||
|
|
||||||
|
|
||||||
if __name__ == "__main__":
|
if __name__ == "__main__":
|
||||||
|
|
|
@ -29,11 +29,13 @@ from lib.objects import ail_objects
|
||||||
# from modules.Onion import Onion
|
# from modules.Onion import Onion
|
||||||
# from modules.Telegram import Telegram
|
# from modules.Telegram import Telegram
|
||||||
|
|
||||||
|
from modules.CEDetector import CEDetector
|
||||||
from modules.Languages import Languages
|
from modules.Languages import Languages
|
||||||
from modules.OcrExtractor import OcrExtractor
|
from modules.OcrExtractor import OcrExtractor
|
||||||
from modules.QrCodeReader import QrCodeReader
|
from modules.QrCodeReader import QrCodeReader
|
||||||
|
|
||||||
MODULES = {
|
MODULES = {
|
||||||
|
'CEDetector': CEDetector,
|
||||||
'Languages': Languages,
|
'Languages': Languages,
|
||||||
'OcrExtractor': OcrExtractor,
|
'OcrExtractor': OcrExtractor,
|
||||||
'QrCodeReader': QrCodeReader
|
'QrCodeReader': QrCodeReader
|
||||||
|
@ -70,7 +72,7 @@ if __name__ == "__main__":
|
||||||
obj_type = args.type
|
obj_type = args.type
|
||||||
if not is_object_type(obj_type):
|
if not is_object_type(obj_type):
|
||||||
raise Exception(f'Invalid Object Type: {obj_type}')
|
raise Exception(f'Invalid Object Type: {obj_type}')
|
||||||
if obj_type not in ['image', 'item', 'message', 'screenshot']:
|
if obj_type not in ['image', 'item', 'message', 'screenshot', 'title']:
|
||||||
raise Exception(f'Currently not supported Object Type: {obj_type}')
|
raise Exception(f'Currently not supported Object Type: {obj_type}')
|
||||||
|
|
||||||
modulename = args.module
|
modulename = args.module
|
||||||
|
|
Loading…
Reference in New Issue