mirror of https://github.com/CIRCL/AIL-framework
				
				
				
			fix: [module] fix module obj type: language + mail
							parent
							
								
									623ba455ff
								
							
						
					
					
						commit
						6978764b02
					
				|  | @ -25,11 +25,13 @@ class Languages(AbstractModule): | |||
|         self.logger.info(f'Module {self.module_name} initialized') | ||||
| 
 | ||||
|     def compute(self, message): | ||||
|         item = self.get_obj() | ||||
|         if item.is_crawled(): | ||||
|             domain = Domain(item.get_domain()) | ||||
|             for lang in item.get_languages(min_probability=0.8): | ||||
|                 domain.add_language(lang.language) | ||||
|         obj = self.get_obj() | ||||
|          | ||||
|         if obj.type == 'item': | ||||
|             if item.is_crawled(): | ||||
|                 domain = Domain(item.get_domain()) | ||||
|                 for lang in item.get_languages(min_probability=0.8): | ||||
|                     domain.add_language(lang.language) | ||||
| 
 | ||||
| 
 | ||||
| if __name__ == '__main__': | ||||
|  |  | |||
|  | @ -139,7 +139,7 @@ class Mail(AbstractModule): | |||
|         item = self.get_obj() | ||||
|         item_date = item.get_date() | ||||
| 
 | ||||
|         mails = self.regex_findall(self.email_regex, item_id, item.get_content()) | ||||
|         mails = self.regex_findall(self.email_regex, item.id, item.get_content()) | ||||
|         mxdomains_email = {} | ||||
|         for mail in mails: | ||||
|             mxdomain = mail.rsplit('@', 1)[1].lower() | ||||
|  | @ -172,9 +172,9 @@ class Mail(AbstractModule): | |||
|         # for tld in mx_tlds: | ||||
|         #     Statistics.add_module_tld_stats_by_date('mail', item_date, tld, mx_tlds[tld]) | ||||
| 
 | ||||
|         msg = f'Mails;{item.get_source()};{item_date};{item.get_basename()};Checked {num_valid_email} e-mail(s);{item_id}' | ||||
|         msg = f'Mails;{item.get_source()};{item_date};{item.get_basename()};Checked {num_valid_email} e-mail(s);{item.id}' | ||||
|         if num_valid_email > self.mail_threshold: | ||||
|             print(f'{item_id}    Checked {num_valid_email} e-mail(s)') | ||||
|             print(f'{item.id}    Checked {num_valid_email} e-mail(s)') | ||||
|             self.redis_logger.warning(msg) | ||||
|             # Tags | ||||
|             tag = 'infoleak:automatic-detection="mail"' | ||||
|  |  | |||
		Loading…
	
		Reference in New Issue
	
	 terrtia
						terrtia