2022-09-20 16:11:48 +02:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
# -*-coding:UTF-8 -*
|
|
|
|
|
|
|
|
import os
|
|
|
|
import sys
|
|
|
|
|
|
|
|
sys.path.append(os.environ['AIL_BIN'])
|
|
|
|
##################################
|
|
|
|
# Import Project packages
|
|
|
|
##################################
|
|
|
|
from modules.abstract_module import AbstractModule
|
|
|
|
from lib.objects.Domains import Domain
|
|
|
|
from lib.objects.Items import Item
|
2022-10-25 16:25:19 +02:00
|
|
|
# from lib.ConfigLoader import ConfigLoader
|
2022-09-20 16:11:48 +02:00
|
|
|
|
|
|
|
class Languages(AbstractModule):
    """
    Languages module for AIL framework

    For each crawled item handled by the module, look up the item's
    languages and record every one of them on the item's domain.
    """

    def __init__(self):
        super().__init__()

        # Report in the logs that the module finished its setup
        self.logger.info(f'Module {self.module_name} initialized')

    def compute(self, message):
        """
        Register the languages of the current object on its domain.

        The object is obtained through ``self.get_obj()``; ``message`` is
        accepted as part of the ``compute`` signature but is not read here.
        Objects whose type is not ``'item'``, and items that are not
        crawled, are left untouched.

        :param message: queue message handed to the module (unused here)
        :return: None
        """
        obj = self.get_obj()

        # Guard clauses: only crawled items carry a domain to update
        if obj.type != 'item':
            return
        if not obj.is_crawled():
            return

        domain = Domain(obj.get_domain())
        # Only languages reported with min_probability=0.8 are requested;
        # force_gcld3=True is forwarded as-is to the item's detector
        detected_languages = obj.get_languages(min_probability=0.8, force_gcld3=True)
        for language in detected_languages:
            print(language)
            domain.add_language(language)
|
2022-09-20 16:11:48 +02:00
|
|
|
|
2022-10-25 16:25:19 +02:00
|
|
|
|
2022-09-20 16:11:48 +02:00
|
|
|
if __name__ == '__main__':
    # Script entry point: build the Languages module and start its run loop
    Languages().run()
|