fix: [module] fix module obj type: language + mail

This commit is contained in:
terrtia 2023-10-11 14:53:12 +02:00
parent 623ba455ff
commit 6978764b02
No known key found for this signature in database
GPG key ID: 1E1B1F50D84613D0
2 changed files with 10 additions and 8 deletions

View file

@ -25,7 +25,9 @@ class Languages(AbstractModule):
self.logger.info(f'Module {self.module_name} initialized') self.logger.info(f'Module {self.module_name} initialized')
def compute(self, message): def compute(self, message):
item = self.get_obj() obj = self.get_obj()
if obj.type == 'item':
if item.is_crawled(): if item.is_crawled():
domain = Domain(item.get_domain()) domain = Domain(item.get_domain())
for lang in item.get_languages(min_probability=0.8): for lang in item.get_languages(min_probability=0.8):

View file

@ -139,7 +139,7 @@ class Mail(AbstractModule):
item = self.get_obj() item = self.get_obj()
item_date = item.get_date() item_date = item.get_date()
mails = self.regex_findall(self.email_regex, item_id, item.get_content()) mails = self.regex_findall(self.email_regex, item.id, item.get_content())
mxdomains_email = {} mxdomains_email = {}
for mail in mails: for mail in mails:
mxdomain = mail.rsplit('@', 1)[1].lower() mxdomain = mail.rsplit('@', 1)[1].lower()
@ -172,9 +172,9 @@ class Mail(AbstractModule):
# for tld in mx_tlds: # for tld in mx_tlds:
# Statistics.add_module_tld_stats_by_date('mail', item_date, tld, mx_tlds[tld]) # Statistics.add_module_tld_stats_by_date('mail', item_date, tld, mx_tlds[tld])
msg = f'Mails;{item.get_source()};{item_date};{item.get_basename()};Checked {num_valid_email} e-mail(s);{item_id}' msg = f'Mails;{item.get_source()};{item_date};{item.get_basename()};Checked {num_valid_email} e-mail(s);{item.id}'
if num_valid_email > self.mail_threshold: if num_valid_email > self.mail_threshold:
print(f'{item_id} Checked {num_valid_email} e-mail(s)') print(f'{item.id} Checked {num_valid_email} e-mail(s)')
self.redis_logger.warning(msg) self.redis_logger.warning(msg)
# Tags # Tags
tag = 'infoleak:automatic-detection="mail"' tag = 'infoleak:automatic-detection="mail"'