mirror of
https://github.com/ail-project/ail-framework.git
synced 2025-09-05 06:32:41 +00:00
chg: [extractor] add cache + UI extractor + word/set extractor
This commit is contained in:
parent
ab24343b48
commit
0fa27c6a51
8 changed files with 208 additions and 69 deletions
|
@ -64,7 +64,7 @@ class CreditCards(AbstractModule):
|
|||
for card in cards:
|
||||
start, end, value = card
|
||||
if self.get_valid_card(value):
|
||||
extracted.append(card)
|
||||
extracted.append([start, end, value, f'tag:{tag}'])
|
||||
return extracted
|
||||
|
||||
def compute(self, message, r_result=False):
|
||||
|
|
|
@ -69,8 +69,7 @@ class Iban(AbstractModule):
|
|||
start, end, value = iban
|
||||
value = ''.join(e for e in value if e.isalnum())
|
||||
if self.is_valid_iban(value):
|
||||
print(value)
|
||||
extracted.append(iban)
|
||||
extracted.append([start, end, value, f'tag:{tag}'])
|
||||
return extracted
|
||||
|
||||
def compute(self, message):
|
||||
|
|
|
@ -130,7 +130,7 @@ class Mail(AbstractModule):
|
|||
mxdomains[mxdomain].append(mail)
|
||||
for mx in self.check_mx_record(mxdomains.keys()):
|
||||
for row in mxdomains[mx]:
|
||||
extracted.append(row)
|
||||
extracted.append([row[0], row[1], row[2], f'tag:{tag}'])
|
||||
return extracted
|
||||
|
||||
# # TODO: sanitize mails
|
||||
|
|
|
@ -62,7 +62,7 @@ class Onion(AbstractModule):
|
|||
url_unpack = crawlers.unpack_url(value)
|
||||
domain = url_unpack['domain']
|
||||
if crawlers.is_valid_onion_domain(domain):
|
||||
extracted.append(onion)
|
||||
extracted.append([start, end, value, f'tag:{tag}'])
|
||||
return extracted
|
||||
|
||||
def compute(self, message):
|
||||
|
|
|
@ -409,8 +409,12 @@ class Tools(AbstractModule):
|
|||
return TOOLS.keys()
|
||||
|
||||
def extract(self, obj_id, content, tag):
|
||||
extracted = []
|
||||
tool_name = tag.rsplit('"', 2)[1][:-5]
|
||||
return self.regex_finditer(TOOLS[tool_name]['regex'], obj_id, content)
|
||||
tools = self.regex_finditer(TOOLS[tool_name]['regex'], obj_id, content)
|
||||
for tool in tools:
|
||||
extracted.append([tool[0], tool[1], tool[2], f'tag:{tag}'])
|
||||
return extracted
|
||||
|
||||
def compute(self, message):
|
||||
item = Item(message)
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue