ail-framework/bin/lib/ail_core.py

#!/usr/bin/env python3
# -*-coding:UTF-8 -*

import os
import sys
import uuid

sys.path.append(os.environ['AIL_BIN'])
##################################
# Import Project packages
##################################
from lib.ConfigLoader import ConfigLoader

# Open the two DB connections used by this module at import time.
config_loader = ConfigLoader()
# General DB: this module reads/writes the 'ail:uuid' key through it.
r_serv_db = config_loader.get_db_conn("Kvrocks_DB")
# Objects DB: this module reads the 'all_*:subtypes' sets through it.
r_object = config_loader.get_db_conn("Kvrocks_Objects")
# Drop the reference to the loader once the connections are created.
config_loader = None

# Every object type name known to this module, as an alphabetically sorted list
# (sorted() turns the set literal into a list).
AIL_OBJECTS = sorted({'chat', 'chat-subchannel', 'chat-thread', 'cookie-name', 'cve', 'cryptocurrency', 'decoded',
                      'domain', 'etag', 'favicon', 'file-name', 'hhhash','item', 'image', 'message', 'ocr', 'pgp',
                      'qrcode', 'screenshot', 'title', 'user-account', 'username'})

# Object types declared as having subtypes (kept as a set).
# NOTE(review): 'chat-thread' is not listed here although get_object_all_subtypes()
# has a branch for it - confirm whether that is intentional.
AIL_OBJECTS_WITH_SUBTYPES = {'chat', 'chat-subchannel', 'cryptocurrency', 'pgp', 'username', 'user-account'}

# TODO by object TYPE ????
# Sorted list of default correlation object types: the same names as AIL_OBJECTS
# minus 'cookie-name', 'etag' and 'hhhash'.
AIL_OBJECTS_CORRELATIONS_DEFAULT = sorted({'chat', 'chat-subchannel', 'chat-thread', 'cve', 'cryptocurrency', 'decoded',
                                           'domain', 'favicon', 'file-name', 'item', 'image', 'message', 'ocr', 'pgp',
                                           'qrcode', 'screenshot', 'title', 'user-account', 'username'})

def get_ail_uuid():
    """Return the value stored under 'ail:uuid', creating it on first use.

    When the key is missing (or holds an empty value) a new UUID is generated
    and stored through _set_ail_uuid(), and that new value is returned.
    """
    stored_uuid = r_serv_db.get('ail:uuid')
    if stored_uuid:
        return stored_uuid
    # Nothing stored yet: generate and persist a new UUID
    return _set_ail_uuid()

def _set_ail_uuid():
    """Generate a new UUID string, store it under 'ail:uuid' and return it.

    Any value previously stored under that key is overwritten.
    """
    new_uuid = generate_uuid()
    r_serv_db.set('ail:uuid', new_uuid)
    return new_uuid

def get_ail_uuid_int():
    """Return the stored 'ail:uuid' value as an integer.

    The dashes are stripped from the stored string and the remaining hex
    digits are parsed as a version 4 UUID; its integer form is returned.
    """
    hex_digits = get_ail_uuid().replace('-', '')
    instance_uuid = uuid.UUID(hex=hex_digits, version=4)
    return instance_uuid.int

def is_valid_uuid_v4(header_uuid):
    """Return True if header_uuid is a lowercase version 4 UUID string.

    Dashes are ignored. The value is parsed with version=4 forced, then the
    resulting hex digits are compared with the input: any input whose
    version/variant bits are not those of a v4 UUID no longer matches and is
    rejected. The comparison is case-sensitive and UUID.hex is lowercase, so
    uppercase input is rejected as well.

    :param header_uuid: candidate UUID string, with or without dashes
    :return: True when the value is a valid v4 UUID, False otherwise
             (including for non-string input)
    """
    try:
        header_uuid = header_uuid.replace('-', '')
        uuid_test = uuid.UUID(hex=header_uuid, version=4)
    # AttributeError/TypeError: input is not a str; ValueError: not 32 hex digits.
    # Deliberately not a bare except, so KeyboardInterrupt/SystemExit propagate.
    except (AttributeError, TypeError, ValueError):
        return False
    return uuid_test.hex == header_uuid

def generate_uuid():
    """Return a newly generated uuid4 as its string representation."""
    return str(uuid.uuid4())

#### AIL OBJECTS ####

def get_all_objects():
    """Return AIL_OBJECTS, the module-level list of object type names.

    The list object itself is returned, not a copy.
    """
    return AIL_OBJECTS

def is_object_type(obj_type):
    """Return True if obj_type is one of the names in AIL_OBJECTS."""
    return obj_type in AIL_OBJECTS

def get_objects_with_subtypes():
    """Return AIL_OBJECTS_WITH_SUBTYPES, the module-level set of object types with subtypes.

    The set object itself is returned, not a copy.
    """
    return AIL_OBJECTS_WITH_SUBTYPES

def get_object_all_subtypes(obj_type):  # TODO Dynamic subtype
    """Return the subtypes available for an object type.

    'chat', 'chat-subchannel', 'chat-thread' and 'user-account' are read from
    the objects DB with smembers ('user-account' reads the same key as
    'chat'). 'cryptocurrency', 'pgp' and 'username' use fixed lists.
    Any other object type returns an empty list.
    """
    # Subtypes stored in the objects DB
    if obj_type == 'chat' or obj_type == 'user-account':
        return r_object.smembers('all_chat:subtypes')
    elif obj_type == 'chat-subchannel':
        return r_object.smembers('all_chat-subchannel:subtypes')
    elif obj_type == 'chat-thread':
        return r_object.smembers('all_chat-thread:subtypes')
    # Fixed subtypes
    elif obj_type == 'cryptocurrency':
        return ['bitcoin', 'bitcoin-cash', 'dash', 'ethereum', 'litecoin', 'monero', 'tron', 'zcash']
    elif obj_type == 'pgp':
        return ['key', 'mail', 'name']
    elif obj_type == 'username':
        return ['telegram', 'twitter', 'jabber']
    else:
        # Object type without subtype
        return []

def get_default_correlation_objects():
    """Return AIL_OBJECTS_CORRELATIONS_DEFAULT, the module-level list of default correlation object types.

    The list object itself is returned, not a copy.
    """
    return AIL_OBJECTS_CORRELATIONS_DEFAULT

def get_obj_queued():
    """Return a new list with the hard-coded object types 'item', 'image', 'message', 'ocr' and 'qrcode'.

    NOTE(review): presumably the object types that can be queued - confirm with callers.
    """
    return ['item', 'image', 'message', 'ocr', 'qrcode'] # screenshot ???

def get_objects_tracked():
    """Return a new list with the hard-coded object types 'decoded', 'item', 'pgp', 'message', 'ocr', 'qrcode' and 'title'.

    NOTE(review): presumably the object types supported by trackers - confirm with callers.
    """
    return ['decoded', 'item', 'pgp', 'message', 'ocr', 'qrcode', 'title']

def get_objects_retro_hunted():
    """Return a new list with the hard-coded object types 'decoded', 'item' and 'message'.

    NOTE(review): presumably the object types supported by retro hunts - confirm with callers.
    """
    return ['decoded', 'item', 'message']

def get_all_objects_with_subtypes_tuple():
    """Return a list of (object type, subtype) tuples covering every object type.

    An object type with subtypes contributes one tuple per subtype; an object
    type without any subtype contributes a single (object type, '') tuple.
    """
    type_subtype_pairs = []
    for obj_type in get_all_objects():
        subtypes = get_object_all_subtypes(obj_type)
        if not subtypes:
            # No subtype: use an empty string as placeholder
            type_subtype_pairs.append((obj_type, ''))
            continue
        type_subtype_pairs.extend((obj_type, subtype) for subtype in subtypes)
    return type_subtype_pairs

def unpack_obj_global_id(global_id, r_type='tuple'):
    """Split a 'type:subtype:id' global ID into its three parts.

    Only the first two ':' are used as separators, so the id part may itself
    contain ':'.

    :param global_id: string formatted as 'type:subtype:id'
    :param r_type: 'dict' to get {'type', 'subtype', 'id'}; any other value
                   returns the list produced by the split
    :raises IndexError: in 'dict' mode when fewer than three parts are found
    """
    parts = global_id.split(':', 2)    # TODO REPLACE get_obj_type_subtype_id_from_global_id(global_id)
    if r_type != 'dict':
        # [type, subtype, id] - a list, shorter if separators are missing
        return parts
    return {'type': parts[0], 'subtype': parts[1], 'id': parts[2]}

def unpack_objs_global_id(objs_global_id, r_type='tuple'):
    """Unpack every global ID of an iterable with unpack_obj_global_id().

    :param objs_global_id: iterable of 'type:subtype:id' strings
    :param r_type: forwarded unchanged to unpack_obj_global_id()
    :return: list of unpacked objects, in iteration order
    """
    return [unpack_obj_global_id(global_id, r_type=r_type) for global_id in objs_global_id]

def unpack_correl_obj__id(obj_type, global_id, r_type='tuple'):
    """Split a 'subtype:id' string and combine it with the given object type.

    Only the first ':' is used as separator, so the id part may contain ':'.

    :param obj_type: object type to put in the result
    :param global_id: string formatted as 'subtype:id'
    :param r_type: 'dict' to get {'type', 'subtype', 'id'}; any other value
                   returns the tuple (type, subtype, id)
    :raises IndexError: when global_id contains no ':'
    """
    parts = global_id.split(':', 1)
    subtype = parts[0]
    obj_id = parts[1]
    if r_type == 'dict':
        return {'type': obj_type, 'subtype': subtype, 'id': obj_id}
    return obj_type, subtype, obj_id

def unpack_correl_objs_id(obj_type, correl_objs_id, r_type='tuple'):
    """Unpack every 'subtype:id' string of an iterable with unpack_correl_obj__id().

    :param obj_type: object type shared by all the IDs
    :param correl_objs_id: iterable of 'subtype:id' strings
    :param r_type: forwarded unchanged to unpack_correl_obj__id()
    :return: list of unpacked objects, in iteration order
    """
    return [unpack_correl_obj__id(obj_type, correl_obj_id, r_type=r_type)
            for correl_obj_id in correl_objs_id]

##-- AIL OBJECTS --##

####    Redis     ####

def _parse_zscan(response):
    """Convert a zscan reply (cursor, elements) into (cursor as str, list of elements)."""
    next_cursor, elements = response
    return str(next_cursor), list(elements)

def zscan_iter(r_redis, name):  # count ???
    """Yield every element returned by successive zscan calls on a key.

    The first call uses cursor 0; scanning stops once the returned cursor,
    converted to a string, equals "0".

    :param r_redis: connection object exposing zscan(name, cursor=...)
    :param name: key to scan
    """
    cursor = 0
    while True:
        cursor, data = _parse_zscan(r_redis.zscan(name, cursor=cursor))
        yield from data
        # The cursor is a str from here on: "0" marks the end of the scan
        if cursor == "0":
            break

## --    Redis     -- ##

def rreplace(s, old, new, occurrence):
    """Replace occurrences of a substring, starting from the end of the string.

    :param s: string to process
    :param old: substring to replace
    :param new: replacement string
    :param occurrence: maximum number of replacements, counted from the right
                       (passed as maxsplit to str.rsplit)
    :return: the resulting string
    """
    return new.join(s.rsplit(old, occurrence))

def paginate_iterator(iter_elems, nb_obj=50, page=1):
    """Return one page of a sized collection together with pagination metadata.

    :param iter_elems: collection to paginate; it must support len() and
                       iteration (e.g. a list or a set)
    :param nb_obj: maximum number of elements per page (positive integer)
    :param page: 1-based page number. Values below 1 select the first page and
                 values past the end select the last page
    :return: dict with the keys
             'nb_all_elem': total number of elements,
             'list_elem': elements of the selected page,
             'page': page number actually used (0 when the collection is empty),
             'nb_pages': total number of pages,
             'nb_first_elem': 1-based position of the first element of the page,
             'nb_last_elem': 1-based position of the last element of the page
    :raises ZeroDivisionError: when nb_obj is 0
    """
    from itertools import islice

    nb_all_elem = len(iter_elems)
    dict_page = {'nb_all_elem': nb_all_elem}
    # Ceiling division, done on integers to avoid float rounding
    nb_pages = -(-nb_all_elem // nb_obj)

    # Clamp the requested page to [1, nb_pages]; a negative or zero page would
    # otherwise produce a negative slice start and an empty page.
    # An empty collection has 0 pages, so page ends up at 0 in that case.
    if page < 1:
        page = 1
    if page > nb_pages:
        page = nb_pages

    # multiple pages
    if nb_pages > 1:
        start = nb_obj * (page - 1)
        # The last page may hold fewer than nb_obj elements
        stop = min(nb_obj * page, nb_all_elem)
        # islice works on any iterable, including sets that cannot be sliced
        dict_page['list_elem'] = list(islice(iter_elems, start, stop))
    else:
        start = 0
        stop = nb_all_elem
        dict_page['list_elem'] = list(iter_elems)
    dict_page['page'] = page
    dict_page['nb_pages'] = nb_pages
    # UI
    dict_page['nb_first_elem'] = start + 1
    dict_page['nb_last_elem'] = stop
    return dict_page
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00			`#!/usr/bin/env python3`
			`# --coding:UTF-8 -`

			`import os`
			`import sys`
chg: [api] refactor blueprint 2024-02-26 14:35:48 +00:00			`import uuid`
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00
			`sys.path.append(os.environ['AIL_BIN'])`
			`##################################`
			`# Import Project packages`
			`##################################`
			`from lib.ConfigLoader import ConfigLoader`

			`config_loader = ConfigLoader()`
chg: [MISP export + redis] refactor MISP, export all relationships between objects, relationships between investigated objects + bump redis-py version + theHive export 2023-01-16 15:27:49 +00:00			`r_serv_db = config_loader.get_db_conn("Kvrocks_DB")`
chg: [chats] add chats explorer v0 2023-11-02 15:28:33 +00:00			`r_object = config_loader.get_db_conn("Kvrocks_Objects")`
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00			`config_loader = None`

chg: [chats] add messages threads 2023-11-29 15:28:25 +00:00			`AIL_OBJECTS = sorted({'chat', 'chat-subchannel', 'chat-thread', 'cookie-name', 'cve', 'cryptocurrency', 'decoded',`
chg: [qrcode] extract qrcode content from images and screenshots + qrcode object + correlation 2024-10-01 13:12:15 +00:00			`'domain', 'etag', 'favicon', 'file-name', 'hhhash','item', 'image', 'message', 'ocr', 'pgp',`
			`'qrcode', 'screenshot', 'title', 'user-account', 'username'})`
chg: [tags] refactor tags + cleanup 2022-11-22 09:47:15 +00:00
chg: [api] get object + get investigation 2024-02-29 13:56:45 +00:00			`AIL_OBJECTS_WITH_SUBTYPES = {'chat', 'chat-subchannel', 'cryptocurrency', 'pgp', 'username', 'user-account'}`

chg: [correlation] description: get message content + don't show etag, cookie_name and hhash by default 2024-03-11 14:33:30 +00:00			`# TODO by object TYPE ????`
			`AIL_OBJECTS_CORRELATIONS_DEFAULT = sorted({'chat', 'chat-subchannel', 'chat-thread', 'cve', 'cryptocurrency', 'decoded',`
chg: [qrcode] extract qrcode content from images and screenshots + qrcode object + correlation 2024-10-01 13:12:15 +00:00			`'domain', 'favicon', 'file-name', 'item', 'image', 'message', 'ocr', 'pgp',`
			`'qrcode', 'screenshot', 'title', 'user-account', 'username'})`
chg: [correlation] description: get message content + don't show etag, cookie_name and hhash by default 2024-03-11 14:33:30 +00:00
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00			`def get_ail_uuid():`
fix: [core] fix instance ail:uuid 2023-05-15 08:37:03 +00:00			`ail_uuid = r_serv_db.get('ail:uuid')`
			`if not ail_uuid:`
			`ail_uuid = _set_ail_uuid()`
			`return ail_uuid`

			`def _set_ail_uuid():`
			`ail_uuid = generate_uuid()`
			`r_serv_db.set('ail:uuid', ail_uuid)`
			`return ail_uuid`
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00
chg: [flask] use the same cookie name + cache git commits, tags and branch name 2024-09-16 13:30:12 +00:00			`def get_ail_uuid_int():`
			`ail_uuid = get_ail_uuid()`
			`header_uuid = ail_uuid.replace('-', '')`
			`return uuid.UUID(hex=header_uuid, version=4).int`

chg: [api] refactor blueprint 2024-02-26 14:35:48 +00:00			`def is_valid_uuid_v4(header_uuid):`
			`try:`
			`header_uuid = header_uuid.replace('-', '')`
			`uuid_test = uuid.UUID(hex=header_uuid, version=4)`
			`return uuid_test.hex == header_uuid`
			`except:`
			`return False`

chg: [DB] remove ARDB + temp disable MISP import and auto export 2023-04-04 08:25:01 +00:00			`def generate_uuid():`
chg: [api] refactor blueprint 2024-02-26 14:35:48 +00:00			`return str(uuid.uuid4())`
chg: [DB] remove ARDB + temp disable MISP import and auto export 2023-04-04 08:25:01 +00:00
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00			`#### AIL OBJECTS ####`

			`def get_all_objects():`
chg: [tags] refactor tags + cleanup 2022-11-22 09:47:15 +00:00			`return AIL_OBJECTS`
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00
chg: [tools] reprocess objects by type 2024-03-13 13:04:23 +00:00			`def is_object_type(obj_type):`
			`return obj_type in AIL_OBJECTS`

chg: [subtype objects] migrate UI cryptocurrency, pgp, username 2023-02-28 10:01:27 +00:00			`def get_objects_with_subtypes():`
chg: [api] get object + get investigation 2024-02-29 13:56:45 +00:00			`return AIL_OBJECTS_WITH_SUBTYPES`
chg: [subtype objects] migrate UI cryptocurrency, pgp, username 2023-02-28 10:01:27 +00:00
chg: [chats] add chats explorer v0 2023-11-02 15:28:33 +00:00			`def get_object_all_subtypes(obj_type): # TODO Dynamic subtype`
chg: [core] add telegram importer + Chat object + message Object + add timeline engine 2023-08-18 09:05:21 +00:00			`if obj_type == 'chat':`
chg: [chats] add chats explorer v0 2023-11-02 15:28:33 +00:00			`return r_object.smembers(f'all_chat:subtypes')`
			`if obj_type == 'chat-subchannel':`
			`return r_object.smembers(f'all_chat-subchannel:subtypes')`
chg: [api] get chat/subchannel/thread messages 2024-02-29 15:18:22 +00:00			`if obj_type == 'chat-thread':`
			`return r_object.smembers(f'all_chat-thread:subtypes')`
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00			`if obj_type == 'cryptocurrency':`
chg: [tron] add TRON crytocurrency detection + correlation. Thanks @pventuzelo for the contribution 2024-05-08 13:14:51 +00:00			`return ['bitcoin', 'bitcoin-cash', 'dash', 'ethereum', 'litecoin', 'monero', 'tron', 'zcash']`
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00			`if obj_type == 'pgp':`
			`return ['key', 'mail', 'name']`
			`if obj_type == 'username':`
			`return ['telegram', 'twitter', 'jabber']`
chg: [chats] add chats participants + user-accounts basic template 2023-12-06 15:26:26 +00:00			`if obj_type == 'user-account':`
			`return r_object.smembers(f'all_chat:subtypes')`
fix: [tags] fix delete subtype tags 2023-04-06 14:26:56 +00:00			`return []`
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00
chg: [correlation] description: get message content + don't show etag, cookie_name and hhash by default 2024-03-11 14:33:30 +00:00			`def get_default_correlation_objects():`
			`return AIL_OBJECTS_CORRELATIONS_DEFAULT`

chg: [queues] timeout obj after 2 days 2024-01-08 12:50:56 +00:00			`def get_obj_queued():`
fix: [crawler] filter lookup parent + domain daterange 2024-10-07 09:03:56 +00:00			`return ['item', 'image', 'message', 'ocr', 'qrcode'] # screenshot ???`
chg: [queues] timeout obj after 2 days 2024-01-08 12:50:56 +00:00
chg: [trackers] refactor trackers: track objects + filter by object types/sources/subtypes 2023-05-04 14:35:56 +00:00			`def get_objects_tracked():`
chg: [qrcode] extract qrcode content from images and screenshots + qrcode object + correlation 2024-10-01 13:12:15 +00:00			`return ['decoded', 'item', 'pgp', 'message', 'ocr', 'qrcode', 'title']`
chg: [trackers] refactor trackers: track objects + filter by object types/sources/subtypes 2023-05-04 14:35:56 +00:00
chg: [objects + retro hunt] refactor retro hunt + objects retro hunts + get objects generator by filters (date_from, sources, mimetypes, ...) 2023-05-10 14:26:46 +00:00			`def get_objects_retro_hunted():`
fix: [tracker] fix message trackers 2024-02-15 15:22:00 +00:00			`return ['decoded', 'item', 'message']`
chg: [objects + retro hunt] refactor retro hunt + objects retro hunts + get objects generator by filters (date_from, sources, mimetypes, ...) 2023-05-10 14:26:46 +00:00
chg: [MISP export + redis] refactor MISP, export all relationships between objects, relationships between investigated objects + bump redis-py version + theHive export 2023-01-16 15:27:49 +00:00			`def get_all_objects_with_subtypes_tuple():`
			`str_objs = []`
			`for obj_type in get_all_objects():`
			`subtypes = get_object_all_subtypes(obj_type)`
			`if subtypes:`
			`for subtype in subtypes:`
			`str_objs.append((obj_type, subtype))`
			`else:`
			`str_objs.append((obj_type, ''))`
			`return str_objs`

chg: [core] add telegram importer + Chat object + message Object + add timeline engine 2023-08-18 09:05:21 +00:00			`def unpack_obj_global_id(global_id, r_type='tuple'):`
			`if r_type == 'dict':`
			`obj = global_id.split(':', 2)`
chg: [chats] add chats participants + user-accounts basic template 2023-12-06 15:26:26 +00:00			`return {'type': obj[0], 'subtype': obj[1], 'id': obj[2]}`
chg: [core] add telegram importer + Chat object + message Object + add timeline engine 2023-08-18 09:05:21 +00:00			`else: # tuple(type, subtype, id)`
chg: [ocr] extract text from image + add ocr object 2024-04-08 15:16:07 +00:00			`return global_id.split(':', 2) # TODO REPLACE get_obj_type_subtype_id_from_global_id(global_id)`
chg: [core] add telegram importer + Chat object + message Object + add timeline engine 2023-08-18 09:05:21 +00:00
chg: [chats] add chats participants + user-accounts basic template 2023-12-06 15:26:26 +00:00			`def unpack_objs_global_id(objs_global_id, r_type='tuple'):`
			`objs = []`
			`for global_id in objs_global_id:`
			`objs.append(unpack_obj_global_id(global_id, r_type=r_type))`
			`return objs`

			`def unpack_correl_obj__id(obj_type, global_id, r_type='tuple'):`
			`obj = global_id.split(':', 1)`
			`if r_type == 'dict':`
			`return {'type': obj_type, 'subtype': obj[0], 'id': obj[1]}`
			`else: # tuple(type, subtype, id)`
			`return obj_type, obj[0], obj[1]`

			`def unpack_correl_objs_id(obj_type, correl_objs_id, r_type='tuple'):`
			`objs = []`
			`for correl_obj_id in correl_objs_id:`
			`objs.append(unpack_correl_obj__id(obj_type, correl_obj_id, r_type=r_type))`
			`return objs`
chg: [core] add telegram importer + Chat object + message Object + add timeline engine 2023-08-18 09:05:21 +00:00
chg: [Kvrocks migration] rewrite obj tags + migration 2022-09-01 12:04:00 +00:00			`##-- AIL OBJECTS --##`
chg: [all] remove old objects + migrate cryptocurrencies module + cleanup code 2022-11-28 14:01:40 +00:00
chg: [objects + retro hunt] refactor retro hunt + objects retro hunts + get objects generator by filters (date_from, sources, mimetypes, ...) 2023-05-10 14:26:46 +00:00			`#### Redis ####`

			`def _parse_zscan(response):`
			`cursor, r = response`
			`it = iter(r)`
			`return str(cursor), list(it)`

			`def zscan_iter(r_redis, name): # count ???`
			`cursor = 0`
			`while cursor != "0":`
			`cursor, data = _parse_zscan(r_redis.zscan(name, cursor=cursor))`
			`yield from data`

			`## -- Redis -- ##`

chg: [module + queues] track + rename object global ID by module 2023-10-11 10:06:01 +00:00			`def rreplace(s, old, new, occurrence):`
			`li = s.rsplit(old, occurrence)`
			`return new.join(li)`

chg: [all] remove old objects + migrate cryptocurrencies module + cleanup code 2022-11-28 14:01:40 +00:00			`def paginate_iterator(iter_elems, nb_obj=50, page=1):`
chg: [MISP export + redis] refactor MISP, export all relationships between objects, relationships between investigated objects + bump redis-py version + theHive export 2023-01-16 15:27:49 +00:00			`dict_page = {'nb_all_elem': len(iter_elems)}`
chg: [all] remove old objects + migrate cryptocurrencies module + cleanup code 2022-11-28 14:01:40 +00:00			`nb_pages = dict_page['nb_all_elem'] / nb_obj`
			`if not nb_pages.is_integer():`
			`nb_pages = int(nb_pages)+1`
			`else:`
			`nb_pages = int(nb_pages)`
			`if page > nb_pages:`
			`page = nb_pages`

			`# multiple pages`
			`if nb_pages > 1:`
			`dict_page['list_elem'] = []`
			`start = nb_obj*(page - 1)`
			`stop = (nb_obj*page) - 1`
			`current_index = 0`
			`for elem in iter_elems:`
			`if current_index > stop:`
			`break`
			`if start <= current_index <= stop:`
			`dict_page['list_elem'].append(elem)`
			`current_index += 1`
			`stop += 1`
			`if stop > dict_page['nb_all_elem']:`
			`stop = dict_page['nb_all_elem']`

			`else:`
			`start = 0`
			`stop = dict_page['nb_all_elem']`
			`dict_page['list_elem'] = list(iter_elems)`
			`dict_page['page'] = page`
			`dict_page['nb_pages'] = nb_pages`
			`# UI`
			`dict_page['nb_first_elem'] = start+1`
			`dict_page['nb_last_elem'] = stop`
			`return dict_page`