#!/usr/bin/env python3
# -*-coding:UTF-8 -*

from packages import Paste
from Helper import Process

import os
import re
import time
import redis
import configparser

from collections import defaultdict

def get_dict_cve(list_paste_cve, only_one_same_cve_by_paste=False):
    """Count CVE identifiers found in a set of pastes and print the ranking.

    Each paste is loaded through ``Paste.Paste(...).get_p_content()`` and
    scanned with the module-level ``reg_cve`` compiled pattern, which must
    be defined before this function is called.

    Args:
        list_paste_cve: iterable of paste identifiers accepted by
            ``Paste.Paste`` (the script passes Redis set members).
        only_one_same_cve_by_paste: when true, a CVE that appears several
            times in the same paste is counted once for that paste; when
            false, every occurrence is counted.

    Returns:
        None. A separator line is printed, followed by one
        ``(cve, count)`` tuple per line, highest count first.
    """
    dict_keyword = {}

    for paste_cve in list_paste_cve:
        # NOTE(review): assumes get_p_content() returns the paste text as
        # str (the pattern is a str pattern) -- confirm against Paste.
        paste_content = Paste.Paste(paste_cve).get_p_content()

        cve_list = reg_cve.findall(paste_content)
        if only_one_same_cve_by_paste:
            # Collapse repeats so each paste contributes at most 1 per CVE.
            cve_list = set(cve_list)

        # Iterate the (possibly de-duplicated) list; re-running findall()
        # here would silently ignore only_one_same_cve_by_paste.
        for cve in cve_list:
            dict_keyword[cve] = dict_keyword.get(cve, 0) + 1

    print('------------------------------------------------')
    # sorted() is stable, so CVEs with equal counts keep insertion order.
    ranking = sorted(dict_keyword.items(), key=lambda entry: entry[1], reverse=True)
    for item in ranking:
        print(item)



if __name__ == '__main__':
    # Script entry point: connect to the ARDB backends described in the AIL
    # configuration file, then print CVE rankings for three paste sets
    # (all CVE-tagged pastes, those not submitted by the crawler, and those
    # submitted by the crawler).

    # CONFIG #
    # AIL_BIN must be set in the environment; a missing variable raises
    # KeyError before the existence check below.
    configfile = os.path.join(os.environ['AIL_BIN'], 'packages/config.cfg')
    if not os.path.exists(configfile):
        raise Exception('Unable to find the configuration file. \
                        Did you set environment variables? \
                        Or activate the virtualenv.')

    cfg = configparser.ConfigParser()
    cfg.read(configfile)

    # Not used further down in this script; kept so the configuration
    # section is still read exactly as before.
    serv_metadata = redis.StrictRedis(
        host=cfg.get("ARDB_Metadata", "host"),
        port=cfg.getint("ARDB_Metadata", "port"),
        db=cfg.getint("ARDB_Metadata", "db"),
        decode_responses=True)

    # port/db are read with getint() so they are passed as integers, the
    # same way as for serv_metadata above.
    serv_tags = redis.StrictRedis(
        host=cfg.get("ARDB_Tags", "host"),
        port=cfg.getint("ARDB_Tags", "port"),
        db=cfg.getint("ARDB_Tags", "db"),
        decode_responses=True)

    # Module-level pattern read by get_dict_cve(): "CVE-", a year-like
    # field starting with 1 or 2, then a 1-7 digit sequence number.
    reg_cve = re.compile(r'CVE-[1-2]\d{1,4}-\d{1,7}')

    # Names of the Redis sets holding the tagged pastes.
    tag_cve = 'infoleak:automatic-detection="cve"'
    tag_crawler = 'infoleak:submission="crawler"'

    # Disabled sanity check: regular + crawler should add up to the total.
    #all_past_cve = serv_tags.smembers('infoleak:automatic-detection="cve"')
    #all_past_cve_regular = serv_tags.sdiff('infoleak:automatic-detection="cve"', 'infoleak:submission="crawler"')
    #all_past_cve_crawler = serv_tags.sinter('infoleak:automatic-detection="cve"', 'infoleak:submission="crawler"')

    #print('{} + {} = {}'.format(len(all_past_cve_regular), len(all_past_cve_crawler), len(all_past_cve)))

    # Every paste tagged as containing a CVE.
    print('ALL_CVE')
    get_dict_cve(serv_tags.smembers(tag_cve), True)
    print()
    print()
    print()
    # CVE-tagged pastes that are NOT in the crawler-submission set.
    print('REGULAR_CVE')
    get_dict_cve(serv_tags.sdiff(tag_cve, tag_crawler), True)
    print()
    print()
    print()
    # CVE-tagged pastes that ARE in the crawler-submission set.
    print('CRAWLER_CVE')
    get_dict_cve(serv_tags.sinter(tag_cve, tag_crawler), True)