2018-05-04 11:53:29 +00:00
|
|
|
#!/usr/bin/env python3
|
2014-08-06 09:43:40 +00:00
|
|
|
# -*-coding:UTF-8 -*
|
|
|
|
|
2019-06-19 13:00:25 +00:00
|
|
|
import os
|
|
|
|
import sys
|
2019-06-24 11:43:16 +00:00
|
|
|
import ssl
|
2019-07-31 11:24:43 +00:00
|
|
|
import json
|
2019-06-24 11:43:16 +00:00
|
|
|
import time
|
2020-04-06 09:22:31 +00:00
|
|
|
import uuid
|
2019-06-19 13:00:25 +00:00
|
|
|
|
2014-08-14 15:55:18 +00:00
|
|
|
import redis
|
2019-05-02 15:31:14 +00:00
|
|
|
import random
|
2019-06-26 14:36:40 +00:00
|
|
|
import logging
|
|
|
|
import logging.handlers
|
2019-06-24 11:43:16 +00:00
|
|
|
|
2019-07-31 11:24:43 +00:00
|
|
|
from flask import Flask, render_template, jsonify, request, Request, Response, session, redirect, url_for
|
2019-05-02 15:31:14 +00:00
|
|
|
from flask_login import LoginManager, current_user, login_user, logout_user, login_required
|
|
|
|
|
2014-08-06 09:43:40 +00:00
|
|
|
import flask
|
2017-04-19 09:02:03 +00:00
|
|
|
import importlib
|
|
|
|
from os.path import join
|
2019-11-18 08:46:15 +00:00
|
|
|
|
|
|
|
# # TODO: put me in lib/Tag
|
|
|
|
from pytaxonomies import Taxonomies
|
|
|
|
|
2016-07-05 14:53:03 +00:00
|
|
|
sys.path.append(os.path.join(os.environ['AIL_BIN'], 'packages/'))
|
2019-11-18 08:46:15 +00:00
|
|
|
import Tag
|
|
|
|
|
2017-04-19 09:02:03 +00:00
|
|
|
sys.path.append('./modules/')
|
2014-12-24 14:42:20 +00:00
|
|
|
|
2019-05-02 15:31:14 +00:00
|
|
|
from User import User
|
|
|
|
|
2019-10-28 12:48:43 +00:00
|
|
|
sys.path.append(os.path.join(os.environ['AIL_BIN'], 'lib/'))
|
|
|
|
import ConfigLoader
|
|
|
|
|
2016-12-09 07:46:37 +00:00
|
|
|
# Import config
|
|
|
|
import Flask_config
|
2016-08-19 11:34:02 +00:00
|
|
|
|
2019-09-25 06:58:18 +00:00
|
|
|
# Import Blueprint
|
|
|
|
from blueprints.root import root
|
2019-10-28 12:48:43 +00:00
|
|
|
from blueprints.crawler_splash import crawler_splash
|
2019-11-14 16:05:58 +00:00
|
|
|
from blueprints.correlation import correlation
|
2020-01-07 15:14:56 +00:00
|
|
|
from blueprints.tags_ui import tags_ui
|
2020-02-17 09:52:25 +00:00
|
|
|
from blueprints.import_export import import_export
|
2020-01-07 15:14:56 +00:00
|
|
|
|
2019-06-19 13:00:25 +00:00
|
|
|
|
2019-07-30 11:49:21 +00:00
|
|
|
Flask_dir = os.environ['AIL_FLASK']
|
|
|
|
|
2016-12-09 07:46:37 +00:00
|
|
|
# CONFIG #
|
2019-10-28 12:48:43 +00:00
|
|
|
config_loader = ConfigLoader.ConfigLoader()
|
|
|
|
baseUrl = config_loader.get_config_str("Flask", "baseurl")
|
2020-07-06 15:13:36 +00:00
|
|
|
host = config_loader.get_config_str("Flask", "host")
|
2018-09-20 08:38:19 +00:00
|
|
|
baseUrl = baseUrl.replace('/', '')
|
|
|
|
if baseUrl != '':
|
|
|
|
baseUrl = '/'+baseUrl
|
2016-08-24 16:00:05 +00:00
|
|
|
|
2020-01-21 10:39:08 +00:00
|
|
|
try:
|
|
|
|
FLASK_PORT = config_loader.get_config_int("Flask", "port")
|
|
|
|
except Exception:
|
|
|
|
FLASK_PORT = 7000
|
|
|
|
|
2019-05-03 14:52:05 +00:00
|
|
|
# ========= REDIS =========#
|
2019-10-28 12:48:43 +00:00
|
|
|
r_serv_db = config_loader.get_redis_conn("ARDB_DB")
|
|
|
|
r_serv_tags = config_loader.get_redis_conn("ARDB_Tags")
|
|
|
|
r_cache = config_loader.get_redis_conn("Redis_Cache")
|
2019-06-26 14:36:40 +00:00
|
|
|
|
|
|
|
# logs
|
|
|
|
log_dir = os.path.join(os.environ['AIL_HOME'], 'logs')
|
|
|
|
if not os.path.isdir(log_dir):
|
|
|
|
os.makedirs(logs_dir)
|
|
|
|
|
2019-07-25 15:26:32 +00:00
|
|
|
# log_filename = os.path.join(log_dir, 'flask_server.logs')
|
|
|
|
# logger = logging.getLogger()
|
|
|
|
# formatter = logging.Formatter('%(asctime)s - %(levelname)s - %(message)s')
|
|
|
|
# handler_log = logging.handlers.TimedRotatingFileHandler(log_filename, when="midnight", interval=1)
|
|
|
|
# handler_log.suffix = '%Y-%m-%d.log'
|
|
|
|
# handler_log.setFormatter(formatter)
|
|
|
|
# handler_log.setLevel(30)
|
|
|
|
# logger.addHandler(handler_log)
|
|
|
|
# logger.setLevel(30)
|
2019-06-26 14:36:40 +00:00
|
|
|
|
2019-05-03 14:52:05 +00:00
|
|
|
# ========= =========#
|
|
|
|
|
2019-06-24 11:43:16 +00:00
|
|
|
# ========= TLS =========#
|
|
|
|
ssl_context = ssl.SSLContext(ssl.PROTOCOL_TLSv1_2)
|
2019-07-30 11:49:21 +00:00
|
|
|
ssl_context.load_cert_chain(certfile=os.path.join(Flask_dir, 'server.crt'), keyfile=os.path.join(Flask_dir, 'server.key'))
|
2019-06-24 11:43:16 +00:00
|
|
|
#print(ssl_context.get_ciphers())
|
|
|
|
# ========= =========#
|
|
|
|
|
2018-09-20 08:38:19 +00:00
|
|
|
Flask_config.app = Flask(__name__, static_url_path=baseUrl+'/static/')
|
2016-12-09 07:46:37 +00:00
|
|
|
app = Flask_config.app
|
2018-06-08 14:49:20 +00:00
|
|
|
app.config['MAX_CONTENT_LENGTH'] = 900 * 1024 * 1024
|
2014-08-26 15:33:28 +00:00
|
|
|
|
2019-09-25 06:58:18 +00:00
|
|
|
# ========= BLUEPRINT =========#
|
|
|
|
app.register_blueprint(root, url_prefix=baseUrl)
|
2019-10-28 12:48:43 +00:00
|
|
|
app.register_blueprint(crawler_splash, url_prefix=baseUrl)
|
2019-11-14 16:05:58 +00:00
|
|
|
app.register_blueprint(correlation, url_prefix=baseUrl)
|
2020-01-07 15:14:56 +00:00
|
|
|
app.register_blueprint(tags_ui, url_prefix=baseUrl)
|
2020-02-17 09:52:25 +00:00
|
|
|
app.register_blueprint(import_export, url_prefix=baseUrl)
|
2019-09-25 06:58:18 +00:00
|
|
|
# ========= =========#
|
|
|
|
|
2020-01-21 10:39:08 +00:00
|
|
|
# ========= Cookie name ========
|
2020-04-06 09:22:31 +00:00
|
|
|
app.config.update(SESSION_COOKIE_NAME='ail_framework_{}'.format(uuid.uuid4().int))
|
2020-01-21 10:39:08 +00:00
|
|
|
|
2019-05-02 15:31:14 +00:00
|
|
|
# ========= session ========
|
|
|
|
app.secret_key = str(random.getrandbits(256))
|
|
|
|
login_manager = LoginManager()
|
2019-09-25 06:58:18 +00:00
|
|
|
login_manager.login_view = 'root.login'
|
2019-05-02 15:31:14 +00:00
|
|
|
login_manager.init_app(app)
|
|
|
|
|
2019-09-25 06:58:18 +00:00
|
|
|
print()
|
|
|
|
|
2019-05-02 15:31:14 +00:00
|
|
|
# ========= LOGIN MANAGER ========
|
|
|
|
|
|
|
|
@login_manager.user_loader
|
|
|
|
def load_user(user_id):
|
|
|
|
return User.get(user_id)
|
|
|
|
|
2019-09-25 06:58:18 +00:00
|
|
|
# ========= HEADER GENERATION ======== DEPRECATED
|
2017-04-25 10:18:08 +00:00
|
|
|
|
|
|
|
# Get headers items that should be ignored (not displayed)
|
|
|
|
toIgnoreModule = set()
|
|
|
|
try:
|
|
|
|
with open('templates/ignored_modules.txt', 'r') as f:
|
|
|
|
lines = f.read().splitlines()
|
|
|
|
for line in lines:
|
|
|
|
toIgnoreModule.add(line)
|
|
|
|
|
|
|
|
except IOError:
|
2019-08-05 14:31:03 +00:00
|
|
|
pass
|
2017-04-25 10:18:08 +00:00
|
|
|
|
2017-04-19 13:14:20 +00:00
|
|
|
# Dynamically import routes and functions from modules
|
|
|
|
# Also, prepare header.html
|
|
|
|
to_add_to_header_dico = {}
|
2019-07-30 11:49:21 +00:00
|
|
|
for root, dirs, files in os.walk(os.path.join(Flask_dir, 'modules')):
|
2017-04-19 13:14:20 +00:00
|
|
|
sys.path.append(join(root))
|
2017-04-25 10:18:08 +00:00
|
|
|
|
|
|
|
# Ignore the module
|
|
|
|
curr_dir = root.split('/')[1]
|
|
|
|
if curr_dir in toIgnoreModule:
|
|
|
|
continue
|
|
|
|
|
2017-04-19 13:14:20 +00:00
|
|
|
for name in files:
|
|
|
|
module_name = root.split('/')[-2]
|
|
|
|
if name.startswith('Flask_') and name.endswith('.py'):
|
|
|
|
if name == 'Flask_config.py':
|
|
|
|
continue
|
|
|
|
name = name.strip('.py')
|
|
|
|
#print('importing {}'.format(name))
|
|
|
|
importlib.import_module(name)
|
|
|
|
elif name == 'header_{}.html'.format(module_name):
|
|
|
|
with open(join(root, name), 'r') as f:
|
|
|
|
to_add_to_header_dico[module_name] = f.read()
|
2014-08-26 15:33:28 +00:00
|
|
|
|
2017-04-19 13:14:20 +00:00
|
|
|
#create header.html
|
|
|
|
complete_header = ""
|
2019-07-30 11:49:21 +00:00
|
|
|
with open(os.path.join(Flask_dir, 'templates', 'header_base.html'), 'r') as f:
|
2017-04-19 13:14:20 +00:00
|
|
|
complete_header = f.read()
|
|
|
|
modified_header = complete_header
|
|
|
|
|
|
|
|
#Add the header in the supplied order
|
2018-04-17 14:06:32 +00:00
|
|
|
for module_name, txt in list(to_add_to_header_dico.items()):
|
2017-04-19 13:14:20 +00:00
|
|
|
to_replace = '<!--{}-->'.format(module_name)
|
|
|
|
if to_replace in complete_header:
|
|
|
|
modified_header = modified_header.replace(to_replace, txt)
|
|
|
|
del to_add_to_header_dico[module_name]
|
|
|
|
|
|
|
|
#Add the header for no-supplied order
|
|
|
|
to_add_to_header = []
|
|
|
|
for module_name, txt in to_add_to_header_dico.items():
|
|
|
|
to_add_to_header.append(txt)
|
|
|
|
|
|
|
|
modified_header = modified_header.replace('<!--insert here-->', '\n'.join(to_add_to_header))
|
|
|
|
|
|
|
|
#Write the header.html file
|
2019-07-30 11:49:21 +00:00
|
|
|
with open(os.path.join(Flask_dir, 'templates', 'header.html'), 'w') as f:
|
2017-04-19 13:14:20 +00:00
|
|
|
f.write(modified_header)
|
|
|
|
|
|
|
|
# ========= JINJA2 FUNCTIONS ========
|
2016-07-05 14:53:03 +00:00
|
|
|
def list_len(s):
|
|
|
|
return len(s)
|
|
|
|
app.jinja_env.filters['list_len'] = list_len
|
|
|
|
|
2016-08-04 09:55:38 +00:00
|
|
|
|
2016-08-09 09:59:36 +00:00
|
|
|
# ========= CACHE CONTROL ========
|
|
|
|
@app.after_request
|
|
|
|
def add_header(response):
|
|
|
|
"""
|
|
|
|
Add headers to both force latest IE rendering engine or Chrome Frame,
|
|
|
|
and also to cache the rendered page for 10 minutes.
|
|
|
|
"""
|
|
|
|
response.headers['X-UA-Compatible'] = 'IE=Edge,chrome=1'
|
2019-09-03 09:58:34 +00:00
|
|
|
if 'Cache-Control' not in response.headers:
|
|
|
|
response.headers['Cache-Control'] = 'private, max-age=0'
|
2016-08-09 09:59:36 +00:00
|
|
|
return response
|
2016-07-21 11:44:22 +00:00
|
|
|
|
2017-04-19 13:14:20 +00:00
|
|
|
# ========== ROUTES ============
|
2019-06-06 19:27:13 +00:00
|
|
|
|
2019-09-25 06:58:18 +00:00
|
|
|
#@app.route('/endpoints')
|
|
|
|
#def endpoints():
|
|
|
|
# for rule in app.url_map.iter_rules():
|
|
|
|
# str_endpoint = str(rule)
|
|
|
|
# if len(str_endpoint)>5:
|
|
|
|
# if str_endpoint[0:5]=='/api/': ## add baseUrl ???
|
|
|
|
# print(str_endpoint)
|
|
|
|
# #print(rule.endpoint) #internal endpoint name
|
|
|
|
# #print(rule.methods)
|
|
|
|
# return 'ok'
|
2017-04-19 13:14:20 +00:00
|
|
|
|
2019-06-20 08:11:23 +00:00
|
|
|
# ========== ERROR HANDLER ============
|
|
|
|
|
2019-07-31 11:24:43 +00:00
|
|
|
@app.errorhandler(405)
|
|
|
|
def _handle_client_error(e):
|
2019-10-28 12:48:43 +00:00
|
|
|
if request.path.startswith('/api/'): ## # TODO: add baseUrl
|
2019-08-06 09:29:12 +00:00
|
|
|
res_dict = {"status": "error", "reason": "Method Not Allowed: The method is not allowed for the requested URL"}
|
|
|
|
anchor_id = request.path[8:]
|
|
|
|
anchor_id = anchor_id.replace('/', '_')
|
2020-04-20 15:50:40 +00:00
|
|
|
api_doc_url = 'https://github.com/ail-project/ail-framework/tree/master/doc#{}'.format(anchor_id)
|
2019-08-06 09:29:12 +00:00
|
|
|
res_dict['documentation'] = api_doc_url
|
|
|
|
return Response(json.dumps(res_dict, indent=2, sort_keys=True), mimetype='application/json'), 405
|
2019-07-31 11:24:43 +00:00
|
|
|
else:
|
|
|
|
return e
|
|
|
|
|
2019-06-20 08:11:23 +00:00
|
|
|
@app.errorhandler(404)
|
2019-07-31 11:24:43 +00:00
|
|
|
def error_page_not_found(e):
|
2019-09-25 06:58:18 +00:00
|
|
|
if request.path.startswith('/api/'): ## # TODO: add baseUrl
|
2019-07-31 11:24:43 +00:00
|
|
|
return Response(json.dumps({"status": "error", "reason": "404 Not Found"}, indent=2, sort_keys=True), mimetype='application/json'), 404
|
|
|
|
else:
|
|
|
|
# avoid endpoint enumeration
|
|
|
|
return page_not_found(e)
|
|
|
|
|
2019-06-20 08:11:23 +00:00
|
|
|
@login_required
|
|
|
|
def page_not_found(e):
|
2019-06-20 08:56:31 +00:00
|
|
|
# avoid endpoint enumeration
|
2019-06-20 08:11:23 +00:00
|
|
|
return render_template('error/404.html'), 404
|
2017-04-19 13:14:20 +00:00
|
|
|
|
2018-05-23 14:58:56 +00:00
|
|
|
# ========== INITIAL taxonomies ============
|
2019-11-18 08:46:15 +00:00
|
|
|
default_taxonomies = ["infoleak", "gdpr", "fpf", "dark-web"]
|
|
|
|
|
|
|
|
# enable default taxonomies
|
|
|
|
for taxo in default_taxonomies:
|
|
|
|
Tag.enable_taxonomy(taxo)
|
2018-05-23 14:58:56 +00:00
|
|
|
|
2018-06-15 15:25:43 +00:00
|
|
|
# ========== INITIAL tags auto export ============
|
2019-11-18 08:46:15 +00:00
|
|
|
taxonomies = Taxonomies()
|
|
|
|
|
2018-06-15 15:25:43 +00:00
|
|
|
infoleak_tags = taxonomies.get('infoleak').machinetags()
|
|
|
|
infoleak_automatic_tags = []
|
|
|
|
for tag in taxonomies.get('infoleak').machinetags():
|
|
|
|
if tag.split('=')[0][:] == 'infoleak:automatic-detection':
|
|
|
|
r_serv_db.sadd('list_export_tags', tag)
|
|
|
|
|
2018-06-19 14:39:49 +00:00
|
|
|
r_serv_db.sadd('list_export_tags', 'infoleak:submission="manual"')
|
2016-12-09 07:46:37 +00:00
|
|
|
# ============ MAIN ============
|
2016-07-08 08:19:24 +00:00
|
|
|
|
2014-08-06 09:43:40 +00:00
|
|
|
if __name__ == "__main__":
|
2020-07-06 15:13:36 +00:00
|
|
|
app.run(host=host, port=FLASK_PORT, threaded=True, ssl_context=ssl_context)
|