2018-06-05 16:58:04 +02:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
# -*-coding:UTF-8 -*
|
|
|
|
|
2023-01-16 16:27:49 +01:00
|
|
|
"""
|
|
|
|
Flask functions and routes for the Item Submit modules page
|
|
|
|
"""
|
2021-04-28 15:24:33 +02:00
|
|
|
##################################
|
|
|
|
# Import External packages
|
|
|
|
##################################
|
2021-05-31 15:31:41 +02:00
|
|
|
import re
|
2018-06-05 16:58:04 +02:00
|
|
|
import os
|
|
|
|
import sys
|
2021-04-28 15:24:33 +02:00
|
|
|
import string
|
|
|
|
import unicodedata
|
2018-06-08 16:49:20 +02:00
|
|
|
import uuid
|
2018-06-14 16:51:06 +02:00
|
|
|
|
2021-04-28 15:24:33 +02:00
|
|
|
from functools import wraps
|
2021-05-28 17:37:46 +02:00
|
|
|
|
|
|
|
# Flask
|
2023-01-16 16:27:49 +01:00
|
|
|
from flask import render_template, jsonify, request, Blueprint, url_for, redirect, abort
|
2021-04-28 15:24:33 +02:00
|
|
|
from Role_Manager import login_admin, login_analyst
|
|
|
|
from flask_login import login_required
|
|
|
|
|
2018-06-05 16:58:04 +02:00
|
|
|
|
2021-04-28 15:24:33 +02:00
|
|
|
##################################
|
|
|
|
# Import Project packages
|
|
|
|
##################################
|
2022-09-01 14:04:00 +02:00
|
|
|
from lib import Tag
|
|
|
|
|
2022-10-25 16:25:19 +02:00
|
|
|
from packages import Import_helper
|
2022-11-28 15:01:40 +01:00
|
|
|
|
2018-06-14 16:51:06 +02:00
|
|
|
|
2018-06-05 16:58:04 +02:00
|
|
|
# ============ VARIABLES ============
import Flask_config

# Handles exposed by the project-level Flask configuration module
app = Flask_config.app
baseUrl = Flask_config.baseUrl

r_serv_db = Flask_config.r_serv_db # TODO REMOVE ME
r_serv_log_submit = Flask_config.r_serv_log_submit # TODO REMOVE ME

logger = Flask_config.redis_logger

# Default whitelist for clean_filename(): "-", "_", space, ASCII letters, digits
valid_filename_chars = f"-_ {string.ascii_letters}{string.digits}"

UPLOAD_FOLDER = Flask_config.UPLOAD_FOLDER

# Configured limits are byte counts; scale them (10^6 / 10^9) for display in
# the submission template.
text_max_size = int(Flask_config.SUBMIT_PASTE_TEXT_MAX_SIZE) / 1_000_000
file_max_size = int(Flask_config.SUBMIT_PASTE_FILE_MAX_SIZE) / 1_000_000_000
allowed_extensions = ", ".join(Flask_config.SUBMIT_PASTE_FILE_ALLOWED_EXTENSIONS)

PasteSubmit = Blueprint('PasteSubmit', __name__, template_folder='templates')
|
2021-04-28 15:24:33 +02:00
|
|
|
|
|
|
|
# ============ Validators ============
|
|
|
|
def limit_content_length():
    """Build a decorator that rejects over-sized submissions with HTTP 413.

    The wrapped view is aborted when the request declares a Content-Length
    that is larger than ``Flask_config.SUBMIT_PASTE_FILE_MAX_SIZE``, or larger
    than ``Flask_config.SUBMIT_PASTE_TEXT_MAX_SIZE`` while no ``file`` part is
    present in the request. Requests without a Content-Length are passed
    through unchanged.
    """
    def decorator(f):
        @wraps(f)
        def wrapper(*args, **kwargs):
            logger.debug('decorator')
            declared_size = request.content_length

            # No declared length: nothing to compare against.
            if declared_size is None:
                return f(*args, **kwargs)

            too_large = declared_size > Flask_config.SUBMIT_PASTE_FILE_MAX_SIZE
            if not too_large:
                # Text-only submissions are held to the smaller text limit.
                too_large = ('file' not in request.files
                             and declared_size > Flask_config.SUBMIT_PASTE_TEXT_MAX_SIZE)

            if too_large:
                logger.debug('abort')
                abort(413)

            return f(*args, **kwargs)
        return wrapper
    return decorator
|
|
|
|
|
|
|
|
|
2018-06-05 16:58:04 +02:00
|
|
|
# ============ FUNCTIONS ============
|
|
|
|
|
2018-06-06 10:05:25 +02:00
|
|
|
def allowed_file(filename):
    """Tell whether an uploaded file name may be accepted.

    A name without any dot is always accepted. Otherwise the text after the
    last dot, lower-cased, must be listed in
    ``Flask_config.SUBMIT_PASTE_FILE_ALLOWED_EXTENSIONS``.
    """
    _, separator, extension = filename.rpartition('.')
    if not separator:
        # No dot at all: extension-less uploads are accepted as-is.
        return True

    extension = extension.lower()
    logger.debug(extension)
    return extension in Flask_config.SUBMIT_PASTE_FILE_ALLOWED_EXTENSIONS
|
2018-06-06 10:05:25 +02:00
|
|
|
|
2018-06-05 16:58:04 +02:00
|
|
|
def clean_filename(filename, whitelist=valid_filename_chars, replace=' '):
    """Return a sanitised copy of ``filename``.

    Every element of ``replace`` found in the name is turned into ``_``, the
    result is NFKD-normalised and stripped of non-ASCII characters, and
    finally only the characters contained in ``whitelist`` are kept.
    """
    # Substitute the unwanted characters with underscores.
    for unwanted in replace:
        filename = filename.replace(unwanted, '_')

    # Decompose accented characters, then drop whatever is not plain ASCII.
    decomposed = unicodedata.normalize('NFKD', filename)
    ascii_only = decomposed.encode('ASCII', 'ignore').decode()

    # Keep whitelisted characters only.
    return ''.join(filter(lambda char: char in whitelist, ascii_only))
|
|
|
|
|
|
|
|
# ============= ROUTES ==============
|
|
|
|
|
|
|
|
@PasteSubmit.route("/PasteSubmit/", methods=['GET'])
@login_required
@login_analyst
def PasteSubmit_page():
    """Render the item submission form.

    The template receives the currently active taxonomies and galaxies along
    with the configured text/file size limits and the allowed file extensions.
    """
    # Taxonomies are fetched before galaxies, as entries are evaluated in order.
    template_context = {
        'active_taxonomies': Tag.get_active_taxonomies(),
        'active_galaxies': Tag.get_active_galaxies(),
        'text_max_size': text_max_size,
        'file_max_size': file_max_size,
        'allowed_extensions': allowed_extensions,
    }
    return render_template("submit_items.html", **template_context)
|
2018-06-05 16:58:04 +02:00
|
|
|
|
|
|
|
@PasteSubmit.route("/PasteSubmit/submit", methods=['POST'])
@login_required
@login_analyst
@limit_content_length()
def submit():
    """Handle a manual submission made of an uploaded file or pasted text.

    Form fields read: ``archive_pass``, ``tags_taxonomies``, ``tags_galaxies``,
    ``paste_content`` and ``paste_source``; an optional upload is read from the
    ``file`` part. After validation the content is handed over to
    ``Import_helper.create_import_queue`` under a freshly generated UUID.

    Returns:
        The rendered ``submit_items.html`` template carrying the import UUID
        when an import was queued, a ``(message, 400)`` tuple when the source
        name, the tags, the file extension or the text size is rejected, or
        the plain submission page when neither a file nor text was provided.
    """
    logger.debug('submit')

    password = request.form['archive_pass']
    ltags = request.form['tags_taxonomies']
    ltagsgalaxies = request.form['tags_galaxies']
    paste_content = request.form['paste_content']
    paste_source = request.form['paste_source']

    if paste_source:
        # limit source length
        paste_source = paste_source.replace('/', '')[:80]
        if paste_source in ['crawled', 'tests']:
            content = 'Invalid source'
            logger.info(paste_source)
            return content, 400

        # fullmatch (instead of match + '$') also rejects a trailing newline;
        # the raw string avoids invalid escape sequences in the pattern.
        if not re.fullmatch(r'[0-9a-zA-Z\-_+@#&.;=:!]*', paste_source):
            content = 'Invalid source name: Forbidden character(s)'
            logger.info(content)
            return content, 400

    # A file is only considered submitted when the part exists and has a name.
    file_import = request.files.get('file')
    is_file = bool(file_import and file_import.filename)
    logger.debug(f'is file ? {is_file}')

    submitted_tag = 'infoleak:submission="manual"'

    # active taxonomies
    active_taxonomies = Tag.get_active_taxonomies()
    # active galaxies
    active_galaxies = Tag.get_active_galaxies()

    if ltags or ltagsgalaxies:
        logger.debug(f'ltags ? {ltags} {ltagsgalaxies}')
        ltags = Tag.unpack_str_tags_list(ltags)
        ltagsgalaxies = Tag.unpack_str_tags_list(ltagsgalaxies)

        if not Tag.is_valid_tags_taxonomies_galaxy(ltags, ltagsgalaxies):
            content = 'INVALID TAGS'
            logger.info(content)
            return content, 400

    # add submitted tags
    if not ltags:
        ltags = []
    ltags.append(submitted_tag)

    if is_file:
        logger.debug('file management')
        filename = file_import.filename

        if not allowed_file(filename):
            content = f'wrong file type, allowed_extensions: {allowed_extensions} or remove the extension'
            logger.info(content)
            return content, 400

        logger.debug('file extension allowed')

        # get UUID
        UUID = str(uuid.uuid4())

        # create submitted dir (exist_ok tolerates a concurrent request
        # creating the folder between the check and the call)
        if not os.path.exists(UPLOAD_FOLDER):
            logger.debug('create folder')
            os.makedirs(UPLOAD_FOLDER, exist_ok=True)

        # The stored name is the UUID, keeping the original extension if any.
        if '.' not in filename:
            logger.debug('add UUID to path')
            full_path = os.path.join(UPLOAD_FOLDER, UUID)
        else:
            if filename.endswith('tar.gz'):
                logger.debug('file extension is tar.gz')
                file_type = 'tar.gz'
            else:
                file_type = filename.rsplit('.', 1)[1]
                logger.debug(f'file type {file_type}')
            name = UUID + '.' + file_type
            full_path = os.path.join(UPLOAD_FOLDER, name)
            logger.debug(f'full path {full_path}')

        # Flask verify the file size
        file_import.save(full_path)
        logger.debug('file saved')

        Import_helper.create_import_queue(ltags, ltagsgalaxies, full_path, UUID, password, True)

        return render_template("submit_items.html",
                               active_taxonomies=active_taxonomies,
                               active_galaxies=active_galaxies,
                               UUID=UUID)

    elif paste_content != '':
        logger.debug('entering text paste management')

        # Measure the encoded payload: sys.getsizeof() reports the in-memory
        # footprint of the str object, not the number of bytes submitted.
        paste_size = len(paste_content.encode('utf-8', 'replace'))
        if paste_size >= Flask_config.SUBMIT_PASTE_TEXT_MAX_SIZE:
            content = f'text paste size is over {Flask_config.SUBMIT_PASTE_TEXT_MAX_SIZE} bytes limit'
            logger.info(content)
            return content, 400

        logger.debug(f'size {paste_size}')
        # get id
        UUID = str(uuid.uuid4())
        logger.debug('create import')
        Import_helper.create_import_queue(ltags, ltagsgalaxies, paste_content, UUID, password, source=paste_source)
        logger.debug('import OK')
        return render_template("submit_items.html",
                               active_taxonomies=active_taxonomies,
                               active_galaxies=active_galaxies,
                               UUID=UUID)

    # NOTE(review): neither a file nor text was submitted. An unreachable
    # 'submit aborded' / 400 branch that followed the size check was dropped;
    # confirm that re-rendering the form is the intended outcome here.
    return PasteSubmit_page()
|
2018-06-05 16:58:04 +02:00
|
|
|
|
|
|
|
@PasteSubmit.route("/PasteSubmit/submit_status", methods=['GET'])
@login_required
@login_analyst
def submit_status():
    """Report the progress of the import identified by the ``UUID`` query arg.

    The counters are read from ``r_serv_log_submit`` under the keys
    ``<UUID>:end``, ``:nb_total``, ``:nb_end``, ``:error``, ``:processing``,
    ``:nb_sucess`` and the set ``<UUID>:paste_submit_link``.

    Returns:
        A JSON object with ``end``, ``in_progress``, ``prog``, ``link``,
        ``processing``, ``isError`` and ``error`` once the mandatory counters
        exist; the string ``'to do'`` while they are missing; the string
        ``'INVALID UUID'`` when no UUID was supplied.
    """
    from html import escape  # only needed to build the link markup below

    UUID = request.args.get('UUID')
    if not UUID:
        return 'INVALID UUID'

    end = r_serv_log_submit.get(UUID + ':end')
    nb_total = r_serv_log_submit.get(UUID + ':nb_total')
    nb_end = r_serv_log_submit.get(UUID + ':nb_end')
    error = r_serv_log_submit.get(UUID + ':error')
    processing = r_serv_log_submit.get(UUID + ':processing')
    nb_sucess = r_serv_log_submit.get(UUID + ':nb_sucess')
    paste_submit_link = list(r_serv_log_submit.smembers(UUID + ':paste_submit_link'))

    if end is None or nb_total is None or nb_end is None or processing is None:
        # FIXME TODO
        logger.debug(f'submit status incomplete: end={end} nb_total={nb_total} nb_end={nb_end} '
                     f'error={error} processing={processing} nb_sucess={nb_sucess}')
        return 'to do'

    # The success counter is not part of the guard above; a missing value
    # would otherwise break the string concatenation below.
    if nb_sucess is None:
        nb_sucess = '0'

    # One anchor per imported item; values are escaped because the markup is
    # shipped to the browser as ready-to-insert HTML.
    anchors = []
    for paste in paste_submit_link:
        url = url_for('objects_item.showItem', id=paste)
        anchors.append('<a target="_blank" href="' + escape(url, quote=True)
                       + '" class="list-group-item">' + escape(paste) + '</a>')
    link = ''.join(anchors)

    # A total of '-1' is displayed without a denominator.
    if nb_total == '-1':
        in_progress = nb_sucess + ' / '
    else:
        in_progress = nb_sucess + ' / ' + nb_total

    # Only compute a percentage for a positive total: 0 would divide by zero
    # and '-1' would yield a negative progress value.
    total = int(nb_total)
    if total > 0:
        prog = int(int(nb_end) * 100 / total)
    else:
        prog = 0

    isError = bool(error)

    # Flags are stored as strings; anything other than '0' counts as true.
    end = end != '0'
    processing = processing != '0'

    return jsonify(end=end,
                   in_progress=in_progress,
                   prog=prog,
                   link=link,
                   processing=processing,
                   isError=isError,
                   error=error)
|
2018-06-05 16:58:04 +02:00
|
|
|
|
2018-06-14 16:51:06 +02:00
|
|
|
|
2018-06-05 16:58:04 +02:00
|
|
|
# ========= REGISTRATION =========
|
2018-09-20 10:38:19 +02:00
|
|
|
# Attach the PasteSubmit routes to the Flask application under the configured base URL prefix.
app.register_blueprint(PasteSubmit, url_prefix=baseUrl)
|