2019-01-30 14:30:01 +01:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
# -*- coding: utf-8 -*-
|
|
|
|
|
|
|
|
from zipfile import ZipFile, ZIP_DEFLATED
|
|
|
|
from io import BytesIO
|
|
|
|
import os
|
2020-01-06 15:32:38 +01:00
|
|
|
from pathlib import Path
|
2020-04-22 12:03:10 +02:00
|
|
|
from datetime import datetime, timedelta
|
2020-05-23 03:37:24 +02:00
|
|
|
import json
|
2020-08-07 13:11:16 +02:00
|
|
|
import http
|
2019-01-30 14:30:01 +01:00
|
|
|
|
2020-06-26 12:07:25 +02:00
|
|
|
from flask import Flask, render_template, request, send_file, redirect, url_for, Response, flash, jsonify
|
2020-01-06 15:32:38 +01:00
|
|
|
from flask_bootstrap import Bootstrap # type: ignore
|
2020-04-01 17:44:06 +02:00
|
|
|
from flask_httpauth import HTTPDigestAuth # type: ignore
|
2019-01-30 14:30:01 +01:00
|
|
|
|
2020-09-21 16:41:30 +02:00
|
|
|
from lookyloo.helpers import get_homedir, update_user_agents, get_user_agents, get_config
|
2020-06-13 02:49:07 +02:00
|
|
|
from lookyloo.lookyloo import Lookyloo, Indexing
|
2020-06-29 11:59:01 +02:00
|
|
|
from lookyloo.exceptions import NoValidHarFile, MissingUUID
|
2020-04-22 14:58:01 +02:00
|
|
|
from .proxied import ReverseProxied
|
2019-01-30 14:30:01 +01:00
|
|
|
|
2020-10-01 11:48:00 +02:00
|
|
|
from typing import Optional, Dict, Any, Union
|
2019-01-30 14:30:01 +01:00
|
|
|
|
2020-04-03 17:51:58 +02:00
|
|
|
import logging
|
|
|
|
|
2020-01-06 15:32:38 +01:00
|
|
|
# Flask application, wrapped so it can be served behind a reverse proxy.
app: Flask = Flask(__name__)
app.wsgi_app = ReverseProxied(app.wsgi_app)  # type: ignore

# The session secret is persisted in the home directory; it is (re)generated
# when the file is missing or shorter than 64 bytes.
secret_file_path: Path = get_homedir() / 'secret_key'

secret_is_usable = secret_file_path.exists() and secret_file_path.stat().st_size >= 64
if not secret_is_usable:
    secret_file_path.write_bytes(os.urandom(64))

app.config['SECRET_KEY'] = secret_file_path.read_bytes()

Bootstrap(app)
app.config['BOOTSTRAP_SERVE_LOCAL'] = True
app.config['SESSION_COOKIE_NAME'] = 'lookyloo'
app.debug = False

# Digest authentication, used by the routes decorated with auth.login_required.
auth = HTTPDigestAuth()

lookyloo: Lookyloo = Lookyloo()

# Values read once from the 'generic' configuration at import time.
user = get_config('generic', 'cache_clean_user')
time_delta_on_index = get_config('generic', 'time_delta_on_index')
blur_screenshot = get_config('generic', 'enable_default_blur_screenshot')

logging.basicConfig(level=get_config('generic', 'loglevel'))
|
2020-04-03 17:51:58 +02:00
|
|
|
|
2020-04-01 17:44:06 +02:00
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
# ##### Global methods passed to jinja
|
|
|
|
|
2020-05-23 03:37:24 +02:00
|
|
|
# Method to make sizes in bytes human readable
|
|
|
|
# Source: https://stackoverflow.com/questions/1094841/reusable-library-to-get-human-readable-version-of-file-size
|
|
|
|
def sizeof_fmt(num, suffix='B'):
    """Format a size as a human readable string using binary prefixes.

    The value is divided by 1024 until its absolute value is below 1024,
    then rendered with one decimal, the matching prefix and ``suffix``
    (e.g. ``1536`` -> ``'1.5KiB'``). Anything that is still too large after
    the 'Zi' prefix is expressed in 'Yi'.
    """
    prefixes = ('', 'Ki', 'Mi', 'Gi', 'Ti', 'Pi', 'Ei', 'Zi')
    value = num
    for prefix in prefixes:
        if abs(value) < 1024.0:
            return f"{value:3.1f}{prefix}{suffix}"
        value = value / 1024.0
    return f"{value:.1f}Yi{suffix}"
|
|
|
|
|
|
|
|
|
|
|
|
# Expose sizeof_fmt to the jinja templates.
app.jinja_env.globals['sizeof_fmt'] = sizeof_fmt
|
|
|
|
|
|
|
|
|
2020-08-07 13:11:16 +02:00
|
|
|
def http_status_description(code: int) -> str:
    """Return the standard reason phrase for an HTTP status code.

    :param code: numeric HTTP status code (e.g. 404).
    :return: the phrase from ``http.client.responses`` (e.g. 'Not Found'),
             or ``'Invalid code: <code>'`` when the code is unknown.
    """
    # Import the submodule explicitly: a bare ``import http`` does not load
    # ``http.client``, so ``http.client.responses`` only resolves if another
    # module happened to import it first.
    from http.client import responses

    return responses.get(code, f'Invalid code: {code}')
|
2020-08-07 13:11:16 +02:00
|
|
|
|
|
|
|
|
|
|
|
# Expose http_status_description to the jinja templates.
app.jinja_env.globals['http_status_description'] = http_status_description
|
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
# ##### Generic/configuration methods #####
|
|
|
|
|
2020-06-25 16:43:36 +02:00
|
|
|
@app.after_request
def after_request(response):
    """Hand the client's User-Agent and address to lookyloo after each request.

    Nothing is recorded when the request has no User-Agent header. The
    response is returned untouched.
    """
    user_agent = request.headers.get('User-Agent')
    if user_agent:
        # Prefer the X-Real-IP header when present, otherwise fall back to
        # the address of the direct peer.
        client_ip = request.headers.get('X-Real-IP') or request.remote_addr
        lookyloo.cache_user_agents(user_agent, client_ip)
    return response
|
|
|
|
|
|
|
|
|
2020-04-01 17:44:06 +02:00
|
|
|
@auth.get_password
def get_pw(username: str) -> Optional[str]:
    """Return the password configured for ``username``, or None if unknown.

    Credentials come from the 'cache_clean_user' configuration entry.
    """
    return user.get(username)
|
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
# ##### Hostnode level methods #####
|
2019-01-30 14:30:01 +01:00
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/host/<string:node_uuid>/hashes', methods=['GET'])
def hashes_hostnode(tree_uuid: str, node_uuid: str):
    """Download the hashes of a host node as a text file, one per line.

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the host node in that capture.
    """
    hashes = lookyloo.get_hashes(tree_uuid, hostnode_uuid=node_uuid)
    content = BytesIO('\n'.join(hashes).encode())
    # The MIME type was previously misspelled 'test/plain'.
    return send_file(content, mimetype='text/plain', as_attachment=True,
                     attachment_filename=f'hashes.{node_uuid}.txt')
|
2019-01-30 14:30:01 +01:00
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/host/<string:node_uuid>/text', methods=['GET'])
def urls_hostnode(tree_uuid: str, node_uuid: str):
    """Download the URLs of a host node as a text file, one per line.

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the host node in that capture.
    """
    hostnode = lookyloo.get_hostnode_from_tree(tree_uuid, node_uuid)
    content = BytesIO('\n'.join(url.name for url in hostnode.urls).encode())
    # The MIME type was previously misspelled 'test/plain'.
    return send_file(content, mimetype='text/plain', as_attachment=True,
                     attachment_filename=f'urls.{node_uuid}.txt')
|
2019-01-30 14:30:01 +01:00
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/host/<string:node_uuid>', methods=['GET'])
def hostnode_popup(tree_uuid: str, node_uuid: str):
    """Render the popup with the details of one host node.

    The template receives the host node and its URLs (as returned by
    ``lookyloo.get_hostnode_investigator``), two maps of icon paths for
    response and request keys, and the 'enable_context_by_users' setting.
    """
    # Icons for the response keys. Insertion order is kept as is.
    response_icons = {
        'js': "/static/javascript.png",
        'exe': "/static/exe.png",
        'css': "/static/css.png",
        'font': "/static/font.png",
        'html': "/static/html.png",
        'json': "/static/json.png",
        'text': "/static/json.png",  # FIXME: Need new icon
        'iframe': "/static/ifr.png",
        'image': "/static/img.png",
        'unset_mimetype': "/static/wtf.png",
        'octet-stream': "/static/wtf.png",
        'unknown_mimetype': "/static/wtf.png",
        'video': "/static/video.png",
        'livestream': "/static/video.png",
        'response_cookie': "/static/cookie_received.png",
        # redirect has to be last
        'redirect': "/static/redirect.png",
        'redirect_to_nothing': "/static/cookie_in_url.png"
    }
    # Icons for the request keys.
    request_icons = {
        'request_cookie': "/static/cookie_read.png",
    }
    context_enabled = bool(get_config('generic', 'enable_context_by_users'))

    hostnode, urls = lookyloo.get_hostnode_investigator(tree_uuid, node_uuid)

    template_args = {
        'tree_uuid': tree_uuid,
        'hostnode_uuid': node_uuid,
        'hostnode': hostnode,
        'urls': urls,
        'keys_response': response_icons,
        'keys_request': request_icons,
        'enable_context_by_users': context_enabled,
    }
    return render_template('hostname_popup.html', **template_args)
|
2020-05-23 03:37:24 +02:00
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
# ##### Tree level Methods #####
|
2020-05-26 17:45:04 +02:00
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/rebuild')
@auth.login_required
def rebuild_tree(tree_uuid: str):
    """Remove the pickle of a capture, then redirect to its tree view.

    Requires authentication. On any exception the user is redirected to
    the index instead.
    """
    try:
        lookyloo.remove_pickle(tree_uuid)
        destination = url_for('tree', tree_uuid=tree_uuid)
        return redirect(destination)
    except Exception:
        # Best effort: whatever went wrong, fall back to the index page.
        return redirect(url_for('index'))
|
2019-01-30 14:30:01 +01:00
|
|
|
|
|
|
|
|
2020-04-20 16:41:42 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/trigger_modules/', defaults={'force': False})
@app.route('/tree/<string:tree_uuid>/trigger_modules/<int:force>', methods=['GET'])
def trigger_modules(tree_uuid: str, force: int):
    """Trigger the modules on a capture, then redirect to the modules page.

    :param tree_uuid: UUID of the capture.
    :param force: any non-zero value is passed on as ``True``.
    """
    forced = bool(force)
    lookyloo.trigger_modules(tree_uuid, forced)
    return redirect(url_for('modules', tree_uuid=tree_uuid))
|
|
|
|
|
|
|
|
|
2020-05-13 17:31:27 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/stats', methods=['GET'])
def stats(tree_uuid: str):
    """Render the statistics page of a capture."""
    statistics = lookyloo.get_statistics(tree_uuid)
    return render_template('statistics.html', uuid=tree_uuid, stats=statistics)
|
|
|
|
|
|
|
|
|
2020-04-20 16:41:42 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/modules', methods=['GET'])
def modules(tree_uuid: str):
    """Render a summary of the module responses for a capture.

    Redirects to the tree view when there are no module responses. The
    'vt' and 'pi' entries are popped from the responses and condensed
    into per-URL summaries before being handed to the template.
    """
    modules_responses = lookyloo.get_modules_responses(tree_uuid)
    if not modules_responses:
        return redirect(url_for('tree', tree_uuid=tree_uuid))

    vt_short_result: Dict[str, Dict[str, Any]] = {}
    if 'vt' in modules_responses:
        # VirusTotal cleanup: keep the permalink and the malicious verdicts.
        vt_reports = modules_responses.pop('vt')
        for url, report in vt_reports.items():
            analysis = report['attributes']['last_analysis_results']
            vt_short_result[url] = {
                'permaurl': f'https://www.virustotal.com/gui/url/{report["id"]}/detection',
                'malicious': [(vendor, verdict['result'])
                              for vendor, verdict in analysis.items()
                              if verdict['category'] == 'malicious'],
            }

    pi_short_result: Dict[str, str] = {}
    if 'pi' in modules_responses:
        pi_reports = modules_responses.pop('pi')
        for url, report in pi_reports.items():
            if report:
                # Only the tag label of the first result is kept.
                pi_short_result[url] = report['results'][0]['tag_label']

    return render_template('modules.html', uuid=tree_uuid, vt=vt_short_result, pi=pi_short_result)
|
2020-04-20 16:41:42 +02:00
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/redirects', methods=['GET'])
def redirects(tree_uuid: str):
    """Download the redirect chain of a capture as a text file.

    The file holds one URL per line, starting with the captured URL.
    A short plain-text message is returned instead when the capture has
    no cache entry or no redirects.
    """
    cache = lookyloo.capture_cache(tree_uuid)
    # 'text/text' is not a valid media type; plain text is 'text/plain'.
    if not cache:
        return Response('Not available.', mimetype='text/plain')
    if not cache['redirects']:
        return Response('No redirects.', mimetype='text/plain')

    chain = list(cache['redirects'])  # type: ignore
    if cache['url'] != chain[0]:
        # Make sure the initial URL opens the list.
        chain.insert(0, cache['url'])
    to_return = BytesIO('\n'.join(chain).encode())
    return send_file(to_return, mimetype='text/plain',
                     as_attachment=True, attachment_filename='redirects.txt')
|
|
|
|
|
|
|
|
|
2019-01-30 14:30:01 +01:00
|
|
|
@app.route('/tree/<string:tree_uuid>/image', methods=['GET'])
def image(tree_uuid: str):
    """Download the screenshot of a capture as 'image.png'."""
    screenshot = lookyloo.get_screenshot(tree_uuid)
    return send_file(screenshot, mimetype='image/png', as_attachment=True,
                     attachment_filename='image.png')
|
|
|
|
|
|
|
|
|
2020-05-12 16:53:10 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/html', methods=['GET'])
def html(tree_uuid: str):
    """Download the HTML of a capture as 'page.html'."""
    page = lookyloo.get_html(tree_uuid)
    return send_file(page, mimetype='text/html', as_attachment=True,
                     attachment_filename='page.html')
|
|
|
|
|
|
|
|
|
2020-05-26 17:45:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/cookies', methods=['GET'])
def cookies(tree_uuid: str):
    """Download the cookies of a capture as 'cookies.json'."""
    cookie_jar = lookyloo.get_cookies(tree_uuid)
    return send_file(cookie_jar, mimetype='application/json', as_attachment=True,
                     attachment_filename='cookies.json')
|
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/hashes', methods=['GET'])
def hashes_tree(tree_uuid: str):
    """Download the hashes of a whole capture as a text file, one per line.

    :param tree_uuid: UUID of the capture.
    """
    hashes = lookyloo.get_hashes(tree_uuid)
    content = BytesIO('\n'.join(hashes).encode())
    # The MIME type was previously misspelled 'test/plain'.
    return send_file(content, mimetype='text/plain', as_attachment=True,
                     attachment_filename='hashes.txt')
|
|
|
|
|
|
|
|
|
2020-05-12 16:53:10 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/export', methods=['GET'])
def export(tree_uuid: str):
    """Download a capture as 'capture.zip'."""
    archive = lookyloo.get_capture(tree_uuid)
    return send_file(archive, mimetype='application/zip', as_attachment=True,
                     attachment_filename='capture.zip')
|
|
|
|
|
|
|
|
|
2020-08-10 12:35:16 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/hide', methods=['GET'])
@auth.login_required
def hide_capture(tree_uuid: str):
    """Hide a capture, then redirect to its tree view. Requires authentication."""
    lookyloo.hide_capture(tree_uuid)
    tree_url = url_for('tree', tree_uuid=tree_uuid)
    return redirect(tree_url)
|
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/cache', methods=['GET'])
def cache_tree(tree_uuid: str):
    """Ask lookyloo to cache the tree of a capture, then redirect to the index."""
    lookyloo.cache_tree(tree_uuid)
    index_url = url_for('index')
    return redirect(index_url)
|
|
|
|
|
|
|
|
|
2020-05-11 19:58:46 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/send_mail', methods=['POST', 'GET'])
def send_mail(tree_uuid: str):
    """Send a mail about a capture, then redirect to its tree view.

    The optional 'email' and 'comment' form fields are forwarded to
    ``lookyloo.send_mail``; missing fields become empty strings.
    """
    form = request.form
    email: str = form.get('email') or ''  # type: ignore
    if '@' not in email:
        # skip clearly incorrect emails
        email = ''
    comment: str = form.get('comment') or ''  # type: ignore
    lookyloo.send_mail(tree_uuid, email, comment)
    return redirect(url_for('tree', tree_uuid=tree_uuid))
|
|
|
|
|
|
|
|
|
2019-01-30 14:30:01 +01:00
|
|
|
@app.route('/tree/<string:tree_uuid>', methods=['GET'])
@app.route('/tree/<string:tree_uuid>/<string:urlnode_uuid>', methods=['GET'])
def tree(tree_uuid: str, urlnode_uuid: Optional[str]=None):
    """Render the tree view of a capture.

    Redirects to the index, with a flashed error, when the UUID is the
    literal string 'False', is unknown, or has no usable cache entry.
    A capture whose HAR file is invalid renders the error page instead.
    """
    if tree_uuid == 'False':
        flash("Unable to process your request. The domain may not exist, or splash isn't started", 'error')
        return redirect(url_for('index'))

    try:
        cache = lookyloo.capture_cache(tree_uuid)
    except MissingUUID:
        flash(f'Unable to find this UUID ({tree_uuid}). The capture may still be ongoing, try again later.', 'error')
        return redirect(url_for('index'))

    if not cache:
        flash('Invalid cache.', 'error')
        return redirect(url_for('index'))

    if 'error' in cache:
        # The error is displayed, but the tree is still rendered.
        flash(cache['error'], 'error')

    try:
        mail_enabled = bool(get_config('generic', 'enable_mail_notification'))
        context_enabled = bool(get_config('generic', 'enable_context_by_users'))
        tree_json, start_time, user_agent, root_url, meta = lookyloo.load_tree(tree_uuid)
        return render_template(
            'tree.html',
            tree_json=tree_json,
            start_time=start_time,
            user_agent=user_agent,
            root_url=root_url,
            tree_uuid=tree_uuid,
            meta=meta,
            enable_mail_notification=mail_enabled,
            enable_context_by_users=context_enabled,
            blur_screenshot=blur_screenshot,
            urlnode_uuid=urlnode_uuid,
            has_redirects=bool(cache['redirects']))
    except NoValidHarFile as e:
        return render_template('error.html', error_message=e)
|
2019-01-30 14:30:01 +01:00
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/mark_as_legitimate', methods=['POST'])
@auth.login_required
def mark_as_legitimate(tree_uuid: str):
    """Mark a capture as legitimate. Requires authentication.

    When the request has a body, it is parsed as JSON and its entries are
    passed to ``lookyloo.add_to_legitimate`` as keyword arguments.
    """
    legitimate_entries = request.get_json(force=True) if request.data else {}
    lookyloo.add_to_legitimate(tree_uuid, **legitimate_entries)
    return jsonify({'message': 'Legitimate entry added.'})
|
|
|
|
|
|
|
|
|
|
|
|
# ##### helpers #####
|
|
|
|
|
2020-05-18 18:32:59 +02:00
|
|
|
def index_generic(show_hidden: bool=False):
    """Render the index page listing the cached captures.

    :param show_hidden: when true, list only the captures flagged
                        'no_index'; otherwise list only the others.

    Captures without cache or timestamp are skipped, as are those older
    than the 'time_delta_on_index' setting when it is set. Entries are
    sorted by timestamp, then URL, in descending order.
    """
    # Optional cut-off used to filter the captures on the index.
    cut_time = datetime.now() - timedelta(**time_delta_on_index) if time_delta_on_index else None
    only_hidden = bool(show_hidden)

    titles = []
    for capture_uuid in lookyloo.capture_uuids:
        cached = lookyloo.capture_cache(capture_uuid)
        if not cached:
            continue
        if ('no_index' in cached) != only_hidden:
            # Hidden captures only go on the hidden index, and vice versa.
            continue
        if 'timestamp' not in cached:
            # this is a buggy capture, skip
            continue
        # The last character of the timestamp is dropped before parsing.
        if cut_time and datetime.fromisoformat(cached['timestamp'][:-1]) < cut_time:  # type: ignore
            continue
        incomplete = cached['incomplete_redirects'] == '1'
        titles.append((cached['uuid'], cached['title'], cached['timestamp'], cached['url'],
                       cached['redirects'], incomplete))

    titles.sort(key=lambda entry: (entry[2], entry[3]), reverse=True)
    return render_template('index.html', titles=titles)
|
2020-04-23 00:12:10 +02:00
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
# ##### Index level methods #####
|
|
|
|
|
2020-04-23 00:12:10 +02:00
|
|
|
@app.route('/', methods=['GET'])
def index():
    """Render the index page; HEAD requests only get a short 'Ack'."""
    is_ping = request.method == 'HEAD'
    if is_ping:
        # Just returns ack if the webserver is running
        return 'Ack'
    update_user_agents()
    return index_generic()
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/hidden', methods=['GET'])
@auth.login_required
def index_hidden():
    """Render the index restricted to hidden captures. Requires authentication."""
    only_hidden = True
    return index_generic(show_hidden=only_hidden)
|
2020-06-26 12:07:25 +02:00
|
|
|
|
2020-06-13 02:49:07 +02:00
|
|
|
|
|
|
|
@app.route('/cookies', methods=['GET'])
def cookies_lookup():
    """Render the list of indexed cookie names.

    Each row is (name, frequency, number of domains).
    """
    indexing = Indexing()
    cookies_names = []
    for name, freq in indexing.cookies_names:
        domains_count = indexing.cookies_names_number_domains(name)
        cookies_names.append((name, freq, domains_count))
    return render_template('cookies.html', cookies_names=cookies_names)
|
|
|
|
|
|
|
|
|
2020-09-03 14:39:38 +02:00
|
|
|
@app.route('/ressources', methods=['GET'])
def ressources():
    """Render the list of indexed ressources.

    Each row is (hash, frequency, number of domains, known context for the
    hash, capture UUID, URL node UUID, host node UUID).
    """
    indexing = Indexing()
    rows = []
    for body_hash, freq in indexing.ressources:
        domain_freq = indexing.ressources_number_domains(body_hash)
        known_content = lookyloo.context.find_known_content(body_hash)
        capture_uuid, url_uuid, hostnode_uuid = indexing.get_hash_uuids(body_hash)
        row = (body_hash, freq, domain_freq, known_content.get(body_hash),
               capture_uuid, url_uuid, hostnode_uuid)
        rows.append(row)
    return render_template('ressources.html', ressources=rows)
|
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/rebuild_all')
@auth.login_required
def rebuild_all():
    """Run ``lookyloo.rebuild_all`` and redirect to the index. Requires authentication."""
    lookyloo.rebuild_all()
    index_url = url_for('index')
    return redirect(index_url)
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/rebuild_cache')
@auth.login_required
def rebuild_cache():
    """Run ``lookyloo.rebuild_cache`` and redirect to the index. Requires authentication."""
    lookyloo.rebuild_cache()
    index_url = url_for('index')
    return redirect(index_url)
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/submit', methods=['POST', 'GET'])
def submit():
    """Enqueue a capture described by the JSON body of the request.

    The body is always parsed as JSON, whatever its Content-Type.

    :return: plain-text response holding the value returned by
             ``lookyloo.enqueue_scrape``.
    """
    to_query = request.get_json(force=True)
    perma_uuid = lookyloo.enqueue_scrape(to_query)
    # 'text/text' is not a valid media type; plain text is 'text/plain'.
    return Response(perma_uuid, mimetype='text/plain')
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/scrape', methods=['GET', 'POST'])
def scrape_web():
    """Start a capture from the submitted form, or render the capture form.

    When the form carries a 'url', the capture is run through
    ``lookyloo.scrape`` and the user is redirected to the resulting tree.
    Otherwise the form is rendered with the list of user agents.
    """
    url = request.form.get('url')
    if url:
        # check if the post request has the file part
        uploaded = request.files['cookies'] if 'cookies' in request.files else None
        cookie_file = uploaded.stream if uploaded is not None and uploaded.filename else None

        # Form values are forwarded as received; only the defaults are typed.
        depth: int = request.form.get('depth') or 1  # type: ignore
        listing: bool = request.form.get('listing') or False  # type: ignore
        perma_uuid = lookyloo.scrape(
            url=url,
            cookies_pseudofile=cookie_file,
            depth=depth,
            listing=listing,
            user_agent=request.form.get('user_agent'),
            referer=request.form.get('referer'),  # type: ignore
            os=request.form.get('os'),
            browser=request.form.get('browser'))
        return redirect(url_for('tree', tree_uuid=perma_uuid))

    user_agents: Dict[str, Any] = {}
    if get_config('generic', 'use_user_agents_users'):
        lookyloo.build_ua_file()
        # NOTE: For now, just generate the file, so we have an idea of the size
        # user_agents = get_user_agents('own_user_agents')
    if not user_agents:
        user_agents = get_user_agents()
    user_agents.pop('by_frequency')
    return render_template('scrape.html', user_agents=user_agents)
|
|
|
|
|
|
|
|
|
2020-06-13 02:49:07 +02:00
|
|
|
@app.route('/cookies/<string:cookie_name>', methods=['GET'])
def cookies_name_detail(cookie_name: str):
    """Render the captures and domains associated with a cookie name."""
    captures, domains = lookyloo.get_cookie_name_investigator(cookie_name)
    template_args = {'cookie_name': cookie_name, 'domains': domains, 'captures': captures}
    return render_template('cookie_name.html', **template_args)
|
2020-06-13 02:49:07 +02:00
|
|
|
|
2020-06-19 00:25:24 +02:00
|
|
|
|
|
|
|
@app.route('/body_hashes/<string:body_hash>', methods=['GET'])
def body_hash_details(body_hash: str):
    """Render the captures and domains associated with a body hash."""
    captures, domains = lookyloo.get_body_hash_investigator(body_hash)
    template_args = {'body_hash': body_hash, 'domains': domains, 'captures': captures}
    return render_template('body_hash.html', **template_args)
|
|
|
|
|
2020-06-26 12:07:25 +02:00
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
# ##### Methods related to a specific URLNode #####
|
|
|
|
|
|
|
|
@app.route('/tree/<string:tree_uuid>/url/<string:node_uuid>/request_cookies', methods=['GET'])
def urlnode_request_cookies(tree_uuid: str, node_uuid: str):
    """Download the request cookies of a URL node as indented JSON text.

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the URL node in that capture.
    :return: the file as an attachment, or a plain-text 404 response when
             the node has no request cookie.
    """
    urlnode = lookyloo.get_urlnode_from_tree(tree_uuid, node_uuid)
    if not urlnode.request_cookie:
        # A view must not return None: Flask would answer with a 500 error.
        return Response('No request cookies.', status=404, mimetype='text/plain')

    content = BytesIO(json.dumps(urlnode.request_cookie, indent=2).encode())
    return send_file(content, mimetype='text/plain', as_attachment=True,
                     attachment_filename='request_cookies.txt')
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/tree/<string:tree_uuid>/url/<string:node_uuid>/response_cookies', methods=['GET'])
def urlnode_response_cookies(tree_uuid: str, node_uuid: str):
    """Download the response cookies of a URL node as indented JSON text.

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the URL node in that capture.
    :return: the file as an attachment, or a plain-text 404 response when
             the node has no response cookie.
    """
    urlnode = lookyloo.get_urlnode_from_tree(tree_uuid, node_uuid)
    if not urlnode.response_cookie:
        # A view must not return None: Flask would answer with a 500 error.
        return Response('No response cookies.', status=404, mimetype='text/plain')

    content = BytesIO(json.dumps(urlnode.response_cookie, indent=2).encode())
    return send_file(content, mimetype='text/plain', as_attachment=True,
                     attachment_filename='response_cookies.txt')
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/tree/<string:tree_uuid>/url/<string:node_uuid>/rendered_content', methods=['GET'])
def urlnode_rendered_content(tree_uuid: str, node_uuid: str):
    """Download the rendered HTML of a URL node as a text file.

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the URL node in that capture.
    :return: the file as an attachment, or a plain-text 404 response when
             the node has no rendered HTML.
    """
    urlnode = lookyloo.get_urlnode_from_tree(tree_uuid, node_uuid)
    if not urlnode.rendered_html:
        # A view must not return None: Flask would answer with a 500 error.
        return Response('No rendered content.', status=404, mimetype='text/plain')

    # Copy the content into a fresh buffer positioned at its start.
    content = BytesIO(urlnode.rendered_html.getvalue())
    return send_file(content, mimetype='text/plain',
                     as_attachment=True, attachment_filename='rendered_content.txt')
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/tree/<string:tree_uuid>/url/<string:node_uuid>/posted_data', methods=['GET'])
def urlnode_post_request(tree_uuid: str, node_uuid: str):
    """Download the data posted by a URL node.

    Dicts and lists are pretty-printed as JSON. Text is served as
    'posted_data.txt' (text/plain), anything else as 'posted_data.bin'
    (application/octet-stream).

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the URL node in that capture.
    :return: the file as an attachment, or a plain-text 404 response when
             the node has no posted data.
    """
    urlnode = lookyloo.get_urlnode_from_tree(tree_uuid, node_uuid)
    if not urlnode.posted_data:
        # A view must not return None: Flask would answer with a 500 error.
        return Response('No posted data.', status=404, mimetype='text/plain')

    posted: Union[str, bytes]
    if isinstance(urlnode.posted_data, (dict, list)):
        # JSON blob, pretty print.
        posted = json.dumps(urlnode.posted_data, indent=2)
    else:
        posted = urlnode.posted_data

    if isinstance(posted, str):
        return send_file(BytesIO(posted.encode()), mimetype='text/plain',
                         as_attachment=True, attachment_filename='posted_data.txt')
    # Not text: serve the raw blob.
    return send_file(BytesIO(posted), mimetype='application/octet-stream',
                     as_attachment=True, attachment_filename='posted_data.bin')
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/tree/<string:tree_uuid>/url/<string:node_uuid>/ressource', methods=['POST', 'GET'])
def get_ressource(tree_uuid: str, node_uuid: str):
    """Download a ressource of a URL node, wrapped in a zip archive.

    On POST, the 'ressource_hash' form field selects the ressource. When
    lookyloo finds nothing, the archive holds a 'file.txt' placeholder.
    """
    h_request = request.form.get('ressource_hash') if request.method == 'POST' else None
    found = lookyloo.get_ressource(tree_uuid, node_uuid, h_request)

    if found:
        filename, content = found
        entry_name, entry_data = filename, content.getvalue()
    else:
        entry_name, entry_data = 'file.txt', b'Unknown Hash'

    archive = BytesIO()
    with ZipFile(archive, 'w', ZIP_DEFLATED) as zfile:
        zfile.writestr(entry_name, entry_data)
    # Rewind so the archive is sent from its first byte.
    archive.seek(0)
    return send_file(archive, mimetype='application/zip',
                     as_attachment=True, attachment_filename='file.zip')
|
|
|
|
|
|
|
|
|
|
|
|
@app.route('/tree/<string:tree_uuid>/url/<string:node_uuid>/hashes', methods=['GET'])
def hashes_urlnode(tree_uuid: str, node_uuid: str):
    """Download the hashes of a URL node as a text file, one per line.

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the URL node in that capture.
    """
    hashes = lookyloo.get_hashes(tree_uuid, urlnode_uuid=node_uuid)
    content = BytesIO('\n'.join(hashes).encode())
    # The MIME type was previously misspelled 'test/plain'.
    return send_file(content, mimetype='text/plain', as_attachment=True,
                     attachment_filename='hashes.txt')
|
2020-08-20 19:39:03 +02:00
|
|
|
|
|
|
|
|
2020-10-09 18:05:04 +02:00
|
|
|
@app.route('/tree/<string:tree_uuid>/url/<string:node_uuid>/add_context', methods=['POST'])
@auth.login_required
def add_context(tree_uuid: str, node_uuid: str):
    """Attach user-provided context to a ressource hash. Requires authentication.

    Reads the hash, the legitimate/malicious flags and their optional
    details from the submitted form, and passes them to
    ``lookyloo.add_context``.

    :param tree_uuid: UUID of the capture.
    :param node_uuid: UUID of the URL node holding the ressource.
    :return: a redirect chosen by the 'callback_str' form field: the host
             node popup, the ressources page, or the tree view of the
             capture for any other value.
    """
    context_data = request.form
    ressource_hash: str = context_data.get('hash_to_contextualize')  # type: ignore
    hostnode_uuid: str = context_data.get('hostnode_uuid')  # type: ignore
    callback_str: str = context_data.get('callback_str')  # type: ignore
    legitimate: bool = bool(context_data.get('legitimate'))
    malicious: bool = bool(context_data.get('malicious'))

    details: Dict[str, Dict] = {'malicious': {}, 'legitimate': {}}
    if malicious:
        # Only the fields that were actually filled in are stored.
        malicious_details = {}
        if context_data.get('malicious_type'):
            malicious_details['type'] = context_data['malicious_type']
        if context_data.get('malicious_target'):
            malicious_details['target'] = context_data['malicious_target']
        details['malicious'] = malicious_details
    if legitimate:
        legitimate_details = {}
        if context_data.get('legitimate_domain'):
            legitimate_details['domain'] = context_data['legitimate_domain']
        if context_data.get('legitimate_description'):
            legitimate_details['description'] = context_data['legitimate_description']
        details['legitimate'] = legitimate_details

    lookyloo.add_context(tree_uuid, node_uuid, ressource_hash, legitimate, malicious, details)

    if callback_str == 'hostnode_popup':
        return redirect(url_for('hostnode_popup', tree_uuid=tree_uuid, node_uuid=hostnode_uuid))
    if callback_str == 'ressources':
        return redirect(url_for('ressources'))
    # Missing or unknown callback: a view must not return None (Flask would
    # answer with a 500 error), so go back to the tree of the capture.
    return redirect(url_for('tree', tree_uuid=tree_uuid))
|
2020-08-25 15:51:08 +02:00
|
|
|
|
|
|
|
|
2020-06-29 17:23:01 +02:00
|
|
|
# Query API
|
2020-06-29 11:59:01 +02:00
|
|
|
|
2020-06-26 12:07:25 +02:00
|
|
|
@app.route('/json/<string:tree_uuid>/redirects', methods=['GET'])
def json_redirects(tree_uuid: str):
    """Return the captured URL and its redirects as JSON.

    An 'error' entry is returned when the capture has no cache entry, and
    an 'info' entry is added to the response when there are no redirects.
    """
    cache = lookyloo.capture_cache(tree_uuid)
    if not cache:
        return {'error': 'UUID missing in cache, try again later.'}

    response: Dict[str, Any] = {'url': cache['url'], 'redirects': []}
    to_return: Dict[str, Any] = {'response': response}
    if not cache['redirects']:
        response['info'] = 'No redirects'
        return to_return

    # NOTE(review): the index page compares this field with the string '1';
    # if it is always a non-empty string here, the reload runs every time.
    if cache['incomplete_redirects']:
        # Trigger tree build, get all redirects
        lookyloo.load_tree(tree_uuid)
        cache = lookyloo.capture_cache(tree_uuid)
    if cache:
        # The cache may have gone missing after the reload.
        response['redirects'] = cache['redirects']

    return jsonify(to_return)
|