AIL-framework/var/www/modules/search/Flask_search.py

#!/usr/bin/env python3
# -*-coding:UTF-8 -*

'''
    Flask functions and routes for the search page
'''
import redis
import json
import os
import datetime
import flask
from flask import Flask, render_template, jsonify, request, Blueprint

import Paste
from whoosh import index
from whoosh.fields import Schema, TEXT, ID
from whoosh.qparser import QueryParser

# ============ VARIABLES ============
import Flask_config

# Flask application object and parsed configuration, both shared through Flask_config.
app = Flask_config.app
cfg = Flask_config.cfg
# Handle queried with smembers(<query>) to find pastes by name
# (presumably a Redis connection -- confirm in Flask_config).
r_serv_pasteName = Flask_config.r_serv_pasteName
# Handle queried with smembers('tag:' + <paste path>) to fetch the tags of a paste.
r_serv_metadata = Flask_config.r_serv_metadata
# Upper bound on the number of characters of paste content returned as a preview.
max_preview_char = Flask_config.max_preview_char
# Handed to the search.html template as ``char_to_display``.
max_preview_modal = Flask_config.max_preview_modal
# Forwarded unchanged to the template and to the JSON response of the search routes.
bootstrap_label = Flask_config.bootstrap_label


# Directory holding one sub-directory per index ([Indexer] "path" option, relative to $AIL_HOME).
baseindexpath = os.path.join(os.environ['AIL_HOME'], cfg.get("Indexer", "path"))
# File listing the known index names ([Indexer] "register" option, relative to $AIL_HOME).
indexRegister_path = os.path.join(os.environ['AIL_HOME'],
                         cfg.get("Indexer", "register"))

# Blueprint carrying the routes defined in this module; it is registered on ``app`` at the end of the file.
searches = Blueprint('searches', __name__, template_folder='templates')

# ============ FUNCTIONS ============
def get_current_index():
    """Return the path of the newest index named in the register file.

    The register file contains whitespace-separated index names (format
    ``time1\\ntime2``). The names are sorted as strings and the greatest one
    is joined to ``baseindexpath``. When the register is empty the
    placeholder name ``"no-index"`` is used instead.
    """
    with open(indexRegister_path, "r") as register:
        registered = sorted(register.read().split())  # format [time1\ntime2]
    newest = registered[-1].strip('\n\r') if registered else "no-index"
    return os.path.join(baseindexpath, newest)

def get_index_list(selected_index=""):
    """List the index directories found under ``baseindexpath``.

    Each entry is a ``[value, name, flag]`` list where ``value`` is the
    directory name, ``name`` is a display label built from the ISO date, the
    directory size divided by 1000*1000 (true division) and the item count,
    and ``flag`` tells whether the directory is the last path component of
    ``selected_index``.

    Entries are ordered by directory name, descending; the special
    ``old_index`` directory, when present, is always placed last.
    """
    dated_entries = []
    legacy_entry = None
    for entry_name in os.listdir(baseindexpath):
        if not os.path.isdir(os.path.join(baseindexpath, entry_name)):
            continue
        label = "{} - {} Mb ({} Items)".format(
            to_iso_date(entry_name),
            get_dir_size(entry_name) / (1000*1000),
            get_item_count(entry_name))
        is_selected = entry_name == selected_index.rpartition('/')[2]
        row = [entry_name, label, is_selected]
        if entry_name == "old_index":
            legacy_entry = row
        else:
            dated_entries.append(row)

    dated_entries.sort(key=lambda row: row[0], reverse=True)
    if legacy_entry is not None:
        dated_entries.append(legacy_entry)
    return dated_entries

def get_dir_size(directory):
    """Return the cumulated size, in bytes, of the files of an index directory.

    Args:
        directory: Name of the index directory, relative to ``baseindexpath``.

    Returns:
        The sum of ``os.path.getsize`` over every file found while walking the
        directory tree. Files that cannot be stat'ed (for example because they
        disappeared between the listing and the size lookup) are skipped one by
        one, so a single missing file no longer discards the sizes of all its
        siblings. A directory that does not exist yields 0.
    """
    total = 0
    root = os.path.join(baseindexpath, directory)
    for dirpath, _subdirs, filenames in os.walk(root):
        for filename in filenames:
            try:
                total += os.path.getsize(os.path.join(dirpath, filename))
            except OSError:  # file disappeared (or is unreadable): ignore it only
                continue
    return total

def get_item_count(dirs):
    """Return ``doc_count_all()`` of the whoosh index stored in directory *dirs*.

    *dirs* is the name of an index directory relative to ``baseindexpath``.
    """
    index_path = os.path.join(baseindexpath, dirs)
    return index.open_dir(index_path).doc_count_all()

def to_iso_date(timestamp):
    """Convert an index name into a ``YYYY-MM-DD`` date string.

    *timestamp* is converted with ``int()`` and interpreted as a POSIX
    timestamp in local time. The special name ``"old_index"`` is returned
    unchanged.
    """
    if timestamp != "old_index":
        moment = datetime.datetime.fromtimestamp(int(timestamp))
        return moment.date().isoformat()
    return "old_index"


# ============ ROUTES ============

def _search_paste_summary(path):
    """Collect what the search page displays for the paste stored at *path*.

    Returns:
        A ``(preview, date, size, tags)`` tuple: the first
        ``max_preview_char`` characters of the content, the paste date
        formatted as ``YYYY/MM/DD``, the paste size and a list of
        ``(label, complete_tag)`` tuples built from the ``tag:<path>`` set.
    """
    paste = Paste.Paste(path)
    # Plain slicing copes with short and empty content and, unlike the former
    # ``len(content)-1`` bound, does not drop the last character.
    preview = paste.get_p_content()[:max_preview_char]
    raw_date = str(paste._get_p_date())
    date = raw_date[0:4] + '/' + raw_date[4:6] + '/' + raw_date[6:]
    size = paste._get_p_size()

    tags = []
    for complete_tag in r_serv_metadata.smembers('tag:' + path):
        parts = complete_tag.split('=')
        if len(parts) > 1:
            if parts[1] != '':
                label = parts[1][1:-1]
            # no value
            else:
                label = parts[0][1:-1]
        # use for custom tags
        else:
            label = parts[0]
        tags.append((label, complete_tag))
    return preview, date, size, tags


@searches.route("/search", methods=['POST'])
def search():
    """Render the first page of results for the submitted search query.

    Form fields:
        query: Text looked up as a paste name and as a full-text query.
        index_name: Name of the index directory to search, or ``"0"`` to use
            the most recent index.

    Results are the pastes whose name matches the query, followed by the first
    ``num_elem_to_get`` full-text hits. ``num_res`` is the total number of
    full-text hits. Every per-result list handed to the template (``r``,
    ``c``, ``paste_date``, ``paste_size``, ``paste_tags``) has one entry per
    result, in the same order.
    """
    query = request.form['query']
    index_name = request.form['index_name']
    num_elem_to_get = 50

    # select correct index
    # ``index_name`` comes straight from the client: anything that is not a
    # plain directory name (empty, ".", ".." or containing a path separator)
    # could escape ``baseindexpath``, so it falls back to the current index.
    if (index_name is None or index_name in ("", "0", ".", "..")
            or os.path.basename(index_name) != index_name):
        selected_index = get_current_index()
    else:
        selected_index = os.path.join(baseindexpath, index_name)

    # Search filename
    paths = list(r_serv_pasteName.smembers(query))

    # Search full line
    ix = index.open_dir(selected_index)
    with ix.searcher() as searcher:
        parsed_query = QueryParser("content", ix.schema).parse(query)
        results = searcher.search_page(parsed_query, 1, pagelen=num_elem_to_get)
        paths.extend(hit.items()[0][1] for hit in results)
        # The page already knows the total number of hits; no second search needed.
        num_res = results.total

    r = []  # complete path
    c = []  # preview of the paste content
    paste_date = []
    paste_size = []
    paste_tags = []
    for path in paths:
        preview, date, size, tags = _search_paste_summary(path)
        r.append(path)
        c.append(preview)
        paste_date.append(date)
        paste_size.append(size)
        # Tags are collected for filename matches too, which keeps
        # ``paste_tags`` aligned with the other per-result lists.
        paste_tags.append(tags)

    # Listing the indexes walks every index directory: do it only once.
    index_list = get_index_list(selected_index)
    index_min = 1
    index_max = len(index_list)
    return render_template("search.html", r=r, c=c,
            query=request.form['query'], paste_date=paste_date,
            paste_size=paste_size, char_to_display=max_preview_modal,
            num_res=num_res, index_min=index_min, index_max=index_max,
            bootstrap_label=bootstrap_label,
            paste_tags=paste_tags,
            index_list=index_list
           )


@searches.route("/get_more_search_result", methods=['POST'])
def get_more_search_result():
    """Return one additional page of full-text search results as JSON.

    Form fields:
        query: Full-text query.
        page_offset: Number of the result page to fetch (converted with ``int``).
        index_name: Name of the index directory to search, or ``"0"`` to use
            the most recent index.

    The JSON object holds the parallel lists ``path_array``,
    ``preview_array``, ``date_array``, ``size_array`` and ``list_tags`` (one
    entry per hit), ``bootstrap_label``, and ``moreData``, which is true when
    the page is full (``num_elem_to_get`` hits), i.e. another page may exist.
    """
    query = request.form['query']
    page_offset = int(request.form['page_offset'])
    index_name = request.form['index_name']
    num_elem_to_get = 50

    # select correct index
    # ``index_name`` comes straight from the client: anything that is not a
    # plain directory name (empty, ".", ".." or containing a path separator)
    # could escape ``baseindexpath``, so it falls back to the current index.
    if (index_name is None or index_name in ("", "0", ".", "..")
            or os.path.basename(index_name) != index_name):
        selected_index = get_current_index()
    else:
        selected_index = os.path.join(baseindexpath, index_name)

    path_array = []
    preview_array = []
    date_array = []
    size_array = []
    list_tags = []

    ix = index.open_dir(selected_index)
    with ix.searcher() as searcher:
        parsed_query = QueryParser("content", ix.schema).parse(query)
        results = searcher.search_page(parsed_query, page_offset, num_elem_to_get)
        for hit in results:
            path = hit.items()[0][1]
            path_array.append(path)
            paste = Paste.Paste(path)
            # Plain slicing copes with short and empty content and, unlike the
            # former ``len(content)-1`` bound, keeps the last character.
            preview_array.append(paste.get_p_content()[:max_preview_char])
            raw_date = str(paste._get_p_date())
            date_array.append(raw_date[0:4] + '/' + raw_date[4:6] + '/' + raw_date[6:])
            size_array.append(paste._get_p_size())

            labels = []
            for tag in r_serv_metadata.smembers('tag:' + path):
                parts = tag.split('=')
                if len(parts) > 1:
                    if parts[1] != '':
                        label = parts[1][1:-1]
                    # no value
                    else:
                        label = parts[0][1:-1]
                # use for custom tags
                else:
                    label = parts[0]
                labels.append(label)
            list_tags.append(labels)

    to_return = {
        "path_array": path_array,
        "preview_array": preview_array,
        "date_array": date_array,
        "size_array": size_array,
        "list_tags": list_tags,
        "bootstrap_label": bootstrap_label,
        # A full page means there may be more results to fetch.
        "moreData": len(path_array) >= num_elem_to_get,  # pagelength
    }
    return jsonify(to_return)


# ========= REGISTRATION =========
# Attach the ``searches`` blueprint (the /search and /get_more_search_result
# routes defined above) to the shared Flask application.
app.register_blueprint(searches)
decode with redis connection 2018-05-04 13:53:29 +02:00			`#!/usr/bin/env python3`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`# --coding:UTF-8 -`

			`'''`
			`Flask functions and routes for the trending modules page`
			`'''`
			`import redis`
			`import json`
			`import os`
Added backward support + renamed index with timestamp 2017-03-15 11:51:35 +01:00			`import datetime`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`import flask`
Draft of new organisation of the web interface. Usage of Flask's blueprint 2017-04-19 11:02:03 +02:00			`from flask import Flask, render_template, jsonify, request, Blueprint`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00
			`import Paste`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`from whoosh import index`
			`from whoosh.fields import Schema, TEXT, ID`
			`from whoosh.qparser import QueryParser`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00
			`# ============ VARIABLES ============`
			`import Flask_config`

			`app = Flask_config.app`
			`cfg = Flask_config.cfg`
			`r_serv_pasteName = Flask_config.r_serv_pasteName`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`r_serv_metadata = Flask_config.r_serv_metadata`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`max_preview_char = Flask_config.max_preview_char`
			`max_preview_modal = Flask_config.max_preview_modal`
clean 2018-06-01 11:26:45 +02:00			`bootstrap_label = Flask_config.bootstrap_label`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00

			`baseindexpath = os.path.join(os.environ['AIL_HOME'], cfg.get("Indexer", "path"))`
frontend python 3.5 upgrade 2018-04-17 16:06:32 +02:00			`indexRegister_path = os.path.join(os.environ['AIL_HOME'],`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`cfg.get("Indexer", "register"))`

Draft of new organisation of the web interface. Usage of Flask's blueprint 2017-04-19 11:02:03 +02:00			`searches = Blueprint('searches', __name__, template_folder='templates')`

Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`# ============ FUNCTIONS ============`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`def get_current_index():`
			`with open(indexRegister_path, "r") as f:`
			`allIndex = f.read()`
Fixed all_index newline bug + added print of what's happening 2017-03-15 14:29:49 +01:00			`allIndex = allIndex.split() # format [time1\ntime2]`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`allIndex.sort()`
Added backward support + renamed index with timestamp 2017-03-15 11:51:35 +01:00			`try:`
			`indexname = allIndex[-1].strip('\n\r')`
			`except IndexError as e:`
			`indexname = "no-index"`
			`indexpath = os.path.join(baseindexpath, indexname)`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`return indexpath`

			`def get_index_list(selected_index=""):`
Changed os.system by os.mkdir + fixed bug during rotation 2017-03-15 14:05:13 +01:00			`temp = []`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`index_list = []`
			`for dirs in os.listdir(baseindexpath):`
			`if os.path.isdir(os.path.join(baseindexpath, dirs)):`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`value = dirs`
Added backward support + renamed index with timestamp 2017-03-15 11:51:35 +01:00			`name = to_iso_date(dirs) + " - " + \`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`str(get_dir_size(dirs) / (1000*1000)) + " Mb " + \`
			`"(" + str(get_item_count(dirs)) + " Items" + ")"`
			`flag = dirs==selected_index.split('/')[-1]`
Changed os.system by os.mkdir + fixed bug during rotation 2017-03-15 14:05:13 +01:00			`if dirs == "old_index":`
			`temp = [value, name, flag]`
			`else:`
			`index_list.append([value, name, flag])`
Added backward support + renamed index with timestamp 2017-03-15 11:51:35 +01:00
Changed os.system by os.mkdir + fixed bug during rotation 2017-03-15 14:05:13 +01:00			`index_list.sort(reverse=True, key=lambda x: x[0])`
			`if len(temp) != 0:`
			`index_list.append(temp)`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`return index_list`

			`def get_dir_size(directory):`
			`cur_sum = 0`
			`for directory, subdirs, files in os.walk(os.path.join(baseindexpath,directory)):`
Added backward support + renamed index with timestamp 2017-03-15 11:51:35 +01:00			`try:`
			`cur_sum += sum(os.path.getsize(os.path.join(directory, name)) for name in files)`
			`except OSError as e: #File disappeared`
			`pass`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`return cur_sum`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`def get_item_count(dirs):`
			`ix = index.open_dir(os.path.join(baseindexpath, dirs))`
			`return ix.doc_count_all()`

Added backward support + renamed index with timestamp 2017-03-15 11:51:35 +01:00			`def to_iso_date(timestamp):`
			`if timestamp == "old_index":`
			`return "old_index"`
			`return str(datetime.datetime.fromtimestamp(int(timestamp))).split()[0]`

Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00
			`# ============ ROUTES ============`

Draft of new organisation of the web interface. Usage of Flask's blueprint 2017-04-19 11:02:03 +02:00			`@searches.route("/search", methods=['POST'])`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`def search():`
			`query = request.form['query']`
			`q = []`
			`q.append(query)`
			`r = [] #complete path`
			`c = [] #preview of the paste content`
			`paste_date = []`
			`paste_size = []`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`paste_tags = []`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`index_name = request.form['index_name']`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`num_elem_to_get = 50`

Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`# select correct index`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`if index_name is None or index_name == "0":`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`selected_index = get_current_index()`
			`else:`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`selected_index = os.path.join(baseindexpath, index_name)`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`# Search filename`
			`for path in r_serv_pasteName.smembers(q[0]):`
			`r.append(path)`
			`paste = Paste.Paste(path)`
frontend python 3.5 upgrade 2018-04-17 16:06:32 +02:00			`content = paste.get_p_content()`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`content_range = max_preview_char if len(content)>max_preview_char else len(content)-1`
			`c.append(content[0:content_range])`
			`curr_date = str(paste._get_p_date())`
			`curr_date = curr_date[0:4]+'/'+curr_date[4:6]+'/'+curr_date[6:]`
			`paste_date.append(curr_date)`
			`paste_size.append(paste._get_p_size())`

			`# Search full line`
			`schema = Schema(title=TEXT(stored=True), path=ID(stored=True), content=TEXT)`

taxonomie + add tags + tags display 2018-05-23 16:58:56 +02:00			`print(selected_index)`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`ix = index.open_dir(selected_index)`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`with ix.searcher() as searcher:`
			`query = QueryParser("content", ix.schema).parse(" ".join(q))`
			`results = searcher.search_page(query, 1, pagelen=num_elem_to_get)`
			`for x in results:`
			`r.append(x.items()[0][1])`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`path = x.items()[0][1]`
			`paste = Paste.Paste(path)`
frontend python 3.5 upgrade 2018-04-17 16:06:32 +02:00			`content = paste.get_p_content()`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`content_range = max_preview_char if len(content)>max_preview_char else len(content)-1`
			`c.append(content[0:content_range])`
			`curr_date = str(paste._get_p_date())`
			`curr_date = curr_date[0:4]+'/'+curr_date[4:6]+'/'+curr_date[6:]`
			`paste_date.append(curr_date)`
			`paste_size.append(paste._get_p_size())`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`p_tags = r_serv_metadata.smembers('tag:'+path)`
			`l_tags = []`
			`for tag in p_tags:`
taxonomie + add tags + tags display 2018-05-23 16:58:56 +02:00			`complete_tag = tag`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`tag = tag.split('=')`
			`if len(tag) > 1:`
			`if tag[1] != '':`
			`tag = tag[1][1:-1]`
			`# no value`
			`else:`
			`tag = tag[0][1:-1]`
			`# use for custom tags`
			`else:`
			`tag = tag[0]`

taxonomie + add tags + tags display 2018-05-23 16:58:56 +02:00			`l_tags.append( (tag, complete_tag) )`
display tag on important paste and search 2018-05-17 11:00:05 +02:00
			`paste_tags.append(l_tags)`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`results = searcher.search(query)`
			`num_res = len(results)`

Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`index_min = 1`
			`index_max = len(get_index_list())`
frontend python 3.5 upgrade 2018-04-17 16:06:32 +02:00			`return render_template("search.html", r=r, c=c,`
			`query=request.form['query'], paste_date=paste_date,`
			`paste_size=paste_size, char_to_display=max_preview_modal,`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`num_res=num_res, index_min=index_min, index_max=index_max,`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`bootstrap_label=bootstrap_label,`
			`paste_tags=paste_tags,`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`index_list=get_index_list(selected_index)`
			`)`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00

Draft of new organisation of the web interface. Usage of Flask's blueprint 2017-04-19 11:02:03 +02:00			`@searches.route("/get_more_search_result", methods=['POST'])`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`def get_more_search_result():`
			`query = request.form['query']`
			`q = []`
			`q.append(query)`
			`page_offset = int(request.form['page_offset'])`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`index_name = request.form['index_name']`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`num_elem_to_get = 50`

Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`# select correct index`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`if index_name is None or index_name == "0":`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`selected_index = get_current_index()`
			`else:`
Added display of number of elements inside the index + changed variables names 2017-03-15 10:07:46 +01:00			`selected_index = os.path.join(baseindexpath, index_name)`
Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`path_array = []`
			`preview_array = []`
			`date_array = []`
			`size_array = []`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`list_tags = []`

Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`schema = Schema(title=TEXT(stored=True), path=ID(stored=True), content=TEXT)`

Added possibility to choose the index in search + Updated search page with jinja2 iter0 2017-03-15 09:39:48 +01:00			`ix = index.open_dir(selected_index)`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`with ix.searcher() as searcher:`
			`query = QueryParser("content", ix.schema).parse(" ".join(q))`
frontend python 3.5 upgrade 2018-04-17 16:06:32 +02:00			`results = searcher.search_page(query, page_offset, num_elem_to_get)`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`for x in results:`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`path = x.items()[0][1]`
			`path_array.append(path)`
			`paste = Paste.Paste(path)`
frontend python 3.5 upgrade 2018-04-17 16:06:32 +02:00			`content = paste.get_p_content()`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`content_range = max_preview_char if len(content)>max_preview_char else len(content)-1`
			`preview_array.append(content[0:content_range])`
			`curr_date = str(paste._get_p_date())`
			`curr_date = curr_date[0:4]+'/'+curr_date[4:6]+'/'+curr_date[6:]`
			`date_array.append(curr_date)`
			`size_array.append(paste._get_p_size())`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`p_tags = r_serv_metadata.smembers('tag:'+path)`
			`l_tags = []`
			`for tag in p_tags:`
			`tag = tag.split('=')`
			`if len(tag) > 1:`
			`if tag[1] != '':`
			`tag = tag[1][1:-1]`
			`# no value`
			`else:`
			`tag = tag[0][1:-1]`
			`# use for custom tags`
			`else:`
			`tag = tag[0]`

			`l_tags.append(tag)`
			`list_tags.append(l_tags)`

Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`to_return = {}`
			`to_return["path_array"] = path_array`
			`to_return["preview_array"] = preview_array`
			`to_return["date_array"] = date_array`
			`to_return["size_array"] = size_array`
display tag on important paste and search 2018-05-17 11:00:05 +02:00			`to_return["list_tags"] = list_tags`
			`to_return["bootstrap_label"] = bootstrap_label`
Splitted Flask_server into module related to website sections 2016-12-09 08:46:37 +01:00			`if len(path_array) < num_elem_to_get: #pagelength`
			`to_return["moreData"] = False`
			`else:`
			`to_return["moreData"] = True`

			`return jsonify(to_return)`


Draft of new organisation of the web interface. Usage of Flask's blueprint 2017-04-19 11:02:03 +02:00			`# ========= REGISTRATION =========`
			`app.register_blueprint(searches)`