# misp-modules/misp_modules/modules/expansion/wiki.py

import json
from SPARQLWrapper import SPARQLWrapper, JSON
# Error payload returned by handler(); the 'error' message is overwritten
# with a specific description before the dict is returned.
misperrors = {'error': 'Error'}

# Attribute types returned by introspection(); handler() reports the
# 'output' types alongside its result value.
mispattributes = {'input': ['text'], 'output': ['text']}

# Module metadata returned by version().
moduleinfo = {
    'version': '0.2',
    'author': 'Roman Graf',
    'description': 'An expansion hover module to extract information from Wikidata to have additional information about particular term for analysis.',
    'module-type': ['hover'],
    'name': 'Wikidata Lookup',
    'logo': 'wikidata.png',
    'requirements': ['SPARQLWrapper python library'],
    'features': 'This module takes a text attribute as input and queries the Wikidata API. If the text attribute is clear enough to define a specific term, the API returns a wikidata link in response.',
    'references': ['https://www.wikidata.org'],
    'input': 'Text attribute.',
    'output': 'Text attribute.',
}

# Configuration entries exposed under moduleinfo['config'] by version();
# empty for this module.
moduleconfig = []

# sample query text 'Microsoft' should provide Wikidata link https://www.wikidata.org/wiki/Q2283 in response
wiki_api_url = 'https://query.wikidata.org/bigdata/namespace/wdq/sparql'
def _escape_sparql_literal(text):
    """Escape *text* for use inside a double-quoted SPARQL string literal."""
    # The backslash has to be handled first, otherwise the backslashes added
    # by the later replacements would themselves be doubled.
    return (
        text.replace('\\', '\\\\')
        .replace('"', '\\"')
        .replace('\n', '\\n')
        .replace('\r', '\\r')
    )


def handler(q=False):
    """Look up the requested text as an English label on Wikidata.

    Args:
        q: JSON-encoded request string carrying the term to look up under
            the ``'text'`` key, or ``False`` when no request was supplied.

    Returns:
        ``False`` when ``q`` is ``False``. The module-level ``misperrors``
        dict (with its ``'error'`` message updated) when the text is missing
        or the Wikidata query fails. Otherwise a dict of the form
        ``{'results': [{'types': [...], 'values': <summary>}]}`` where the
        summary is the value of the first matching item, or a fixed
        "no data" message when the query returned no bindings.
    """
    if q is False:
        return False
    request = json.loads(q)
    text = request.get('text')
    if not text:
        misperrors['error'] = 'Query text missing'
        return misperrors

    sparql = SPARQLWrapper(wiki_api_url, agent='Mozilla/5.0 (Macintosh; Intel Mac OS X 10_11_5) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/50.0.2661.102 Safari/537.36')
    # The text comes from the request, so it is escaped before being embedded
    # in the literal; an unescaped quote or backslash would otherwise break
    # out of the string and alter the query.
    query_string = (
        "SELECT ?item \n"
        "WHERE { \n"
        "?item rdfs:label\"" + _escape_sparql_literal(text) + "\" @en \n"
        "}\n"
    )
    sparql.setQuery(query_string)
    sparql.setReturnFormat(JSON)
    try:
        # The remote call lives inside the try block so that connection and
        # endpoint failures are reported through misperrors as well.
        results = sparql.query().convert()
        result = results["results"]["bindings"]
        summary = result[0]["item"]["value"] if result else 'No additional data found on Wikidata'
    except Exception as e:
        misperrors['error'] = 'wikidata API not accessible {}'.format(e)
        # Return the whole error dict, matching the "Query text missing" path.
        return misperrors

    return {'results': [{'types': mispattributes['output'], 'values': summary}]}
def introspection():
    """Return the module-level ``mispattributes`` mapping.

    The mapping lists the attribute types under its ``'input'`` and
    ``'output'`` keys.
    """
    return mispattributes
def version():
    """Return the module metadata with its configuration list attached.

    Stores ``moduleconfig`` under the ``'config'`` key of the module-level
    ``moduleinfo`` dict (modifying it in place) and returns that same dict.
    """
    moduleinfo.update(config=moduleconfig)
    return moduleinfo