new: [openai chatgpt] OpenAI source bot added

pull/251/head
Alexandre Dulaunoy 2023-08-08 11:45:53 +02:00
parent ebb012515e
commit 495b629d08
No known key found for this signature in database
GPG Key ID: 09E2CD4944E6CBCD
3 changed files with 55 additions and 0 deletions

View File

@ -36,6 +36,7 @@ python3 generate-tenable.py
python3 generate-microsoft-azure-appid.py
python3 generate-chrome-crux-1m.py
python3 generate-digitalside.py
python3 generate-gptbot.py
popd
./jq_all_the_things.sh

View File

@ -0,0 +1,20 @@
{
"description": "OpenAI gptbot crawler (https://openai.com/gptbot-ranges.txt)",
"list": [
"20.15.240.176/28",
"20.15.240.64/27",
"20.15.240.96/28",
"20.15.241.0/28",
"20.15.242.128/27",
"20.15.242.192/28",
"40.83.2.64/28"
],
"matching_attributes": [
"ip-src",
"ip-dst",
"domain|ip"
],
"name": "List of known IP address ranges for OpenAI GPT crawler bot",
"type": "cidr",
"version": 20230808
}

34
tools/generate-gptbot.py Executable file
View File

@ -0,0 +1,34 @@
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
import json
from generator import download_to_file, get_version, write_to_file, get_abspath_source_file, consolidate_networks
def process(file, dst):
    """Build and write the OpenAI GPTBot warninglist from a downloaded file.

    The source file is read as plain text with one CIDR entry per line.
    The entries are consolidated and written out as a warninglist of type
    ``cidr``.

    Args:
        file: Name of the previously downloaded source file; resolved to a
            path with ``get_abspath_source_file``.
        dst: Destination identifier handed to ``write_to_file``.
    """
    with open(get_abspath_source_file(file), 'r') as freetext_file:
        # Strip surrounding whitespace and drop blank lines: an empty line
        # (e.g. a trailing one at the end of the download) would otherwise be
        # passed on as an empty-string entry, which is not a valid CIDR.
        stripped_lines = (line.strip() for line in freetext_file)
        cidrs = [entry for entry in stripped_lines if entry]

    warninglist = {
        'name': 'List of known IP address ranges for OpenAI GPT crawler bot',
        'version': get_version(),
        'description': 'OpenAI gptbot crawler (https://openai.com/gptbot-ranges.txt)',
        'type': 'cidr',
        'list': consolidate_networks(cidrs),
        'matching_attributes': ["ip-src", "ip-dst", "domain|ip"]
    }

    write_to_file(warninglist, dst)
if __name__ == '__main__':
    # Script entry point: fetch the published GPTBot ranges, then turn the
    # downloaded file into the warninglist.
    source_url = "https://openai.com/gptbot-ranges.txt"
    local_copy = "openai-gptbot-ranges.json"

    download_to_file(source_url, local_copy)
    process(local_copy, "openai-gptbot")