2021-03-01 15:47:06 +00:00
|
|
|
#!/usr/bin/env python3
|
|
|
|
|
2021-03-01 15:59:38 +00:00
|
|
|
from bot_utils import setup, send_msg
|
2021-07-18 06:22:32 +00:00
|
|
|
from random import randint
|
|
|
|
from time import sleep
|
2021-03-01 15:47:06 +00:00
|
|
|
|
2021-10-06 11:09:10 +00:00
|
|
|
import traceback
|
|
|
|
import os
|
2021-11-10 12:46:43 +00:00
|
|
|
import sys
|
2021-10-06 11:09:10 +00:00
|
|
|
import re
|
|
|
|
import asyncio
|
|
|
|
import requests
|
|
|
|
import json
|
|
|
|
|
2021-07-16 11:12:58 +00:00
|
|
|
# setup() comes from bot_utils and is not defined in this file; it runs first,
# before any configuration is read.
setup()

# Check and load Airtable environment variables.
# Every name listed here must be set to a non-empty value; each one is then
# exposed as a module-level variable of the same name.
airtable_env_vars = ["AIRTABLE_API_KEY", "AIRTABLE_BASE", "AIRTABLE_TABLE", "AIRTABLE_FIELD"]

for e in airtable_env_vars:
    # Check environment variable is defined (an empty string counts as missing)
    gete = os.getenv(e)
    if not gete:
        sys.exit("Configuration error: Environment variable " + e + " is not defined")
    # Set variable.
    # Assign through the module namespace so the value is stored verbatim.
    # Building Python source text from the value and executing it would break
    # on (or execute) values that contain quotes, backslashes or newlines.
    globals()[e] = gete
|
2021-03-01 22:39:28 +00:00
|
|
|
|
2021-10-06 11:09:10 +00:00
|
|
|
|
2021-07-16 11:12:58 +00:00
|
|
|
async def run_checks():
    """Run the Airtable blocklist sync and report any failure via send_msg.

    Any exception raised by block_skylinks_from_airtable() is formatted as a
    traceback inside a fenced code block and sent with force_notify=True.
    The result of the sync itself is discarded.
    """
    try:
        await block_skylinks_from_airtable()
    except Exception:
        # Top-level boundary: report every error instead of crashing.
        # BaseException subclasses (KeyboardInterrupt, SystemExit, task
        # cancellation) are deliberately left to propagate so the script can
        # still be interrupted.
        trace = traceback.format_exc()
        await send_msg("```\n{}\n```".format(trace), force_notify=True)
|
|
|
|
|
2021-03-01 22:39:28 +00:00
|
|
|
|
|
|
|
def exec(command):
    """Run *command* through the shell and return its standard output.

    The output is returned as text with leading and trailing whitespace
    removed. The command's exit status is ignored and its standard error is
    not captured.

    NOTE: this name shadows the builtin ``exec`` for all code that runs after
    this definition; it is kept because existing callers use it.
    """
    # Use the pipe as a context manager so it is closed (and the child process
    # reaped) as soon as the output has been read.
    with os.popen(command) as pipe:
        return pipe.read().strip()
|
|
|
|
|
2021-03-01 15:47:06 +00:00
|
|
|
|
|
|
|
async def block_skylinks_from_airtable():
    """Sync blocked skylinks from Airtable into siad and purge the nginx cache.

    Steps:
      1. Page through the configured Airtable table, collecting the value of
         AIRTABLE_FIELD from every record (empty values are skipped).
      2. Keep only values made of exactly 46 characters from [a-zA-Z0-9_-];
         everything else is reported through send_msg as an attached list.
      3. POST the valid skylinks to siad's /skynet/blocklist endpoint.
      4. Delete nginx cache files whose ``Skynet-Skylink`` header matches one
         of the blocked skylinks and report how many were removed.

    Failures that are detected here (Airtable or siad answering with an
    unexpected status code, too many rate-limit retries) are reported through
    send_msg and end the run early. The return value is whatever the last
    print/send_msg call returned; run_checks() does not use it.
    """
    print("Pulling blocked skylinks from Airtable via api integration")
    headers = {"Authorization": "Bearer " + AIRTABLE_API_KEY}
    skylinks = []
    offset = None
    retry = 0

    # Keep requesting pages until Airtable stops returning an offset. The loop
    # must not depend on how many skylinks were collected: a page consisting
    # only of empty rows would otherwise be requested again forever.
    while True:
        print(
            "Requesting a batch of records from Airtable with "
            + (offset if offset else "empty")
            + " offset"
            + (" (retry " + str(retry) + ")" if retry else "")
        )
        query_parts = ["fields%5B%5D=" + AIRTABLE_FIELD]
        if offset:
            query_parts.append("offset=" + offset)
        response = requests.get(
            "https://api.airtable.com/v0/"
            + AIRTABLE_BASE
            + "/"
            + AIRTABLE_TABLE
            + "?"
            + "&".join(query_parts),
            headers=headers,
        )

        # rate limited - sleep for 1-10 secs and retry (up to 100 times, ~10 minutes)
        # https://support.airtable.com/hc/en-us/articles/203313985-Public-REST-API
        # > 5 requests per second, per base
        if response.status_code == 429:
            if retry < 100:
                retry = retry + 1
                # asyncio.sleep instead of time.sleep: do not block the event
                # loop while waiting inside a coroutine.
                await asyncio.sleep(randint(1, 10))
                continue
            return await send_msg(
                "Airtable: too many retries, aborting!", force_notify=True
            )
        retry = 0  # reset retry counter

        if response.status_code != 200:
            status_code = str(response.status_code)
            response_text = response.text or "empty response"
            message = (
                "Airtable blocklist integration responded with code "
                + status_code
                + ": "
                + response_text
            )
            return await send_msg(message, force_notify=False)

        data = response.json()

        if not data["records"]:
            return print(
                "Airtable returned 0 records - make sure your configuration is correct"
            )

        # Collect this page's values; skip empty ones, most likely empty rows.
        page_values = [
            entry["fields"].get(AIRTABLE_FIELD, "") for entry in data["records"]
        ]
        skylinks.extend(value for value in page_values if value)

        offset = data.get("offset")
        if not offset:
            break

    print("Airtable returned total " + str(len(skylinks)) + " skylinks to block")

    # Split the returned values into valid skylinks and everything else.
    # fullmatch (rather than search with ^...$) rejects a trailing newline, and
    # the isinstance check turns non-text cells into "invalid" instead of a
    # TypeError. Only validated values reach the shell command further down.
    skylinks_returned = skylinks
    skylinks = []
    rejected = []
    for skylink in skylinks_returned:
        if isinstance(skylink, str) and re.fullmatch("[a-zA-Z0-9_-]{46}", skylink):
            skylinks.append(skylink)
        else:
            rejected.append(str(skylink))

    if rejected:
        # Report each distinct invalid value once, in the order first seen.
        invalid_skylinks = list(dict.fromkeys(rejected))
        message = (
            str(len(invalid_skylinks))
            + " of the skylinks returned from Airtable are not valid"
        )
        await send_msg(message, file=("\n".join(invalid_skylinks)))

    # exec here is this file's shell helper (it shadows the builtin), used to
    # read siad's API password and container IP address via docker.
    apipassword = exec("docker exec sia cat /sia-data/apipassword")
    ipaddress = exec(
        "docker inspect -f '{{range.NetworkSettings.Networks}}{{.IPAddress}}{{end}}' sia"
    )

    print("Sending blocklist request to siad")
    response = requests.post(
        "http://" + ipaddress + ":9980/skynet/blocklist",
        auth=("", apipassword),
        headers={"user-agent": "Sia-Agent"},
        data=json.dumps({"add": skylinks}),
    )

    if response.status_code == 204:
        print("Siad blocklist successfully updated with provided skylink")
    else:
        status_code = str(response.status_code)
        response_text = response.text or "empty response"
        message = (
            "Siad blocklist endpoint responded with code "
            + status_code
            + ": "
            + response_text
        )
        return await send_msg(message, force_notify=False)

    # Remove from NGINX cache
    # NOTE:
    # If there are changes to how the NGINX cache is being cleared, the same
    # changes need to be applied to the /scripts/blocklist-skylink.sh script.
    print("Searching nginx cache for blocked files")
    cached_files_count = 0
    # Skylinks are matched in batches; presumably this keeps each generated
    # shell command to a manageable length (NOTE(review): confirm the reason).
    batch_size = 1000
    for i in range(0, len(skylinks), batch_size):
        cached_files_command = (
            "find /data/nginx/cache/ -type f | xargs -r grep -Els '^Skynet-Skylink: ("
            + "|".join(skylinks[i : i + batch_size])
            + ")'"
        )
        # `rm -v` prints one line per removed file, so `wc -l` is the number of
        # cache files deleted for this batch.
        cached_files_count += int(
            exec(
                'docker exec nginx bash -c "'
                + cached_files_command
                + ' | xargs -r rm -v | wc -l"'
            )
        )

    if cached_files_count == 0:
        return print("No nginx cached files matching blocked skylinks were found")

    message = (
        "Purged " + str(cached_files_count) + " blocklisted files from nginx cache"
    )
    return await send_msg(message)
|
2021-03-01 22:39:28 +00:00
|
|
|
|
|
|
|
|
2021-07-16 11:12:58 +00:00
|
|
|
# Script entry: build the top-level coroutine and drive it to completion on
# the current event loop.
loop = asyncio.get_event_loop()
main_coroutine = run_checks()
loop.run_until_complete(main_coroutine)
|
2021-03-01 16:09:18 +00:00
|
|
|
|
2021-03-01 15:47:06 +00:00
|
|
|
# --- BASH EQUIVALENT
|
2021-03-02 11:43:23 +00:00
|
|
|
# skylinks=$(curl "https://api.airtable.com/v0/${AIRTABLE_BASE}/${AIRTABLE_TABLE}?fields%5B%5D=${AIRTABLE_FIELD}" -H "Authorization: Bearer ${AIRTABLE_API_KEY}" | python3 -c "import sys, json; print('[\"' + '\",\"'.join([entry['fields']['Link'] for entry in json.load(sys.stdin)['records']]) + '\"]')")
|
2021-03-01 15:47:06 +00:00
|
|
|
# apipassword=$(docker exec sia cat /sia-data/apipassword)
|
|
|
|
# ipaddress=$(docker inspect -f '{{range.NetworkSettings.Networks}}{{.IPAddress}}{{end}}' sia)
|
|
|
|
# curl -A "Sia-Agent" --user "":"${apipassword}" --data "{\"add\" : ${skylinks}}" "${ipaddress}:9980/skynet/blocklist"
|