Block skylinks in batches

This commit is contained in:
Filip Rysavy 2021-12-13 17:35:00 +01:00
parent d00b1f68bd
commit b4e2eec2fe
No known key found for this signature in database
GPG Key ID: EA1F430401C92D99
3 changed files with 46 additions and 17 deletions

View File

@ -0,0 +1 @@
- Block skylinks in batches to improve performance.

View File

@ -8,6 +8,9 @@
set -e # exit on first error
# Number of skylinks to block within one batch
BATCH_SIZE=1000
if [ -z "$1" ]; then
echo "Please provide either a skylink or file with skylinks separated by new lines" && exit 1
fi
@ -34,23 +37,45 @@ else
skylinks=("$1") # just single skylink passed as input argument
fi
for skylink in "${skylinks[@]}";
do
echo ".. ⌁ Blocking skylink ${skylink}"
# Add to Sia blocklist
docker exec sia siac skynet blocklist add "${skylink}"
# Remove from NGINX cache
# NOTE:
# If there are changes to how the NGINX cache is being cleared, the same
# changes need to be applied to the /setup-scripts/blocklist-airtable.py
# script.
cached_files_command="find /data/nginx/cache/ -type f | xargs -r grep -Els '^Skynet-Skylink: ${skylink}'"
docker exec -it nginx bash -c "${cached_files_command} | xargs -r rm"
echo ".. ⌁ Skylink ${skylink} Blocked"
echo "--------------------------------------------"
# Block skylinks in batches
skylinks_len=${#skylinks[@]}
for (( i = 0; i < $skylinks_len; i++ )); do
# Add skylink to batch
skylink="${skylinks[$i]}"
echo ".. ⌁ Adding skylink ${skylink} to batch..."
batch_skylinks+=("$skylink")
# For performance reasons on each iteration we do not block a single
# skylink, but we block skylinks in batches with BATCH_SIZE size mainly
# because of nginx cache search.
# If (batch len == batch size) or (we have last batch):
if (( ${#batch_skylinks[@]} == $BATCH_SIZE || $i == $skylinks_len - 1 )); then
echo "--------------------------------------------"
# Add to Sia blocklist
echo "Blocking batch skylinks in skyd..."
skylinks_space_separated="$(IFS=' '; echo "${batch_skylinks[*]}")"
docker exec sia siac skynet blocklist add $skylinks_space_separated
# Remove from NGINX cache
# NOTE:
# If there are changes to how the NGINX cache is being cleared, the same
# changes need to be applied to the /setup-scripts/blocklist-airtable.py
# script.
echo "Removing batch skylinks from Nginx cache..."
skylinks_pipe_separated="$(IFS='|'; echo "${batch_skylinks[*]}")"
cached_files_command="find /data/nginx/cache/ -type f | xargs -r grep -Els '^Skynet-Skylink: ($skylinks_pipe_separated)'"
docker exec -it nginx bash -c "${cached_files_command} | xargs -r rm"
# Clear batch
batch_skylinks=()
echo "--------------------------------------------"
fi
done
# Hot reload Nginx to get rid of deleted open files
echo "Hot reloading nginx..."
docker exec nginx nginx -s reload
echo "✓ All done !"

View File

@ -171,6 +171,9 @@ async def block_skylinks_from_airtable():
if cached_files_count == 0:
return print("No nginx cached files matching blocked skylinks were found")
else:
print("Hot reloading nginx")
exec('docker exec nginx nginx -s reload')
message = (
"Purged " + str(cached_files_count) + " blocklisted files from nginx cache"