feat: Add parameter to set amount of time to delete, add several optimizations and safeguards

This commit is contained in:
Carlos Solís 2025-03-11 09:58:00 -06:00
parent 6229d79089
commit b6bc842221

View file

@ -1,16 +1,20 @@
#!/bin/bash
#Check for mariadb vs. mysql
dbengine=""
dboptimizeengine=""
if [[ -n $(type mariadb) ]]; then
dbengine="mariadb"
dboptimizeengine="mariadb-optimize"
elif [[ -n $(type mysql) ]]; then
dbengine="mysql"
dboptimizeengine="mysqloptimize"
else
exit
fi
intense_optimizations=${1:-"0"}
period_amount=${2:-"12"}
db="friendica"
period="1 MONTH"
period="${period_amount} MONTH"
tmpfile=/tmp/friendica-delete-old-users.csv
url=friendica.example.net
avatarfolder=/var/www/friendica/avatar
@ -44,58 +48,61 @@ loop() {
apcontactcount=$("${dbengine}" "${db}" -N -B -q -e "delete from \`apcontact\` where \`uri-id\` = ${id}; select row_count();" || echo 0)
diasporacontactcount=$("${dbengine}" "${db}" -N -B -q -e "delete from \`diaspora-contact\` where \`uri-id\` = ${id}; select row_count();" || echo 0)
while read -r tmp_counter tmp_picturecount tmp_postthreadcount tmp_postthreadusercount tmp_postusercount tmp_posttagcount tmp_postcontentcount tmp_postcount tmp_photocount tmp_contactcount tmp_apcontactcount tmp_diasporacontactcount; do
if [[ "${tmp_counter}" -gt "${counter}" ]]; then
counter=$((tmp_counter + 1))
if [[ -n "${tmp_counter}" && -n "${tmp_picturecount}" && -n "${tmp_postthreadcount}" && -n "${tmp_postthreadusercount}" && -n "${tmp_postusercount}" && -n "${tmp_posttagcount}" && -n "${tmp_postcontentcount}" && -n "${tmp_postcount}" && -n "${tmp_photocount}" && -n "${tmp_contactcount}" && -n "${tmp_apcontactcount}" && -n "${tmp_diasporacontactcount}" ]]; then
picturecount=$((picturecount + tmp_picturecount))
postthreadcount=$((postthreadcount + tmp_postthreadcount))
postthreadusercount=$((postthreadusercount + tmp_postthreadusercount))
postusercount=$((postusercount + tmp_postusercount))
posttagcount=$((posttagcount + tmp_posttagcount))
postcontentcount=$((postcontentcount + tmp_postcontentcount))
postcount=$((postcount + tmp_postcount))
photocount=$((photocount + tmp_photocount))
contactcount=$((contactcount + tmp_contactcount))
apcontactcount=$((apcontactcount + tmp_apcontactcount))
diasporacontactcount=$((diasporacontactcount + tmp_diasporacontactcount))
fi
picturecount=$((picturecount + tmp_picturecount))
postthreadcount=$((postthreadcount + tmp_postthreadcount))
postthreadusercount=$((postthreadusercount + tmp_postthreadusercount))
postusercount=$((postusercount + tmp_postusercount))
posttagcount=$((posttagcount + tmp_posttagcount))
postcontentcount=$((postcontentcount + tmp_postcontentcount))
postcount=$((postcount + tmp_postcount))
photocount=$((photocount + tmp_photocount))
contactcount=$((contactcount + tmp_contactcount))
apcontactcount=$((apcontactcount + tmp_apcontactcount))
diasporacontactcount=$((diasporacontactcount + tmp_diasporacontactcount))
done <"${tmpfile}"
response_left=$(printf "%s %s %s %s@%s " "${counter}" "${id}" "${lastitem::-9}" "${nick}" "${baseurltrimmed}")
response=$(printf "%spicture:%s " "${response}" "${picturecount}")
response=$(printf "%spost-thread:%s " "${response}" "${postthreadcount}")
response=$(printf "%spost-thread-user:%s " "${response}" "${postthreadusercount}")
response=$(printf "%spost-user:%s " "${response}" "${postusercount}")
response=$(printf "%spost-tag:%s " "${response}" "${posttagcount}")
response=$(printf "%spost-content:%s " "${response}" "${postcontentcount}")
response=$(printf "%spost:%s " "${response}" "${postcount}")
response=$(printf "%sphoto:%s " "${response}" "${photocount}")
response=$(printf "%scontact:%s " "${response}" "${contactcount}")
response=$(printf "%sapcontact:%s " "${response}" "${apcontactcount}")
response=$(printf "%sdiaspora-contact:%s " "${response}" "${diasporacontactcount}")
echo "${counter}" "${picturecount}" "${postthreadcount} ${postthreadusercount} ${postusercount} ${posttagcount} ${postcontentcount} ${postcount} ${photocount} ${contactcount} ${apcontactcount} ${diasporacontactcount}" >"${tmpfile}"
#Previous line clearance
#Measure length of string, blank only the excess
#Since this string is panned to both sides, we will need to account for two lengths
final_string_length_left="${#response_left}"
final_string_length_right="${#response}"
final_string_length=$((final_string_length_left + final_string_length_right))
#The string that will be used to insert the blanks
blank_string=""
columns_length="${COLUMNS}"
#Account for the case where the string is more than a terminal line long
while [[ "${final_string_length}" -gt "${columns_length}" ]]; do
columns_length=$((columns_length + COLUMNS))
done
blank_string_length=$((columns_length - final_string_length))
#Add enough blank spaces to fill the rest of the line
for ((count = 0; count < "${blank_string_length}"; count++)); do
blank_string=$(printf "%s " "${blank_string}")
done
#Add backspaces to align the next output
for ((count = 0; count < $((final_string_length + blank_string_length)); count++)); do
response_left=$(printf "\b%s" "${response_left}")
done
response=$(printf "%s%s%s" "${response_left}" "${blank_string}" "${response}")
printf "%s\r" "${response}"
if [[ -n "${counter}" && -n "${picturecount}" && -n "${postthreadcount}" && -n "${postthreadusercount}" && -n "${postusercount}" && -n "${posttagcount}" && -n "${postcontentcount}" && -n "${postcount}" && -n "${photocount}" && -n "${contactcount}" && -n "${apcontactcount}" && -n "${diasporacontactcount}" ]]; then
echo "${counter}" "${picturecount}" "${postthreadcount} ${postthreadusercount} ${postusercount} ${posttagcount} ${postcontentcount} ${postcount} ${photocount} ${contactcount} ${apcontactcount} ${diasporacontactcount}" >"${tmpfile}"
fi
if [[ -n "${lastitem}" && "${#lastitem}" -gt 9 ]]; then
response_left=$(printf "%s %s %s %s@%s " "${counter}" "${id}" "${lastitem::-9}" "${nick}" "${baseurltrimmed}")
response=$(printf "%spicture:%s " "${response}" "${picturecount}")
response=$(printf "%spost-thread:%s " "${response}" "${postthreadcount}")
response=$(printf "%spost-thread-user:%s " "${response}" "${postthreadusercount}")
response=$(printf "%spost-user:%s " "${response}" "${postusercount}")
response=$(printf "%spost-tag:%s " "${response}" "${posttagcount}")
response=$(printf "%spost-content:%s " "${response}" "${postcontentcount}")
response=$(printf "%spost:%s " "${response}" "${postcount}")
response=$(printf "%sphoto:%s " "${response}" "${photocount}")
response=$(printf "%scontact:%s " "${response}" "${contactcount}")
response=$(printf "%sapcontact:%s " "${response}" "${apcontactcount}")
response=$(printf "%sdiaspora-contact:%s " "${response}" "${diasporacontactcount}")
#Previous line clearance
#Measure length of string, blank only the excess
#Since this string is panned to both sides, we will need to account for two lengths
final_string_length_left="${#response_left}"
final_string_length_right="${#response}"
final_string_length=$((final_string_length_left + final_string_length_right))
#The string that will be used to insert the blanks
blank_string=""
columns_length="${COLUMNS}"
#Account for the case where the string is more than a terminal line long
while [[ "${final_string_length}" -gt "${columns_length}" ]]; do
columns_length=$((columns_length + COLUMNS))
done
blank_string_length=$((columns_length - final_string_length))
#Add enough blank spaces to fill the rest of the line
for ((count = 0; count < "${blank_string_length}"; count++)); do
blank_string=$(printf "%s " "${blank_string}")
done
#Add backspaces to align the next output
for ((count = 0; count < $((final_string_length + blank_string_length)); count++)); do
response_left=$(printf "\b%s" "${response_left}")
done
response=$(printf "%s%s%s" "${response_left}" "${blank_string}" "${response}")
printf "%s\r" "${response}"
fi
}
#Check if our dependencies are installed
@ -104,7 +111,14 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
touch "${tmpfile}"
echo "0 0 0 0 0 0 0 0 0 0 0 0" >"${tmpfile}"
if [[ "${intense_optimizations}" -gt 0 ]]; then
"${dbengine}" "${db}" -N -B -q -e "alter table \`contact\` add index if not exists \`contact_baseurl\` (baseurl)"
"${dbengine}" "${db}" -v -e "\
alter table \`contact\` add index if not exists \`tmp_contact_baseurl\` (baseurl); \
alter table \`post-thread\` add index if not exists \`tmp_post_thread_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`post-thread-user\` add index if not exists \`tmp_post_thread_user_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`post-user\` add index if not exists \`tmp_post_user_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`post\` add index if not exists \`tmp_post_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`photo\` add index if not exists \`tmp_photo_id\` (\`contact-id\`); \
"
fi
counter=0
was_empty=0
@ -114,7 +128,7 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
counter=$((counter + 1))
current_counter=$((current_counter + 1))
loop "${id}" "${nick}" "${baseurl}" "${lastitem}" "${counter}" &
if [[ $(jobs -r -p | wc -l) -ge $(($(getconf _NPROCESSORS_ONLN) * 1)) ]]; then
if [[ $(jobs -r -p | wc -l) -ge $(($(getconf _NPROCESSORS_ONLN) * 2)) ]]; then
wait -n
fi
done < <("${dbengine}" "${db}" -N -B -q -e \
@ -122,7 +136,11 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
c.\`id\` not in (select \`cid\` from \`user-contact\`) and \
c.\`id\` not in (select \`uid\` from \`user\`) and \
c.\`id\` not in ( select \`contact-id\` from \`group_member\`) and \
c.\`contact-type\` != 4 and not pending and \`last-item\` < CURDATE() - INTERVAL ${period} limit 1000")
c.\`contact-type\` != 4 and not pending and \`last-item\` < CURDATE() - INTERVAL ${period} and \
c.\`nick\` not in ('threads.sys', 'relay', 'friendica', 'sharkey', 'bot', 'catodon', \
'flipboard', 'lemmy', 'mitra', 'mstdn_bot', 'peertube', 'piefed', 'admin') \
limit 1000")
#not regexp_replace(c.\`nick\`, '[[:punct:]].*', '') like regexp_replace( replace(c.\`baseurl\`, 'https://', ''), '[[:punct:]].+', '')
wait
if [[ "${current_counter}" -eq 0 ]]; then
was_empty=1
@ -130,14 +148,22 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
done
printf "\n\r"
if [[ "${intense_optimizations}" -gt 0 ]]; then
"${dbengine}" "${db}" -N -B -q -e "alter table \`post-thread\` auto_increment = 1; \
"${dbengine}" "${db}" -v -e "\
alter table \`post-thread\` auto_increment = 1; \
alter table \`post-thread-user\` auto_increment = 1; \
alter table \`post-user\` auto_increment = 1; \
alter table \`post-tag\` auto_increment = 1; \
alter table \`post\` auto_increment = 1; \
alter table \`photo\` auto_increment = 1; \
alter table \`contact\` auto_increment = 1"
"${dbengine}" "${db}" -N -B -q -e "alter table \`contact\` drop index \`contact_baseurl\`"
alter table \`contact\` auto_increment = 1; \
alter table \`contact\` drop index \`tmp_contact_baseurl\`; \
alter table \`post-thread\` drop index \`tmp_post_thread_id\`; \
alter table \`post-thread-user\` drop index \`tmp_post_thread_user_id\`; \
alter table \`post-user\` drop index \`tmp_post_user_id\`; \
alter table \`post\` drop index \`tmp_post_id\`; \
alter table \`photo\` drop index\`tmp_photo_id\`; \
"
"${dboptimizeengine}" "${db}"
fi
rm -rf "${tmpfile}"
date