feat: Add parameter to set amount of time to delete, add several optimizations and safeguards

This commit is contained in:
Carlos Solís 2025-03-11 09:58:00 -06:00
parent 6229d79089
commit b6bc842221

View file

@ -1,16 +1,20 @@
#!/bin/bash #!/bin/bash
#Check for mariadb vs. mysql #Check for mariadb vs. mysql
dbengine="" dbengine=""
dboptimizeengine=""
if [[ -n $(type mariadb) ]]; then if [[ -n $(type mariadb) ]]; then
dbengine="mariadb" dbengine="mariadb"
dboptimizeengine="mariadb-optimize"
elif [[ -n $(type mysql) ]]; then elif [[ -n $(type mysql) ]]; then
dbengine="mysql" dbengine="mysql"
dboptimizeengine="mysqloptimize"
else else
exit exit
fi fi
intense_optimizations=${1:-"0"} intense_optimizations=${1:-"0"}
period_amount=${2:-"12"}
db="friendica" db="friendica"
period="1 MONTH" period="${period_amount} MONTH"
tmpfile=/tmp/friendica-delete-old-users.csv tmpfile=/tmp/friendica-delete-old-users.csv
url=friendica.example.net url=friendica.example.net
avatarfolder=/var/www/friendica/avatar avatarfolder=/var/www/friendica/avatar
@ -44,58 +48,61 @@ loop() {
apcontactcount=$("${dbengine}" "${db}" -N -B -q -e "delete from \`apcontact\` where \`uri-id\` = ${id}; select row_count();" || echo 0) apcontactcount=$("${dbengine}" "${db}" -N -B -q -e "delete from \`apcontact\` where \`uri-id\` = ${id}; select row_count();" || echo 0)
diasporacontactcount=$("${dbengine}" "${db}" -N -B -q -e "delete from \`diaspora-contact\` where \`uri-id\` = ${id}; select row_count();" || echo 0) diasporacontactcount=$("${dbengine}" "${db}" -N -B -q -e "delete from \`diaspora-contact\` where \`uri-id\` = ${id}; select row_count();" || echo 0)
while read -r tmp_counter tmp_picturecount tmp_postthreadcount tmp_postthreadusercount tmp_postusercount tmp_posttagcount tmp_postcontentcount tmp_postcount tmp_photocount tmp_contactcount tmp_apcontactcount tmp_diasporacontactcount; do while read -r tmp_counter tmp_picturecount tmp_postthreadcount tmp_postthreadusercount tmp_postusercount tmp_posttagcount tmp_postcontentcount tmp_postcount tmp_photocount tmp_contactcount tmp_apcontactcount tmp_diasporacontactcount; do
if [[ "${tmp_counter}" -gt "${counter}" ]]; then if [[ -n "${tmp_counter}" && -n "${tmp_picturecount}" && -n "${tmp_postthreadcount}" && -n "${tmp_postthreadusercount}" && -n "${tmp_postusercount}" && -n "${tmp_posttagcount}" && -n "${tmp_postcontentcount}" && -n "${tmp_postcount}" && -n "${tmp_photocount}" && -n "${tmp_contactcount}" && -n "${tmp_apcontactcount}" && -n "${tmp_diasporacontactcount}" ]]; then
counter=$((tmp_counter + 1)) picturecount=$((picturecount + tmp_picturecount))
postthreadcount=$((postthreadcount + tmp_postthreadcount))
postthreadusercount=$((postthreadusercount + tmp_postthreadusercount))
postusercount=$((postusercount + tmp_postusercount))
posttagcount=$((posttagcount + tmp_posttagcount))
postcontentcount=$((postcontentcount + tmp_postcontentcount))
postcount=$((postcount + tmp_postcount))
photocount=$((photocount + tmp_photocount))
contactcount=$((contactcount + tmp_contactcount))
apcontactcount=$((apcontactcount + tmp_apcontactcount))
diasporacontactcount=$((diasporacontactcount + tmp_diasporacontactcount))
fi fi
picturecount=$((picturecount + tmp_picturecount))
postthreadcount=$((postthreadcount + tmp_postthreadcount))
postthreadusercount=$((postthreadusercount + tmp_postthreadusercount))
postusercount=$((postusercount + tmp_postusercount))
posttagcount=$((posttagcount + tmp_posttagcount))
postcontentcount=$((postcontentcount + tmp_postcontentcount))
postcount=$((postcount + tmp_postcount))
photocount=$((photocount + tmp_photocount))
contactcount=$((contactcount + tmp_contactcount))
apcontactcount=$((apcontactcount + tmp_apcontactcount))
diasporacontactcount=$((diasporacontactcount + tmp_diasporacontactcount))
done <"${tmpfile}" done <"${tmpfile}"
response_left=$(printf "%s %s %s %s@%s " "${counter}" "${id}" "${lastitem::-9}" "${nick}" "${baseurltrimmed}") if [[ -n "${counter}" && -n "${picturecount}" && -n "${postthreadcount}" && -n "${postthreadusercount}" && -n "${postusercount}" && -n "${posttagcount}" && -n "${postcontentcount}" && -n "${postcount}" && -n "${photocount}" && -n "${contactcount}" && -n "${apcontactcount}" && -n "${diasporacontactcount}" ]]; then
response=$(printf "%spicture:%s " "${response}" "${picturecount}") echo "${counter}" "${picturecount}" "${postthreadcount} ${postthreadusercount} ${postusercount} ${posttagcount} ${postcontentcount} ${postcount} ${photocount} ${contactcount} ${apcontactcount} ${diasporacontactcount}" >"${tmpfile}"
response=$(printf "%spost-thread:%s " "${response}" "${postthreadcount}") fi
response=$(printf "%spost-thread-user:%s " "${response}" "${postthreadusercount}") if [[ -n "${lastitem}" && "${#lastitem}" -gt 9 ]]; then
response=$(printf "%spost-user:%s " "${response}" "${postusercount}") response_left=$(printf "%s %s %s %s@%s " "${counter}" "${id}" "${lastitem::-9}" "${nick}" "${baseurltrimmed}")
response=$(printf "%spost-tag:%s " "${response}" "${posttagcount}") response=$(printf "%spicture:%s " "${response}" "${picturecount}")
response=$(printf "%spost-content:%s " "${response}" "${postcontentcount}") response=$(printf "%spost-thread:%s " "${response}" "${postthreadcount}")
response=$(printf "%spost:%s " "${response}" "${postcount}") response=$(printf "%spost-thread-user:%s " "${response}" "${postthreadusercount}")
response=$(printf "%sphoto:%s " "${response}" "${photocount}") response=$(printf "%spost-user:%s " "${response}" "${postusercount}")
response=$(printf "%scontact:%s " "${response}" "${contactcount}") response=$(printf "%spost-tag:%s " "${response}" "${posttagcount}")
response=$(printf "%sapcontact:%s " "${response}" "${apcontactcount}") response=$(printf "%spost-content:%s " "${response}" "${postcontentcount}")
response=$(printf "%sdiaspora-contact:%s " "${response}" "${diasporacontactcount}") response=$(printf "%spost:%s " "${response}" "${postcount}")
echo "${counter}" "${picturecount}" "${postthreadcount} ${postthreadusercount} ${postusercount} ${posttagcount} ${postcontentcount} ${postcount} ${photocount} ${contactcount} ${apcontactcount} ${diasporacontactcount}" >"${tmpfile}" response=$(printf "%sphoto:%s " "${response}" "${photocount}")
#Previous line clearance response=$(printf "%scontact:%s " "${response}" "${contactcount}")
#Measure length of string, blank only the excess response=$(printf "%sapcontact:%s " "${response}" "${apcontactcount}")
#Since this string is panned to both sides, we will need to account for two lengths response=$(printf "%sdiaspora-contact:%s " "${response}" "${diasporacontactcount}")
final_string_length_left="${#response_left}" #Previous line clearance
final_string_length_right="${#response}" #Measure length of string, blank only the excess
final_string_length=$((final_string_length_left + final_string_length_right)) #Since this string is panned to both sides, we will need to account for two lengths
#The string that will be used to insert the blanks final_string_length_left="${#response_left}"
blank_string="" final_string_length_right="${#response}"
columns_length="${COLUMNS}" final_string_length=$((final_string_length_left + final_string_length_right))
#Account for the case where the string is more than a terminal line long #The string that will be used to insert the blanks
while [[ "${final_string_length}" -gt "${columns_length}" ]]; do blank_string=""
columns_length=$((columns_length + COLUMNS)) columns_length="${COLUMNS}"
done #Account for the case where the string is more than a terminal line long
blank_string_length=$((columns_length - final_string_length)) while [[ "${final_string_length}" -gt "${columns_length}" ]]; do
#Add enough blank spaces to fill the rest of the line columns_length=$((columns_length + COLUMNS))
for ((count = 0; count < "${blank_string_length}"; count++)); do done
blank_string=$(printf "%s " "${blank_string}") blank_string_length=$((columns_length - final_string_length))
done #Add enough blank spaces to fill the rest of the line
#Add backspaces to align the next output for ((count = 0; count < "${blank_string_length}"; count++)); do
for ((count = 0; count < $((final_string_length + blank_string_length)); count++)); do blank_string=$(printf "%s " "${blank_string}")
response_left=$(printf "\b%s" "${response_left}") done
done #Add backspaces to align the next output
response=$(printf "%s%s%s" "${response_left}" "${blank_string}" "${response}") for ((count = 0; count < $((final_string_length + blank_string_length)); count++)); do
printf "%s\r" "${response}" response_left=$(printf "\b%s" "${response_left}")
done
response=$(printf "%s%s%s" "${response_left}" "${blank_string}" "${response}")
printf "%s\r" "${response}"
fi
} }
#Check if our dependencies are installed #Check if our dependencies are installed
@ -104,7 +111,14 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
touch "${tmpfile}" touch "${tmpfile}"
echo "0 0 0 0 0 0 0 0 0 0 0 0" >"${tmpfile}" echo "0 0 0 0 0 0 0 0 0 0 0 0" >"${tmpfile}"
if [[ "${intense_optimizations}" -gt 0 ]]; then if [[ "${intense_optimizations}" -gt 0 ]]; then
"${dbengine}" "${db}" -N -B -q -e "alter table \`contact\` add index if not exists \`contact_baseurl\` (baseurl)" "${dbengine}" "${db}" -v -e "\
alter table \`contact\` add index if not exists \`tmp_contact_baseurl\` (baseurl); \
alter table \`post-thread\` add index if not exists \`tmp_post_thread_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`post-thread-user\` add index if not exists \`tmp_post_thread_user_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`post-user\` add index if not exists \`tmp_post_user_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`post\` add index if not exists \`tmp_post_id\` (\`owner-id\`, \`author-id\`, \`causer-id\`); \
alter table \`photo\` add index if not exists \`tmp_photo_id\` (\`contact-id\`); \
"
fi fi
counter=0 counter=0
was_empty=0 was_empty=0
@ -114,7 +128,7 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
counter=$((counter + 1)) counter=$((counter + 1))
current_counter=$((current_counter + 1)) current_counter=$((current_counter + 1))
loop "${id}" "${nick}" "${baseurl}" "${lastitem}" "${counter}" & loop "${id}" "${nick}" "${baseurl}" "${lastitem}" "${counter}" &
if [[ $(jobs -r -p | wc -l) -ge $(($(getconf _NPROCESSORS_ONLN) * 1)) ]]; then if [[ $(jobs -r -p | wc -l) -ge $(($(getconf _NPROCESSORS_ONLN) * 2)) ]]; then
wait -n wait -n
fi fi
done < <("${dbengine}" "${db}" -N -B -q -e \ done < <("${dbengine}" "${db}" -N -B -q -e \
@ -122,7 +136,11 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
c.\`id\` not in (select \`cid\` from \`user-contact\`) and \ c.\`id\` not in (select \`cid\` from \`user-contact\`) and \
c.\`id\` not in (select \`uid\` from \`user\`) and \ c.\`id\` not in (select \`uid\` from \`user\`) and \
c.\`id\` not in ( select \`contact-id\` from \`group_member\`) and \ c.\`id\` not in ( select \`contact-id\` from \`group_member\`) and \
c.\`contact-type\` != 4 and not pending and \`last-item\` < CURDATE() - INTERVAL ${period} limit 1000") c.\`contact-type\` != 4 and not pending and \`last-item\` < CURDATE() - INTERVAL ${period} and \
c.\`nick\` not in ('threads.sys', 'relay', 'friendica', 'sharkey', 'bot', 'catodon', \
'flipboard', 'lemmy', 'mitra', 'mstdn_bot', 'peertube', 'piefed', 'admin') \
limit 1000")
#not regexp_replace(c.\`nick\`, '[[:punct:]].*', '') like regexp_replace( replace(c.\`baseurl\`, 'https://', ''), '[[:punct:]].+', '')
wait wait
if [[ "${current_counter}" -eq 0 ]]; then if [[ "${current_counter}" -eq 0 ]]; then
was_empty=1 was_empty=1
@ -130,14 +148,22 @@ if [[ -n $(type curl) && -n "${dbengine}" && -n $(type "${dbengine}") && -n $(ty
done done
printf "\n\r" printf "\n\r"
if [[ "${intense_optimizations}" -gt 0 ]]; then if [[ "${intense_optimizations}" -gt 0 ]]; then
"${dbengine}" "${db}" -N -B -q -e "alter table \`post-thread\` auto_increment = 1; \ "${dbengine}" "${db}" -v -e "\
alter table \`post-thread\` auto_increment = 1; \
alter table \`post-thread-user\` auto_increment = 1; \ alter table \`post-thread-user\` auto_increment = 1; \
alter table \`post-user\` auto_increment = 1; \ alter table \`post-user\` auto_increment = 1; \
alter table \`post-tag\` auto_increment = 1; \ alter table \`post-tag\` auto_increment = 1; \
alter table \`post\` auto_increment = 1; \ alter table \`post\` auto_increment = 1; \
alter table \`photo\` auto_increment = 1; \ alter table \`photo\` auto_increment = 1; \
alter table \`contact\` auto_increment = 1" alter table \`contact\` auto_increment = 1; \
"${dbengine}" "${db}" -N -B -q -e "alter table \`contact\` drop index \`contact_baseurl\`" alter table \`contact\` drop index \`tmp_contact_baseurl\`; \
alter table \`post-thread\` drop index \`tmp_post_thread_id\`; \
alter table \`post-thread-user\` drop index \`tmp_post_thread_user_id\`; \
alter table \`post-user\` drop index \`tmp_post_user_id\`; \
alter table \`post\` drop index \`tmp_post_id\`; \
alter table \`photo\` drop index\`tmp_photo_id\`; \
"
"${dboptimizeengine}" "${db}"
fi fi
rm -rf "${tmpfile}" rm -rf "${tmpfile}"
date date