#!/bin/bash
#public-scripts/youtube-download-channel.sh
#Parameters:
#1st parameter: Channel you want to turn into a playlist. Leave blank to save your subscriptions (cookie file required).
channel=${1:-"subscriptions"}
#2nd parameter: Date cutoff for the download. Leave blank to save all videos from the last month.
breaktime=${2:-"today-1month"}
#3rd parameter: Seconds between data requests. Decrease to make downloads faster, but your account may be temporarily blocked if the value is too low.
sleeptime=${3:-"1.0"}
#4th parameter: Whether to export to a FreeTube playlist database (1=on by default, 0=off).
enabledb=${4:-"1"}
#5th parameter: Whether to export to a CSV file (1=on by default, 0=off).
enablecsv=${5:-"1"}
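#Example invocations (the channel handle below is a placeholder):
# ./youtube-download-channel.sh                                       #your subscriptions feed, last month (needs yt-cookies.txt)
# ./youtube-download-channel.sh "SomeChannel"                         #videos from https://www.youtube.com/@SomeChannel from the last month
# ./youtube-download-channel.sh "SomeChannel" "20240101" "2.0" 0 1    #everything since 2024-01-01, slower requests, CSV export only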
#Internal variables:
#Via https://stackoverflow.com/questions/59895/how-do-i-get-the-directory-where-a-bash-script-is-located-from-within-the-script
folder=$(cd -- "$(dirname -- "${BASH_SOURCE[0]}")" &>/dev/null && pwd)
#Required to download your own subscriptions.
#Obtain this file through the procedure listed at
# https://github.com/yt-dlp/yt-dlp/wiki/FAQ#how-do-i-pass-cookies-to-yt-dlp
#and place it next to your script.
cookies="${folder}/yt-cookies.txt"
subfolder="${folder}/subscriptions"
temporary="/tmp/subscriptions-${channel}"
if [[ ! -w "/tmp" ]]; then
    temporary="${subfolder}/subscriptions-${channel}"
fi
archive="${subfolder}/${channel}.txt"
sortcsv="${temporary}/${channel}-sort.csv"
csv="${subfolder}/${channel}.csv"
tmpcsv="${temporary}/${channel}.csv"
json="${subfolder}/${channel}.db"
#Prefer a virtualenv Python and a system, virtualenv or Termux yt-dlp if present.
python="python3"
if [[ -f "/opt/venv/bin/python" ]]; then
    python="/opt/venv/bin/python"
fi
ytdl="yt-dlp"
if [[ -f "/usr/bin/yt-dlp" ]]; then
    ytdl="/usr/bin/yt-dlp"
fi
if [[ -f "/opt/venv/bin/yt-dlp" ]]; then
    ytdl="/opt/venv/bin/yt-dlp"
fi
if [[ -f "/data/data/com.termux/files/usr/bin/yt-dlp" ]]; then
    ytdl="/data/data/com.termux/files/usr/bin/yt-dlp"
fi
if [[ ! -d "${subfolder}" ]]; then
    mkdir -v "${subfolder}"
fi
if [[ ! -d "${temporary}" ]]; then
    mkdir -v "${temporary}"
fi
cd "${temporary}" || exit
if [[ ! -f "${archive}" ]]; then
    touch "${archive}"
fi
#Re-extract previously archived metadata so earlier *.info.json files are reused.
if [[ -f "${subfolder}/${channel}.tar.zst" ]]; then
    if [[ "${channel}" = "subscriptions" ]]; then
        find "${subfolder}" -iname "*.tar.zst" | while read -r c; do tar -xvp -I zstd -f "${c}"; done
    else
        tar -xvp -I zstd -f "${subfolder}/${channel}.tar.zst"
    fi
fi
url="https://www.youtube.com/@${channel}"
if [[ "${channel}" = "subscriptions" ]]; then
url="https://www.youtube.com/feed/subscriptions"
fi
for full_url in "${url}/videos" "${url}/shorts" "${url}/streams"; do
    echo "${full_url}"
    if [[ -f "${cookies}" || "${channel}" = "subscriptions" ]]; then
        #If available, you can use the cookies from your browser directly: replace the line
        # --cookies "${cookies}"
        #below with the following, substituting your browser of choice:
        # --cookies-from-browser "firefox"
        #If this still fails, you can resort to a PO Token. Follow the instructions at
        # https://github.com/yt-dlp/yt-dlp/wiki/PO-Token-Guide
        #and add a new variable with the contents of the PO Token in the form
        # potoken="INSERTYOURPOTOKENHERE"
        #then replace the "--extractor-args" line below with
        # --extractor-args "youtubetab:approximate_date,youtube:player-client=default,mweb;po_token=mweb.gvs+${potoken}" \
        #including the backslash so the multiline command keeps working.
        "${python}" "${ytdl}" "${full_url}" \
            --cookies "${cookies}" \
            --extractor-args "youtubetab:approximate_date" \
            --skip-download --download-archive "${archive}" \
            --dateafter "${breaktime}" \
            --break-on-reject --lazy-playlist --write-info-json \
            --sleep-requests "${sleeptime}" \
            --parse-metadata "video::(?P<formats>)" \
            --parse-metadata "video::(?P<thumbnails>)" \
            --parse-metadata "video::(?P<subtitles>)" \
            --parse-metadata "video::(?P<automatic_captions>)" \
            --parse-metadata "video::(?P<chapters>)" \
            --parse-metadata "video::(?P<heatmap>)" \
            --parse-metadata "video::(?P<tags>)" \
            --parse-metadata "video::(?P<categories>)"
    else
        "${python}" "${ytdl}" "${full_url}" \
            --extractor-args "youtubetab:approximate_date" \
            --skip-download --download-archive "${archive}" \
            --dateafter "${breaktime}" \
            --break-on-reject --lazy-playlist --write-info-json \
            --sleep-requests "${sleeptime}" \
            --parse-metadata "video::(?P<formats>)" \
            --parse-metadata "video::(?P<thumbnails>)" \
            --parse-metadata "video::(?P<subtitles>)" \
            --parse-metadata "video::(?P<automatic_captions>)" \
            --parse-metadata "video::(?P<chapters>)" \
            --parse-metadata "video::(?P<heatmap>)" \
            --parse-metadata "video::(?P<tags>)" \
            --parse-metadata "video::(?P<categories>)"
    fi
done
if [[ ${enablecsv} = 1 ]]; then
    if [[ -f "${tmpcsv}" ]]; then
        rm -rf "${tmpcsv}"
    fi
    touch "${tmpcsv}"
fi

if [[ ${enabledb} = 1 ]]; then
    if [[ -f "${sortcsv}" ]]; then
        rm -rf "${sortcsv}"
    fi
    touch "${sortcsv}"
fi
breaktime_timestamp=$(date -d"${breaktime}" +"%s")
count=0
total=$(find "${temporary}" -type f -iname "*.info.json" | wc -l)
find "${temporary}" -type f -iname "*.info.json" | while read -r x; do
count=$((count + 1))
2025-06-09 15:07:05 +00:00
(
if [[ -f "${x}" && "${channel}" != "subscriptions" && $(jq -rc ".uploader_id" "${x}") != "@${channel}" ]]; then
echo "${count}/${total} ${x} not uploaded from ${channel}, removing..." && rm "${x}"
fi
if [[ -f "${x}" && "${breaktime}" =~ ^[0-9]+$ ]]; then
file_timestamp=$(jq -rc '.timestamp' "${x}")
2025-06-10 14:21:26 +00:00
if [[ "${breaktime_timestamp}" -ge "${file_timestamp}" ]]; then
echo "${count}/${total} ${x} uploaded before ${breaktime}, removing..." && rm "${x}"
2025-06-10 14:21:26 +00:00
fi
fi
if [[ -f "${x}" ]]; then
if [[ $(stat -c%s "${x}") -gt 4096 ]]; then
jq '.formats="" | .automatic_captions="" | .subtitles="" | .thumbnails="" | .tags="" | .chapters="" | .heatmap="" | .categories=""' "${x}" >"${x}.tmp" && mv "${x}.tmp" "${x}"
fi
echo "youtube $(jq -cr '.id' "${x}")" >>"${temporary}/${channel}.txt"
2025-06-09 15:07:05 +00:00
if [[ ${enablecsv} = "1" ]]; then
2025-06-24 13:44:20 -06:00
jq -c '[.upload_date, .timestamp, .duration, .uploader , .title, .webpage_url]' "${x}" | while read -r i; do
echo "${i}" | sed -e "s/^\[//g" -e "s/\]$//g" -e "s/\\\\\"//g" >>"${tmpcsv}"
2025-06-09 15:07:05 +00:00
done
fi
2025-06-11 14:17:03 +00:00
if [[ ${enabledb} = "1" ]]; then
jq -c '[.upload_date, .timestamp]' "${x}" | while read -r i; do
echo "${i},${x##*/}" | sed -e "s/^\[//g" -e "s/\],/,/g" -e "s/\\\\\"//g" >>"${sortcsv}"
2025-06-09 15:07:05 +00:00
done
fi
echo "${count}/${total} ${x}"
fi
2025-06-09 15:07:05 +00:00
) &
if [[ $(jobs -r -p | wc -l) -ge $(getconf _NPROCESSORS_ONLN) ]]; then
wait -n
2025-05-30 16:09:56 +00:00
fi
2025-06-09 15:07:05 +00:00
done
wait
sleep 1
if [[ ${enabledb} = "1" ]]; then
    #Build the FreeTube playlist database from the sorted (upload_date,timestamp,filename) rows.
    sort "${sortcsv}" | uniq >"${temporary}/${channel}-sort-ordered.csv"
    if [[ -f "${temporary}/${channel}.db" ]]; then
        rm "${temporary}/${channel}.db"
    fi
    echo "{\"playlistName\":\"${channel}\",\"protected\":false,\"description\":\"Videos from ${channel} to watch later\",\"videos\":[" >"${temporary}/${channel}.db"
    count=0
    total=$(wc -l <"${temporary}/${channel}-sort-ordered.csv")
    while read -r line; do
        count=$((count + 1))
        file=$(echo "${line}" | cut -d ',' -f3-)
        if [[ -f "${file}" ]]; then
            #published is .timestamp in milliseconds; timeAdded is the current epoch time in milliseconds.
            jq -c "{\"videoId\": .id, \"title\": .title, \"author\": .uploader, \"authorId\": .channel_id, \"lengthSeconds\": .duration, \"published\": ( .timestamp * 1000 ), \"timeAdded\": $(date +%s)$(date +%N | cut -c-3), \"playlistItemId\": \"$(cat /proc/sys/kernel/random/uuid)\", \"type\": .media_type}" "${temporary}/${file}" >>"${temporary}/${channel}.db"
            echo "," >>"${temporary}/${channel}.db"
            echo "${count}/${total} ${file}"
        fi
    done <"${temporary}/${channel}-sort-ordered.csv"
    echo "],\"_id\":\"${channel}$(date +%s)\",\"createdAt\":$(date +%s),\"lastUpdatedAt\":$(date +%s)}" >>"${temporary}/${channel}.db"
    rm -f "${json}"
    grep -v -e ":[ ]*null" "${temporary}/${channel}.db" | tr '\n' '\r' | sed -e "s/,\r[,\r]*/,\r/g" | sed -e "s/,\r\]/\]/g" -e "s/\[\r,/\[/g" | tr '\r' '\n' | jq -c . >"${json}" && rm "${temporary}/${channel}.db"
    rm "${temporary}/${channel}-sort-ordered.csv" "${sortcsv}"
fi
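#For reference, each entry appended above looks roughly like this (field names come from
#the jq template; the values are illustrative placeholders, not real data):
# {"videoId":"XXXXXXXXXXX","title":"Example title","author":"Example channel","authorId":"UCxxxxxxxxxxxxxxxxxxxxxx","lengthSeconds":300,"published":1717000000000,"timeAdded":1717000000000,"playlistItemId":"00000000-0000-0000-0000-000000000000","type":"video"}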
if [[ ${enablecsv} = "1" ]]; then
    sort "${tmpcsv}" | uniq >"${temporary}/${channel}-without-header.csv"
    echo '"Upload Date", "Timestamp", "Duration", "Uploader", "Title", "Webpage URL"' >"${temporary}/${channel}-tmp.csv"
    cat "${temporary}/${channel}-without-header.csv" >>"${temporary}/${channel}-tmp.csv"
    mv "${temporary}/${channel}-tmp.csv" "${csv}"
    rm "${temporary}/${channel}-without-header.csv"
    rm "${tmpcsv}"
fi
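#A data row in the resulting CSV looks roughly like (illustrative values):
# "20250101",1735689600,300,"Example channel","Example title","https://www.youtube.com/watch?v=XXXXXXXXXXX"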
cd "${temporary}" || exit
tar -cvp -I "zstd -T0" -f "${subfolder}/${channel}.tar.zst" -- *.info.json
count=0
total=$(find "${temporary}" -type f -iname "*.info.json" | wc -l)
sort "${temporary}/${channel}.txt" | uniq >"${archive}"
rm -rf "${temporary}"