y/y.sh

306 lines
6.7 KiB
Bash
Raw Normal View History

2023-08-06 22:01:08 +02:00
#!/usr/bin/env bash
2023-06-23 20:07:30 +02:00
## y
2023-08-06 22:01:08 +02:00
# > algorithmically-enhanced yt-dlp (youtube-dl) wrapper for audio-downloads
2023-06-23 20:07:30 +02:00
## requires
# - `python3 -m pip install --upgrade yt-dlp`
# the main thing, you should already have it
# - `sudo apt install -y ffmpeg` to convert files of diffrent formats
# - `cargo install sd` a better `sed`
# - `sudo apt install -y lynx` to easily scrap web-pages
DN_TYPE=''
YDL()
{
which yt-dlp
if [ $? -eq 0 ]; then
yt-dlp $DN_TYPE --cookies-from-browser firefox $@
# --verbose
# --restrict-filenames
return
fi
echo 'no youtube-dl/yt-dlp found, you can install it with:
sudo apt install -y \
python3 python3-pip
python3 -m pip install --upgrade \
yt-dlp
'
exit 1
}
# load config
cd `realpath "$0" | xargs dirname`
. config.sh
# use new-line as separator of array elements
IFS=$'\n'
# parse cli options
OPT="$1"
URL="$2"
if [ -z "$URL" ]; then
OPT=''
URL="$1"
fi
SITE=` echo "$URL" \
| sd 'https?://(www\.)?' '' \
| sd '/.*' '' \
`
if [ OPT == 'band' ]; then
SITE='_CNAME.bandcamp.com'
fi
echo "URL : '$URL'"
echo "SITE : '$SITE'"
if [ "$OPT" == 'F' ]; then
YDL "$URL" -F
exit 1
fi
if [ "$OPT" == '22' ]; then
DN_TYPE='-f 22'
fi
to_mp3()
{
echo "to mp3: [ ${@} ]"
for UNCOMPRESSED in "${@}" ; do
MP3=` echo "$UNCOMPRESSED" \
| sd '\.\w+$' ' [conv].mp3' \
`
echo "'$UNCOMPRESSED'"
echo ">> '$MP3'"
ffmpeg -i "$UNCOMPRESSED" \
-codec:a libmp3lame \
-qscale:a 2 \
-loglevel quiet \
-y "$MP3"
rm "$UNCOMPRESSED"
done
}
get_bandcamp_track()
{
echo "> > track: '$1'"
YDL "$1" -f mp3-320 \
2024-04-24 17:58:40 +02:00
-o "$MUSIC_PATH/$ARTIST/%(album)s/%(track_number)02d %(title).50B [%(id)s].%(ext)s"
2023-06-23 20:07:30 +02:00
[ $? -eq 1 ] \
&& YDL "$1" -f mp3 \
2024-04-24 17:58:40 +02:00
-o "$MUSIC_PATH/$ARTIST/%(album)s/%(track_number)02d %(title).50B [%(id)s].%(ext)s"
2023-06-23 20:07:30 +02:00
}
get_bandcamp_album()
{
echo "> > album: '$1'"
SUBLINKS=(` lynx -dump -listonly -nonumbers "$1" \
| grep -Eiw "^(https://$SITE/track)" \
| sd '(\?|#).+$' '' \
| sort -u \
`)
for LINK in "${SUBLINKS[@]}" ; do
get_bandcamp_track "$LINK"
done
}
case "$SITE" in
'music.youtube.com')
echo '> youtube-music'
YDL "$URL" -f 251 \
2024-04-24 17:58:40 +02:00
-o "$MUSIC_PATH/%(artist)s - %(title).50B [%(id)s].%(ext)s"
2023-06-23 20:07:30 +02:00
;;
'youtube.com'| \
'm.youtube.com'| \
'youtu.be')
echo '> youtube'
if [[ "$URL" = *youtube\.com\/@* ]]; then
echo '> > store archive'
2023-10-15 06:20:02 +02:00
YDL "$URL" \
2024-04-24 17:58:40 +02:00
-o "$YT_PATH/%(uploader_id)s/%(title).50B [%(id)s].%(ext)s"
else
case "$OPT" in
'm')
echo '> > music'
YDL "$URL" -f 251 \
2024-04-24 17:58:40 +02:00
-o "$MUSIC_PATH/%(title).50B [%(id)s].%(ext)s"
;;
'a')
echo '> > audio'
YDL "$URL" -f 251 \
2024-04-24 17:58:40 +02:00
-o "$AUDIO_PATH/%(title).50B [%(id)s].%(ext)s"
;;
's')
echo '> > store archive'
2023-10-15 06:20:02 +02:00
YDL "$URL" \
2024-04-24 17:58:40 +02:00
-o "$YT_PATH/%(uploader_id)s/%(title).50B [%(id)s].%(ext)s"
2023-06-23 20:07:30 +02:00
;;
*)
echo '> > _video_'
YDL "$URL" \
2024-04-24 17:58:40 +02:00
-o "$DEFAULT_PATH/yt-%(title).50B [%(id)s].%(ext)s"
;;
esac
fi
2023-06-23 20:07:30 +02:00
;;
'soundcloud.com'| \
*.soundcloud.com )
echo '> soundcloud'
ARTIST=` echo "$URL" \
| sd 'https?://([\w-]+\.)?soundcloud.com/' '' \
| sd '/.*' '' \
`
echo "ARTIST : '$ARTIST'"
YDL "$URL" --add-metadata \
--postprocessor-args "-metadata artist='$ARTIST'" \
-o "$MUSIC_PATH/$ARTIST/%(title).200B.%(ext)s"
WAV_FILES=(` ls -RAd $MUSIC_PATH/$ARTIST/*.wav `)
[ $? -eq 0 ] \
&& to_mp3 "$WAV_FILES"
FLAC_FILES=(` ls -RAd $MUSIC_PATH/$ARTIST/*.flac `)
[ $? -eq 0 ] \
&& to_mp3 "$FLAC_FILES"
;;
'bandcamp.com'| \
*.bandcamp.com )
echo '> bandcamp'
ARTIST=''
if [ OPT == 'band' ]; then
ARTIST=` echo "$URL" \
| sd '^https?://(www\.)?' '' \
| sd '/.*$' '' \
| sd '\..+$' '' \
`
SITE=` echo "$URL" \
| sd '^https?://(www\.)?' '' \
| sd '/.*$' '' \
`
else
ARTIST=` echo "$SITE" \
| sd '\.bandcamp\.com.*' '' \
`
if [ -z "$ARTIST" ]; then
ARTIST="$SITE"
fi
fi
echo "ARTIST : '$ARTIST'"
if [[ "$URL" =~ '/track/' ]]; then
get_bandcamp_track "$URL"
elif [[ "$URL" =~ '/album/' ]]; then
get_bandcamp_album "$URL"
else
echo '> > discography'
SUBLINKS=(` lynx -dump -listonly -nonumbers "$URL" \
| grep -Eiw "^(https://$SITE/(album|track))" \
| sd '\?action=download' '' \
| uniq \
`)
for LINK in "${SUBLINKS[@]}" ; do
if [[ "$LINK" =~ '/track/' ]]; then
get_bandcamp_track "$LINK"
elif [[ "$LINK" =~ '/album/' ]]; then
get_bandcamp_album "$LINK"
fi
done
fi
RENAME_LIST=(` ls -RAd $MUSIC_PATH/$ARTIST/NA/* `)
if [ $? -eq 0 ]; then
for RENAME_FROM in "${RENAME_LIST[@]}"; do
RENAME_TO=` echo "$RENAME_FROM" \
| sd '/NA/NA ' '/' \
`
if [ "$RENAME_FROM" != "$RENAME_TO" ]; then
echo "'$RENAME_FROM'"
echo ">> '$RENAME_TO'"
mv "$RENAME_FROM" "$RENAME_TO"
fi
done
rmdir "$MUSIC_PATH/$ARTIST/NA/"
fi
;;
'twitter.com'| \
*.twitter.com )
echo '> twitter'
CLEAN_URL=` echo "$URL" \
| sd '^https?://([\w-]+\.)?twitter.com/' '' \
| sd '/?\?.*$' '' \
| sd -- '/status/' '--' \
| sd '/' '-' \
`
2024-04-24 17:58:40 +02:00
CLEAN_URL=${CLEAN_URL:0:50}
2023-06-23 20:07:30 +02:00
echo "CLEAN_URL : '$CLEAN_URL'"
YDL "$URL" -o "$DEFAULT_PATH/tw--$CLEAN_URL.%(ext)s"
;;
'reddit.com'| \
*.reddit.com )
echo '> reddit'
CLEAN_URL=` echo "$URL" \
| sd '^https?://([\w-]+\.)?reddit.com/(r/)?' '' \
| sd '/?\?.*$' '' \
| sd -- '/?comments/' '--' \
| sd '/' '-' \
`
2024-04-24 17:58:40 +02:00
CLEAN_URL=${CLEAN_URL:0:50}
2023-06-23 20:07:30 +02:00
echo "CLEAN_URL : '$CLEAN_URL'"
YDL "$URL" -o "$DEFAULT_PATH/r-$CLEAN_URL.%(ext)s"
;;
'instagram.com'| \
*.instagram.com )
echo '> instagram'
CLEAN_URL=` echo "$URL" \
| sd '^https?://([\w-]+\.)?instagram.com/p/' '' \
| sd '/?\?.*$' '' \
| sd '/+$' '' \
| sd '/' '-' \
`
2024-04-24 17:58:40 +02:00
CLEAN_URL=${CLEAN_URL:0:50}
2023-06-23 20:07:30 +02:00
echo "CLEAN_URL : '$CLEAN_URL'"
DATE=` date -u "+%Y%m%d%H%M%S" `
YDL "$URL" -o "$DEFAULT_PATH/ig-%(uploader_id).50B-$CLEAN_URL-(%(title).50B)_$DATE.%(ext)s"
;;
*)
echo '> _default_'
CLEAN_URL=` echo "$URL" \
| sd '^https?://(www\.)?' '' \
| sd '/+$' '' \
| sd '[\\\/\s\?\^\*\|:><]+' '-' \
`
CLEAN_URL=${CLEAN_URL%%/*}
2024-04-24 17:58:40 +02:00
CLEAN_URL=${CLEAN_URL:0:50}
2023-06-23 20:07:30 +02:00
echo "CLEAN_URL : '$CLEAN_URL'"
DATE=` date -u "+%Y%m%d%H%M%S" `
YDL "$URL" -o "$DEFAULT_PATH/$CLEAN_URL-[%(id)s]_$DATE.%(ext)s"
;;
esac