-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathyoutube-dl-batch.sh
executable file
·172 lines (144 loc) · 4.98 KB
/
youtube-dl-batch.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
#!/bin/bash
# define the directory containing this script
DIR="$( cd "$( dirname "${BASH_SOURCE[0]}" )" >/dev/null 2>&1 && pwd )"
# source variables
source "${DIR}/vars.sh"
# if the system is using pyenv, set PATH in order to use pyenv, not system
# python
if [ -d "${HOME}/.pyenv" ]; then
export PATH=~/.pyenv/shims:~/.pyenv/bin:"$PATH"
fi
# create logger functions
logger_args () {
# this function send arguments to stdout and appends them to a logfile
local LOGFILE
# by default, we set this logger to write to a file that is located in the
# same directory as the script that sources this functions definition file
LOGFILE="${DIR}/${BASENAME_S}.log"
echo -e "$@" | tee -a $LOGFILE
return
}
main_logger () {
# basic logging info
echo -e "START_LOGFILE\n"
date
echo -e "Running $0 with process id $$\n"
# log pid to a file
PID_FILE="$(mktemp "${TMP_DIR}/${BASENAME_S}.$$.XXXXXXXXXX")"
echo -e $$ > $PID_FILE
return
}
path_logger () {
# log path and program info
echo -e "PATH is set to: $PATH\n"
echo -e "Using the following python:\n$(which python)\n"
echo -e "Pyenv is using the following python and version: \
\n$(pyenv which python)\n"
echo -e "Using the following youtube-dl:\n$(which youtube-dl)\n"
return
}
config_joiner () {
# takes 1 or more (config) files as arguments and joins them into one
# variable used for joining a base config file with directory specific
# config
cat "$@"
return
}
# generate logs for this session
main_logger
path_logger
# define functions for traps
trap_handle () {
# clean up upon receiving SIGTERM or SIGINT
echo -e "Caught signal SIGTERM or SIGINT"
if [[ "$child" ]]; then
echo -e "Killing child process\n$(ps -o pid,comm $child)\nwith pid
$child"
kill -TERM $child
fi
echo -e "${BASENAME}:\n$(date)\nExiting"
exit 0
return
}
# trap SIGINT and SIGTERM for this script
trap trap_handle INT TERM
# check to see if the file "archive" exists and create it if it doesn't
if [ ! -f $ARCHIVE_FILE ]; then
echo -e "Creating archive file...\n" && touch $ARCHIVE_FILE
else
echo -e "Found archive file: ${ARCHIVE_FILE}"
fi
# copy the archive file to diff it later if useful
cp $ARCHIVE_FILE "${ARCHIVE_FILE}.b"
# cd to download directory
if [[ -d "$DOWNLOAD_DIR" ]]; then
if cd $DOWNLOAD_DIR; then
echo "Changed directory to $DOWNLOAD_DIR"
else
echo "Coudn't cd to ${DOWNLOAD_DIR}. Exiting."
exit 1
fi
else
if mkdir -p $DOWNLOAD_DIR; then
echo "Created $DOWNLOAD_DIR"
if cd $DOWNLOAD_DIR; then
echo "Changed directory to ${DOWNLOAD_DIR}"
else
echo "Coudn't cd to ${DOWNLOAD_DIR}. Exiting."
exit 1
fi
else
echo "Couldn't create ${DOWNLOAD_DIR}. Exiting."
exit 1
fi
fi
# download media
for i in $(ls -1 "$BATCH_DIR"); do
# join the base and current config files and write to the tmp directory
CURRENT_DIR="${BATCH_DIR}/${i}"
# if there is a pause file in this directory, go to the next directory
if [ -e "${CURRENT_DIR}/pause" ]; then
echo -e "Found a file named "pause" in ${CURRENT_DIR} ; skipping \
downloading media in this directory"
continue
fi
# otherwise, proceed with the download
echo -e "Downloading content from ${CURRENT_DIR}...\n"
# join the local config file with the global config file and define a
# filename
CURRENT_CONFIG_PATH="${CURRENT_DIR}/${CONFIG_BASENAME}"
TMP_CONFIG_FILE_PATH="${TMP_DIR}/${i}_config.tmp"
# join the base config with the current directory's config file, and
# redirect to a temporary file
config_joiner "$BASE_CONFIG_PATH" "$CURRENT_CONFIG_PATH" > \
"$TMP_CONFIG_FILE_PATH"
# echo -e "The joined config file contains $(wc -l \
# "$TMP_CONFIG_FILE_PATH" | sed -E "s/(^ *)([0-9]+)(.*)/\2/g") lines\n"
# define the path of the batch file containing urls to be downloaded
BATCH_FILE_PATH="${CURRENT_DIR}/${BATCH_BASENAME}"
# download the media
echo -e "\nDownloading media from $CURRENT_DIR\n"
# execute youtube-dl in the background with the specified parameters
youtube-dl \
--download-archive "$ARCHIVE_FILE" \
--config-location "$TMP_CONFIG_FILE_PATH" \
--batch-file "$BATCH_FILE_PATH" \
&
# wait for this process so that the main script can catch SIGTERM or SIGINT
# and run the corresponding trap. We don't want to "exec" youtube-dl, since
# we need to keep the shell around to continue with the loop. There are
# likely some race conditions created here, so this approach could be
# improved upon.
child=$!
wait $child
# Log the success or failure of the last waited-for background command.
# wait, as called above, will exit with the exit status of the specified
# pid
wait_exit_status=$?
if [[ $wait_exit_status -gt 0 ]]; then
echo "There was an error: process $child exited with
status $wait_exit_status"
else
echo -e "Finished downloading media from $CURRENT_DIR\n"
fi
done