-
Notifications
You must be signed in to change notification settings - Fork 0
/
xgif
executable file
·431 lines (399 loc) · 14.3 KB
/
xgif
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
#!/usr/bin/env bash
set -euo pipefail

# macOS ships bash 3 by default, which cannot run this script. Version 4 is
# untested and version 5 is known to work, so only versions older than 4 are
# refused. Please report further version issues at
# https://github.com/llimllib/ytgif
if [ "${BASH_VERSINFO[0]:-0}" -lt 4 ]; then
  printf "\033[31mYour version of bash (%s) is too old, please upgrade it to run this script\033[0m\n" "${BASH_VERSINFO[0]:-unknown}"
  # Exit non-zero so callers can tell the script refused to run; a bare
  # `exit` would hand back printf's successful status instead.
  exit 1
fi
# Print the full help text to stdout and exit with status 1.
#
# Takes no arguments. The heredoc delimiter is quoted ("EOF"), so the text is
# emitted literally: the backticks and $PATH inside it are not expanded.
# Because the function always exits, callers never get control back. The flag
# parser calls it for help|-h|--help, and the dependency and argument-count
# checks call it after printing (or instead of) their own message.
function usage() {
cat <<"EOF"
Usage: ytgif [OPTIONS] <youtube-url> <output_file>
Download the video named in youtube-url and create a gif of it. Will embed the auto-generated subtitles if they're available. You can use the start and finish times to trim it to the duration you'd like.
OPTIONS
-v: print more verbose output
-scale n: scale the video's width to n pixels [default 640]
-fps n: set the fps of the output gif [default 20]
-gifsicle: post-process the image with `gifsicle -O2`
-start time: the time to start the video at
-finish time: the time to finish the video at
-nosubs: do not include subtitles in the output even if they're available
-sub-lang lang: sub language to choose
-autosubs: prefer youtube's auto-generated subtitles
-caption text: use a caption for the entire gif instead of subtitles
-fontsize: the font size for the caption. Defaults to 30 if caption set, otherwise to whatever ffmpeg defaults it to
-whisper: use OpenAI's `whisper` to generate captions
-whisper-large: use whisper's "large" model instead of its medium one. May download a large model file
TIME
The start and finish times can be specified in seconds, or mm:ss or hh:mm:ss.ms. ffmpeg is flexible in what it accepts. https://trac.ffmpeg.org/wiki/Seeking
INSTALLING
copy ytgif.bash to somewhere on your $PATH and rename it `ytgif`
WHISPER
For instructions on installing OpenAI whisper, go to https://github.com/openai/whisper#setup
EXAMPLES
Download the "I can't believe you've done this" clip, and turn the whole thing into "donethis.gif"
ytgif "https://www.youtube.com/watch?v=wKbU8B-QVZk" donethis.gif
Download the "don't call me shirley" clip from youtube, cut from 1:02 to 1:10.9 lower the fps to 10, and save it as airplane.gif:
ytgif -start 1:02 -finish 1:10.9 -fps 10 \
"https://www.youtube.com/watch?v=ixljWVyPby0" airplane.gif
Download a bit of a linear algebra lecture, and subtitle it in spanish:
ytgif -sub-lang es -start 26:54 -finish 27:02 \
"https://www.youtube.com/watch?v=QVKj3LADCnA" strang.gif
Create a tiny rickroll gif, optimize it, and don't include subtitles:
ytgif -gifsicle -scale 30 -start 0.5 -finish 3 -nosubs \
"https://www.youtube.com/watch?v=dQw4w9WgXcQ" rickroll.gif
Create a gif of owen wilson saying "wow":
ytgif -start 74.8 -finish 75.8 -nosubs -gifsicle \
"https://www.youtube.com/watch?v=KlLMlJ2tDkg&t=50s" wow.gif
Create a gif of Gob Bluth, and manually set the caption to "I've made a huge
mistake":
ytgif -v -start 13 -finish 17 -gifsicle -fps 10 \
-fontsize 40 -caption "I've made a huge mistake" \
"https://www.youtube.com/watch?v=GwQW3KW3DCc" mistake.gif
Create a gif of Dr. Frankenstein, and use OpenAI whisper to caption it
ytgif -start 49 -finish 55.5 -whisper \
https://www.youtube.com/watch?v=WamF64GFPzg frankenstein.gif
NOTES
- Be careful to quote the youtube URL, if it contains the & character it will not work unless quoted
- ytgif caches downloaded videos in `/tmp/ytgif_cache`, so you can quickly try edits to the gif without re-downloading videos. These can be quite large, so you may want to clear that folder when you're done making a gif
- youtube's auto subtitles are far from perfect, but often better than nothing
- generating a gif using OpenAI whisper is a bit slow, be patient
EOF
# the script ends here with a non-zero status, even when help was asked for explicitly
exit 1
}
# ---- option defaults ----

# on/off switches: the empty string means "off", any non-empty value means "on"
verbose=""
gifsicle=""
nosubs=""
audiorequired=""
custom_fontsize=""
whisper=""

# size and frame rate of the output
scale=640
fps=20
fontsize=30

# clip boundaries; finish is an array so it can expand to zero words when no
# finish time is requested
start_=0
finish=()

# subtitle and caption selection
sublang=""
caption=""
subflags=(--write-subs --write-auto-subs)

# extra arguments for the whisper command line
whisper_options=()
# Parse command line flags.
#
# Flags are consumed from the front of the argument list. Parsing stops at the
# first argument that is not a recognised flag, which leaves the positional
# arguments (youtube url, output file) in "$@" for the code that follows.
#
# "${1:-}" and the explicit argument-count checks matter because the script
# runs under `set -u`: without them, running with no arguments or leaving the
# value off a flag aborts with a bare "unbound variable" error. With them the
# user gets the usage text instead.
while true; do
  case "${1:-}" in
    -v)
      verbose=true
      shift
      ;;
    -gifsicle)
      gifsicle=true
      shift
      ;;
    -scale)
      [ $# -ge 2 ] || usage
      scale=$2
      shift 2
      ;;
    -fps)
      [ $# -ge 2 ] || usage
      fps=$2
      shift 2
      ;;
    -start)
      [ $# -ge 2 ] || usage
      start_=$2
      shift 2
      ;;
    -finish)
      [ $# -ge 2 ] || usage
      # stored as ready-made ffmpeg arguments
      finish=(-to "$2")
      shift 2
      ;;
    -sub-lang)
      [ $# -ge 2 ] || usage
      sublang=$2
      shift 2
      ;;
    -nosubs)
      subflags=(--no-write-subs)
      nosubs="true"
      shift
      ;;
    -autosubs)
      subflags=(--write-auto-subs)
      shift
      ;;
    -caption)
      [ $# -ge 2 ] || usage
      caption=$2
      shift 2
      ;;
    -fontsize)
      [ $# -ge 2 ] || usage
      fontsize=$2
      # remember that the size was chosen explicitly; the subtitle branches
      # only force a font size in that case
      custom_fontsize="true"
      shift 2
      ;;
    -whisper)
      audiorequired="true"
      whisper="true"
      shift
      ;;
    -whisper-large)
      audiorequired="true"
      whisper="true"
      whisper_options=(--model large)
      shift
      ;;
    help | -h | --help)
      usage
      ;;
    *)
      # first non-flag argument (or no arguments left): stop parsing
      break
      ;;
  esac
done
# Quiet is the default: ffmpeg hides its banner and logs errors only, and
# yt-dlp runs with --quiet. With -v the shell traces every command and both
# tools are left to print whatever they normally print.
if [ -z "$verbose" ]; then
  ffmpegquiet=(-hide_banner -loglevel error)
  ytdlpquiet=(--quiet)
else
  ffmpegquiet=(-hide_banner -loglevel error)
  ytdlpquiet=(--quiet)
  set -x
  ffmpegquiet=()
  ytdlpquiet=()
fi

# --sub-langs is only handed to yt-dlp when a language was asked for
if [ -z "$sublang" ]; then
  sublangs=()
else
  sublangs=()
  sublangs=(--sub-langs "$sublang")
fi
# Make sure the external programs we are about to call exist. ffmpeg and
# yt-dlp are always required; gifsicle and whisper are only looked up when
# their flags were given. A missing program gets a pointer to its download
# page followed by the usage text (usage ends the script).
command -v ffmpeg &> /dev/null || {
  printf "\033[31mYou must install ffmpeg\033[0m: https://ffmpeg.org/download.html\n\n"
  usage
}

command -v yt-dlp &> /dev/null || {
  printf "\033[31mYou must install yt-dlp\033[0m: https://github.com/yt-dlp/yt-dlp#installation\n\n"
  usage
}

if [ -n "$gifsicle" ] && ! command -v gifsicle &> /dev/null; then
  printf "\033[31mYou must install gifsicle\033[0m: https://www.lcdf.org/gifsicle/\n\n"
  usage
fi

if [ -n "$whisper" ] && ! command -v whisper &> /dev/null; then
  printf "\033[31mYou must install whisper\033[0m: https://github.com/openai/whisper\n\n"
  usage
fi
# After flag parsing two positional arguments must remain: the youtube URL
# and then the output file name. Anything less shows the usage text.
if (( $# < 2 )); then
  usage
fi
yturl="$1"
output="$2"

# downloads and intermediate clips are kept here between runs
ytgif_cache_folder="/tmp/ytgif_cache"
[ -d "$ytgif_cache_folder" ] || mkdir "$ytgif_cache_folder"

# A glob that matches nothing should expand to an empty array rather than to
# the literal pattern; the cache lookups below count array elements to decide
# whether a file exists.
# https://unix.stackexchange.com/a/34012
shopt -s nullglob
###########################
# Step 1: download.
#
# - the video is saved as video_<sanitized url>.<ext>
#     - <ext> is *usually* webm, but that is up to yt-dlp
# - the audio is fetched as well when it is needed
# - subtitles are only fetched together with the video; if the video is
#   already cached and you need subtitles, clear the cache. Sorry
###########################

# cache key: the URL with everything except ascii a-zA-Z0-9 removed
yturl_clean=${yturl//[^a-zA-Z0-9]/}

# yt-dlp output templates: video_<key>.<ext> for the video and sub_<key> as
# the stem for subtitle files, both inside the cache folder
ytdl_video_outfile="$ytgif_cache_folder/video_$yturl_clean.%(ext)s"
ytdl_sub_outfile="$ytgif_cache_folder/sub_$yturl_clean"

# only go to the network when no video for this key is cached yet
input_video=("$ytgif_cache_folder/video_$yturl_clean".*)
if (( ${#input_video[@]} == 0 )); then
  video_dl_args=(
    -f bv
    "${ytdlpquiet[@]}"
    "${sublangs[@]}"
    "${subflags[@]}"
    -o "$ytdl_video_outfile"
    -o "subtitle:$ytdl_sub_outfile"
    "$yturl"
  )
  yt-dlp "${video_dl_args[@]}" || {
    printf "\033[31mfailed running yt-dlp\033[0m\nre-running with -v may show why\n"
    exit 1
  }
fi
# yt-dlp output template for the audio track; it goes unused unless
# $audiorequired is set
ytdl_audio_outfile="$ytgif_cache_folder/audio_$yturl_clean.%(ext)s"

# Check for cached audio; if none exists and audio is required, download it.
#
# Subtitle writing is switched off for this download. No subtitle-specific
# output template is given here, so any subtitle files would be named after
# the audio template (audio_<key>.<lang>.<ext>). The audio_<key>.* glob would
# then match them, and they can sort ahead of the real audio file and be
# picked up as the audio input. Nothing in the script reads subtitles from
# audio_* files, so nothing is lost.
input_audio=("$ytgif_cache_folder/audio_$yturl_clean".*)
if [ -n "$audiorequired" ] && [ ${#input_audio[@]} -eq 0 ]; then
  if ! yt-dlp -f ba \
    "${ytdlpquiet[@]}" \
    --no-write-subs --no-write-auto-subs \
    -o "$ytdl_audio_outfile" \
    "$yturl"; then
    printf "\033[31mfailed running yt-dlp\033[0m\nre-running with -v may show why\n"
    exit 1
  fi
fi
# Evaluate the globs again now that any downloads are done, to get the input
# video, audio, and subtitle files. With nullglob on, a pattern that matches
# nothing leaves its array empty.
input_video=("$ytgif_cache_folder/video_$yturl_clean".*)
input_audio=("$ytgif_cache_folder/audio_$yturl_clean".*)
subtitles=("$ytgif_cache_folder/sub_$yturl_clean."*)
if [ -n "$verbose" ]; then
  # "${arr[*]}" joins each array into exactly one argument, so every label
  # keeps its own value even when an array is empty or holds several files.
  # Expanding with [@] shifted later values under the wrong label.
  printf "⚠️ input_video: %s\n⚠️ subtitles: %s\n⚠️ audio: %s\n" \
    "${input_video[*]}" "${subtitles[*]}" "${input_audio[*]}"
fi
###########################
# Step 2: clip files
# - cut the video to the requested start/finish and save it as
#   vclip_<sanitized url>.<ext>
# - when there is an audio file, cut it too and save it as
#   aclip_<sanitized url>.<ext>
###########################

# the clip keeps the extension of the downloaded video ($input_video without
# a subscript is its first element)
ext="${input_video##*.}"
vclipfile="$ytgif_cache_folder/vclip_$yturl_clean.$ext"

# the start time and the optional finish time are given twice: once before
# -i and once after it
vclip_args=(
  -y "${ffmpegquiet[@]}"
  -ss "$start_"
  "${finish[@]}"
  -i "${input_video[0]}"
  -c copy -copyts
  -ss "$start_"
  "${finish[@]}"
  "$vclipfile"
)
ffmpeg "${vclip_args[@]}" || {
  printf "\033[31mfailed running ffmpeg\033[0m\nre-running with -v may show why\n"
  exit 1
}
# Clip the audio the same way as the video, but only when audio was requested
# (the whisper flags set $audiorequired). Without this guard every
# non-whisper run reached this point with an empty input_audio array and the
# script stopped here before it could produce a gif.
aclipfile=""
if [ -n "$audiorequired" ]; then
  if [ ${#input_audio[@]} -eq 0 ]; then
    printf "\033[31mno audio file found in the cache\033[0m\nre-running with -v may show why\n"
    exit 1
  fi
  ext=${input_audio[0]##*.}
  aclipfile="$ytgif_cache_folder/aclip_$yturl_clean.$ext"
  # if we don't include the duplicate start and finish here, we get a clip
  # that is clipped properly but the timing is wrong, it doesn't trim the
  # start time of the file for reasons that are not clear to me
  if ! ffmpeg -y "${ffmpegquiet[@]}" \
    -ss "$start_" \
    "${finish[@]}" \
    -i "${input_audio[0]}" \
    -c copy -copyts \
    -ss "$start_" \
    "${finish[@]}" \
    "$aclipfile"; then
    printf "\033[31mfailed running ffmpeg\033[0m\nre-running with -v may show why\n"
    exit 1
  fi
fi
###########################
# Step 3: create output file
#
# Exactly one of four encodings runs, checked in this order:
#   1. $whisper set: run whisper on the audio clip and burn in its subtitles
#   2. $caption set: draw one fixed caption over the whole gif
#   3. no subtitle file in the cache, or $nosubs set: plain gif
#   4. otherwise: burn in the first subtitle file found in the cache
# Every branch sends $vclipfile through the same fps / scale / palettegen /
# paletteuse filter chain and writes the result to $output.
###########################
if [ -n "$whisper" ]; then
# run whisper to extract the subtitles
# $whisper_options is empty unless -whisper-large set it to `--model large`
# TODO: add option to use model size
if ! whisper "${whisper_options[@]}" "$aclipfile" -o "$ytgif_cache_folder" ; then
printf "\033[31mfailed running whisper\033[0m\nre-running with -v may show why\n"
exit 1
fi
# NOTE(review): assumes whisper names its output <audio clip path>.srt;
# confirm against the installed whisper version
subtitle="$aclipfile.srt"
# if fontsize has been set, add a "force_style" with the specified font
# size
#
# https://www.ffmpeg.org/ffmpeg-filters.html#subtitles-1
force_style=
if [ -n "$custom_fontsize" ] && [ -n "$fontsize" ]; then
force_style=":force_style='FontSize=$fontsize'"
fi
# convert the clipfile to a gif, using the subtitles we created with
# whisper
# NOTE(review): this is the only one of the four ffmpeg calls in this step
# that passes -y
if ! ffmpeg -y "${ffmpegquiet[@]}" \
-i "$vclipfile" \
-filter_complex "\
[0:v] fps=$fps, \
scale=$scale:-1, \
split [a][b], \
[a] palettegen [p], \
[b][p] paletteuse, \
subtitles=$subtitle${force_style}" \
"$output"; then
printf "\033[31mfailed running ffmpeg\033[0m\nre-running with -v may show why\n"
exit 1
fi
elif [ -n "$caption" ]; then
caption_file="$ytgif_cache_folder/caption_$yturl_clean"
# to avoid the nightmare of quoting bash strings, dump the caption into a
# text file and use the `textfile` option to ffmpeg
echo "$caption" > "$caption_file"
# the caption is drawn in white with a 1px black border, centred
# horizontally and 10 pixels above the bottom edge; $fontsize is always
# applied here (30 unless -fontsize was given)
if ! ffmpeg "${ffmpegquiet[@]}" \
-i "${vclipfile}" \
-filter_complex "\
[0:v] fps=$fps, \
scale=$scale:-1, \
split [a][b], \
[a] palettegen [p], \
[b][p] paletteuse, \
drawtext=borderw=1: \
bordercolor=black: \
fontcolor=white: \
fontsize=$fontsize: \
x=(w-text_w)/2: \
y=(h-text_h)-10: \
textfile=$caption_file" \
"$output"; then
printf "\033[31mfailed running ffmpeg\033[0m\nre-running with -v may show why\n"
exit 1
fi
# if we don't have any subtitles available, or -nosubs was given, just encode
# to gif without them
elif [ ${#subtitles[@]} -eq 0 ] || [ -n "$nosubs" ]; then
if ! ffmpeg "${ffmpegquiet[@]}" \
-i "${vclipfile}" \
-filter_complex "\
[0:v] fps=$fps, \
scale=$scale:-1, \
split [a][b], \
[a] palettegen [p], \
[b][p] paletteuse" \
"$output"; then
printf "\033[31mfailed running ffmpeg\033[0m\nre-running with -v may show why\n"
exit 1
fi
# we have a subtitle file downloaded from youtube
else
# if fontsize has been set, add a "force_style" with the specified font
# size
#
# https://www.ffmpeg.org/ffmpeg-filters.html#subtitles-1
force_style=
if [ -n "$custom_fontsize" ] && [ -n "$fontsize" ]; then
force_style=":force_style='FontSize=$fontsize'"
fi
# NOTE(review): the comment that used to sit here described passing -ss and
# the finish time twice so that ffmpeg normalizes the timestamps it uses for
# the subtitles. This command passes neither; the doubled options are on the
# ffmpeg call that creates $vclipfile (together with -copyts). Confirm that
# the subtitles still line up with the clip.
# see https://video.stackexchange.com/a/30046
#
# only the first matching subtitle file is used
if ! ffmpeg "${ffmpegquiet[@]}" \
-i "${vclipfile}" \
-filter_complex "\
[0:v] fps=$fps, \
scale=$scale:-1, \
split [a][b], \
[a] palettegen [p], \
[b][p] paletteuse, \
subtitles=${subtitles[0]}${force_style}" \
"$output"; then
printf "\033[31mfailed running ffmpeg\033[0m\nre-running with -v may show why\n"
exit 1
fi
fi
###########################
# Step 4: optimize the file if requested
###########################
# -gifsicle asks for the finished gif to be post-processed with `gifsicle -O2`
if [[ -n $gifsicle ]]; then
  gifsicle --batch -O2 "$output" || {
    printf "\033[31mfailed running gifsicle\033[0m\nre-running with -v may show why\n"
    exit 1
  }
fi

# tell the user where the result ended up
echo "created $output"