-
Notifications
You must be signed in to change notification settings - Fork 11
/
generateSlideshow.py
108 lines (88 loc) · 4.33 KB
/
generateSlideshow.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
from moviepy.editor import VideoFileClip, ImageSequenceClip, concatenate_videoclips, AudioFileClip, vfx
from pydub import AudioSegment
from PIL import Image, ImageDraw, ImageFont
import numpy as np
import os
import librosa
def create_endcard(num_memories, font_size=50, offset = 110):
input_image_path = rf'static{os.path.sep}images{os.path.sep}endCard_template.jpg'
output_image_path = rf'static{os.path.sep}images{os.path.sep}endCard.jpg'
text = str(num_memories) + " memories and counting..."
# Open the image
img = Image.open(input_image_path)
# Get the image dimensions
width, height = img.size
# Create a drawing object
draw = ImageDraw.Draw(img)
# Choose a font (you may need to provide the path to a font file)static\fonts\Inter-SemiBold.ttf
font = ImageFont.truetype(rf'static{os.path.sep}fonts{os.path.sep}Inter-SemiBold.ttf', font_size)
# Get the bounding box of the text
text_bbox = draw.textbbox((0, 0), text, font=font)
# Calculate the position to center the text
x = (width - text_bbox[2]) // 2
y = (height - text_bbox[3]) // 2 + offset
# Draw the text on the image
draw.text((x, y), text, font=font, fill="white")
# Save the modified image
img.save(output_image_path)
return(output_image_path)
def create_slideshow(input_folder, output_file, music_file, timestamps, mode = 'classic'):
image_files = sorted([f for f in os.listdir(input_folder) if f.endswith(('.png', '.jpg', '.jpeg', 'webp'))])
clips = []
print("image file count: " + str(len(image_files)))
print("beat count: " + str(len(timestamps)))
# Check if timestamps has fewer values than imagefiles
img_file_count = len(image_files)
beat_count = len(timestamps)
if len(timestamps) < len(image_files):
# Adjust the length of timestamps by repeating its elements
timestamps += timestamps[:len(image_files) - len(timestamps)]
print("image file count: " + str(len(image_files)))
print("beat count: " + str(len(timestamps)))
for image_file, timestamp in zip(image_files, timestamps):
image_path = os.path.join(input_folder, image_file)
clip = ImageSequenceClip([image_path], fps=1 / timestamp)
clips.append(clip)
print("appended clip: ", image_path)
endcard_img_path = create_endcard(len(image_files))
endcard_clip = ImageSequenceClip([endcard_img_path], fps=1/3)
clips.append(endcard_clip)
final_clip = concatenate_videoclips(clips, method="compose")
if mode == 'classic':
print("clipping video to classic mode")
final_clip = final_clip.fx(vfx.accel_decel, new_duration = 30)
music = AudioFileClip(music_file)
# Pad the audio with silence if it's shorter than the final clip
if music.duration < final_clip.duration:
print("music is shorter than final clip, will be padded with silence")
#silence_duration = final_clip.duration - music.duration
#silence = AudioSegment.silent(duration=silence_duration * 1000) # Duration in milliseconds
#music += silence # Concatenate silence and audio
else:
print("music is longer than final clip, clipping")
music = music.subclip(0, final_clip.duration)
music = music.audio_fadeout(3)
#print("Video Duration = ", final_clip.duration)
#print("Music Duration = ", music_processed.duration)
final_clip = final_clip.set_audio(music)
final_clip.write_videofile(output_file, codec="libx264", audio_codec="aac", threads = 6, fps=24)
def convert_to_durations(timestamps):
durations = []
# Calculate durations between consecutive timestamps
for i in range(1, len(timestamps)):
duration = timestamps[i] - timestamps[i - 1]
durations.append(duration)
return durations
def buildSlideshow(mode = 'classic'):
music = os.path.join(os.getcwd(), "curr_song.wav")
print("loading music from ", music)
audio_file = librosa.load(music)
y, sr = audio_file
tempo, beat_frames = librosa.beat.beat_track(y=y, sr=sr)
beat_times_raw = librosa.frames_to_time(beat_frames,sr=sr)
beat_times = [float(value) for value in beat_times_raw]
beat_times = convert_to_durations(beat_times)
print(beat_times)
input_folder = os.path.join(os.getcwd(), 'combined')
output_file = "static/slideshow_test.mp4"
create_slideshow(input_folder, output_file, music, beat_times, mode)