We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent edb0c2c · commit 7bc7940 (Copy full SHA for 7bc7940)
1 file changed
lightx2v/shot_runner/rs2v_infer.py
@@ -213,10 +213,9 @@ def load_audio(audio_path, target_sr):
213
video_seg = gen_clip_video[:, :, :segment_actual_video_frames]
214
audio_seg = audio_clip[:, : segment_actual_video_frames * audio_per_frame].sum(dim=0)
215
else:
216
- video_pad_len = pad_len // audio_per_frame
217
- audio_pad_len = video_pad_len * audio_per_frame
218
- video_seg = gen_clip_video[:, :, : gen_clip_video.shape[2] - video_pad_len]
219
- audio_seg = audio_clip[:, : audio_clip.shape[1] - audio_pad_len].sum(dim=0)
+ video_seg = gen_clip_video
+ audio_seg = audio_clip.sum(dim=0)
+
220
clip_input_info.overlap_latent = gen_latents[:, -1:]
221
222
if clip_input_info.return_result_tensor or not clip_input_info.stream_save_video:
0 commit comments