Skip to content

Commit 7bc7940

Browse files
committed
refactor: Simplify video and audio segment handling in ShotRS2VPipeline by removing padding logic
1 parent edb0c2c commit 7bc7940

1 file changed

Lines changed: 3 additions & 4 deletions

File tree

lightx2v/shot_runner/rs2v_infer.py

Lines changed: 3 additions & 4 deletions
Original file line number | Diff line number | Diff line change
@@ -213,10 +213,9 @@ def load_audio(audio_path, target_sr):
213 213
video_seg = gen_clip_video[:, :, :segment_actual_video_frames]
214 214
audio_seg = audio_clip[:, : segment_actual_video_frames * audio_per_frame].sum(dim=0)
215 215
else:
216-
video_pad_len = pad_len // audio_per_frame
217-
audio_pad_len = video_pad_len * audio_per_frame
218-
video_seg = gen_clip_video[:, :, : gen_clip_video.shape[2] - video_pad_len]
219-
audio_seg = audio_clip[:, : audio_clip.shape[1] - audio_pad_len].sum(dim=0)
216+
video_seg = gen_clip_video
217+
audio_seg = audio_clip.sum(dim=0)
218+
220 219
clip_input_info.overlap_latent = gen_latents[:, -1:]
221 220

222 221
if clip_input_info.return_result_tensor or not clip_input_info.stream_save_video:

0 commit comments

Comments
 (0)