diff --git a/README.md b/README.md index 885181f..1bfba1d 100644 --- a/README.md +++ b/README.md @@ -106,6 +106,24 @@ query = f'\n{text}' # text = 'Describe each image.' # query = '\n'.join([f'Image {i+1}: ' for i in range(len(images))]) + '\n' + text +## video input (requires `pip install moviepy==1.0.3`) +# from moviepy.editor import VideoFileClip +# video_path = '/data/videos/example_1.mp4' +# num_frames = 12 +# max_partition = 1 +# text = 'Describe the video.' +# with VideoFileClip(video_path) as clip: +# total_frames = int(clip.fps * clip.duration) +# if total_frames <= num_frames: +# sampled_indices = range(total_frames) +# else: +# stride = total_frames / num_frames +# sampled_indices = [min(total_frames - 1, int((stride * i + stride * (i + 1)) / 2)) for i in range(num_frames)] +# frames = [clip.get_frame(index / clip.fps) for index in sampled_indices] +# frames = [Image.fromarray(frame, mode='RGB') for frame in frames] +# images = frames +# query = '\n'.join([''] * len(images)) + '\n' + text + ## text-only input # images = [] # max_partition = None