Spaces:
Runtime error
Update run.py
Browse files
run.py
CHANGED
|
@@ -26,6 +26,8 @@ def load_hf_dataset(dataset_path, auth_token):
|
|
| 26 |
|
| 27 |
def fast_caption(sys_prompt, usr_prompt, temp, top_p, max_tokens, model, key, endpoint, video_hf, video_hf_auth, parquet_index, video_od, video_od_auth, video_gd, video_gd_auth, frame_format, frame_limit):
|
| 28 |
progress_info = []
|
|
|
|
|
|
|
| 29 |
with tempfile.TemporaryDirectory() as temp_dir:
|
| 30 |
# temp_dir = '/opt/run'
|
| 31 |
csv_filename = os.path.join('/dev/shm', str(parquet_index).zfill(6) + '_gpt4o_caption.csv')
|
|
@@ -59,10 +61,8 @@ def fast_caption(sys_prompt, usr_prompt, temp, top_p, max_tokens, model, key, en
|
|
| 59 |
_chunk.append(_v.name)
|
| 60 |
md5 = hashlib.md5(binary).hexdigest()
|
| 61 |
|
| 62 |
-
processor = VideoProcessor(frame_format=frame_format, frame_limit=frame_limit)
|
| 63 |
frames = processor._decode(_v.name)
|
| 64 |
base64_list = processor.to_base64_list(frames)
|
| 65 |
-
api = AzureAPI(key=key, endpoint=endpoint, model=model, temp=temp, top_p=top_p, max_tokens=max_tokens)
|
| 66 |
caption = api.get_caption(sys_prompt, usr_prompt, base64_list)
|
| 67 |
writer.writerow({'md5': md5, 'caption': caption})
|
| 68 |
# writer.writerow({'md5': md5, 'caption': 'caption'})
|
|
|
|
| 26 |
|
| 27 |
def fast_caption(sys_prompt, usr_prompt, temp, top_p, max_tokens, model, key, endpoint, video_hf, video_hf_auth, parquet_index, video_od, video_od_auth, video_gd, video_gd_auth, frame_format, frame_limit):
|
| 28 |
progress_info = []
|
| 29 |
+
processor = VideoProcessor(frame_format=frame_format, frame_limit=frame_limit)
|
| 30 |
+
api = AzureAPI(key=key, endpoint=endpoint, model=model, temp=temp, top_p=top_p, max_tokens=max_tokens)
|
| 31 |
with tempfile.TemporaryDirectory() as temp_dir:
|
| 32 |
# temp_dir = '/opt/run'
|
| 33 |
csv_filename = os.path.join('/dev/shm', str(parquet_index).zfill(6) + '_gpt4o_caption.csv')
|
|
|
|
| 61 |
_chunk.append(_v.name)
|
| 62 |
md5 = hashlib.md5(binary).hexdigest()
|
| 63 |
|
|
|
|
| 64 |
frames = processor._decode(_v.name)
|
| 65 |
base64_list = processor.to_base64_list(frames)
|
|
|
|
| 66 |
caption = api.get_caption(sys_prompt, usr_prompt, base64_list)
|
| 67 |
writer.writerow({'md5': md5, 'caption': caption})
|
| 68 |
# writer.writerow({'md5': md5, 'caption': 'caption'})
|