diff --git a/ms-swift/silence_overlaps/only_overlap/.ipynb_checkpoints/overlap5s_isoverlap_train-checkpoint.json b/ms-swift/silence_overlaps/only_overlap/.ipynb_checkpoints/overlap5s_isoverlap_train-checkpoint.json new file mode 100644 index 0000000000000000000000000000000000000000..5aa2e4b4a35d1b8aafa37dbd5b07255db7d0b585 --- /dev/null +++ b/ms-swift/silence_overlaps/only_overlap/.ipynb_checkpoints/overlap5s_isoverlap_train-checkpoint.json @@ -0,0 +1,3522 @@ +[ + { + "key": "SODA_PROCESSED--train--69960", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--69960.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--500115", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--500115.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:25" + }, + { + "key": "SODA_PROCESSED--train--706051", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--706051.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:09" + }, + { + "key": "SODA_PROCESSED--train--868975", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--868975.wav", + "model_output": "Multiple speakers talk simultaneously from 00:22-00:28" + }, + { + "key": "SODA_PROCESSED--train--1149932", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1149932.wav", + "model_output": "Multiple speakers talk simultaneously from 00:28-00:34" + }, + { + "key": "SODA_PROCESSED--train--449689", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--449689.wav", + "model_output": "Multiple speakers talk simultaneously from 00:37-00:44" + }, + { + "key": "SODA_PROCESSED--train--245101", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--245101.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--12047", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--12047.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--640494", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--640494.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:15" + }, + { + "key": "SODA_PROCESSED--train--787791", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--787791.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--290375", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--290375.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:10" + }, + { + "key": "SODA_PROCESSED--train--374749", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--374749.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:20" + }, + { + "key": "SODA_PROCESSED--train--56287", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--56287.wav", + "model_output": "Multiple speakers talk simultaneously from 00:33-00:38" + }, + { + "key": "SODA_PROCESSED--train--497264", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--497264.wav", + "model_output": "Multiple speakers talk simultaneously from 00:20-00:27" + }, + { + "key": "SODA_PROCESSED--train--484021", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--484021.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:24" + }, + { + "key": "SODA_PROCESSED--train--583537", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--583537.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1097575", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1097575.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:25" + }, + { + "key": "SODA_PROCESSED--train--403051", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--403051.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--960193", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--960193.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--771154", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--771154.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--137471", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--137471.wav", + "model_output": "Multiple speakers talk simultaneously from 00:52-00:58" + }, + { + "key": "SODA_PROCESSED--train--575640", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--575640.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:12" + }, + { + "key": "SODA_PROCESSED--train--89079", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--89079.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--844892", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--844892.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:18" + }, + { + "key": "SODA_PROCESSED--train--737726", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--737726.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--867206", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--867206.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:20" + }, + { + "key": "SODA_PROCESSED--train--810624", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--810624.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:21" + }, + { + "key": "SODA_PROCESSED--train--748043", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--748043.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--610118", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--610118.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--964867", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--964867.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:23" + }, + { + "key": "SODA_PROCESSED--train--189460", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--189460.wav", + "model_output": "Multiple speakers talk simultaneously from 00:30-00:34" + }, + { + "key": "SODA_PROCESSED--train--277828", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--277828.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--115967", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--115967.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--1084325", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1084325.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--536240", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--536240.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:12" + }, + { + "key": "SODA_PROCESSED--train--370577", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--370577.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:17" + }, + { + "key": "SODA_PROCESSED--train--1087984", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1087984.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--489920", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--489920.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--1168213", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1168213.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--845126", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--845126.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:27" + }, + { + "key": "SODA_PROCESSED--train--338555", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--338555.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--934782", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--934782.wav", + "model_output": "Multiple speakers talk simultaneously from 00:45-00:56" + }, + { + "key": "SODA_PROCESSED--train--546350", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--546350.wav", + "model_output": "Multiple speakers talk simultaneously from 00:02-00:07" + }, + { + "key": "SODA_PROCESSED--train--1132437", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1132437.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--82144", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--82144.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--96343", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--96343.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--102351", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--102351.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:10" + }, + { + "key": "SODA_PROCESSED--train--742899", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--742899.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--501206", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--501206.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--680740", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--680740.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:21" + }, + { + "key": "SODA_PROCESSED--train--1128813", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1128813.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--1794", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1794.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:18" + }, + { + "key": "SODA_PROCESSED--train--211161", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--211161.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:21" + }, + { + "key": "SODA_PROCESSED--train--1120331", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1120331.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--413405", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--413405.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--583204", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--583204.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--486716", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--486716.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:14" + }, + { + "key": "SODA_PROCESSED--train--806479", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--806479.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--126313", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--126313.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:10" + }, + { + "key": "SODA_PROCESSED--train--1171436", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1171436.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--674707", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--674707.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:22" + }, + { + "key": "SODA_PROCESSED--train--1047480", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1047480.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:21" + }, + { + "key": "SODA_PROCESSED--train--649949", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--649949.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--489519", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--489519.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--1080121", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1080121.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:21" + }, + { + "key": "SODA_PROCESSED--train--730163", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--730163.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:12" + }, + { + "key": "SODA_PROCESSED--train--775640", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--775640.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--403013", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--403013.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--468603", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--468603.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--834165", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--834165.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:18" + }, + { + "key": "SODA_PROCESSED--train--691830", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--691830.wav", + "model_output": "Multiple speakers talk simultaneously from 00:24-00:29" + }, + { + "key": "SODA_PROCESSED--train--115322", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--115322.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--805432", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--805432.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--906513", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--906513.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:22" + }, + { + "key": "SODA_PROCESSED--train--162201", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--162201.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--121129", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--121129.wav", + "model_output": "Multiple speakers talk simultaneously from 00:26-00:33" + }, + { + "key": "SODA_PROCESSED--train--47850", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--47850.wav", + "model_output": "Multiple speakers talk simultaneously from 00:32-00:39" + }, + { + "key": "SODA_PROCESSED--train--931585", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--931585.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--978945", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--978945.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--13635", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--13635.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:27" + }, + { + "key": "SODA_PROCESSED--train--1080787", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1080787.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:18" + }, + { + "key": "SODA_PROCESSED--train--860269", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--860269.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--265976", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--265976.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:20" + }, + { + "key": "SODA_PROCESSED--train--1106201", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1106201.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:21" + }, + { + "key": "SODA_PROCESSED--train--525710", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--525710.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--671614", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--671614.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--1017701", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1017701.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--1122880", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1122880.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--1151383", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1151383.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:22" + }, + { + "key": "SODA_PROCESSED--train--1180469", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1180469.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--615914", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--615914.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--992151", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--992151.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--150383", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--150383.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--303336", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--303336.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:21" + }, + { + "key": "SODA_PROCESSED--train--946489", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--946489.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:17" + }, + { + "key": "SODA_PROCESSED--train--725089", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--725089.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--809183", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--809183.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:09" + }, + { + "key": "SODA_PROCESSED--train--375003", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--375003.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:09" + }, + { + "key": "SODA_PROCESSED--train--1076439", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1076439.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:07" + }, + { + "key": "SODA_PROCESSED--train--162106", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--162106.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--766234", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--766234.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--185307", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--185307.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--146504", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--146504.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--932676", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--932676.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--242753", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--242753.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:23" + }, + { + "key": "SODA_PROCESSED--train--686928", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--686928.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:28" + }, + { + "key": "SODA_PROCESSED--train--321447", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--321447.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:22" + }, + { + "key": "SODA_PROCESSED--train--942720", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--942720.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:21" + }, + { + "key": "SODA_PROCESSED--train--1020192", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1020192.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--735517", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--735517.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--421778", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--421778.wav", + "model_output": "Multiple speakers talk simultaneously from 00:51-01:00" + }, + { + "key": "SODA_PROCESSED--train--556060", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--556060.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--578986", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--578986.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--637306", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--637306.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--397434", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--397434.wav", + "model_output": "Multiple speakers talk simultaneously from 00:02-00:07" + }, + { + "key": "SODA_PROCESSED--train--636981", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--636981.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:17" + }, + { + "key": "SODA_PROCESSED--train--1083511", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1083511.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--328835", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--328835.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--677647", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--677647.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:22" + }, + { + "key": "SODA_PROCESSED--train--734147", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--734147.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:26" + }, + { + "key": "SODA_PROCESSED--train--231222", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--231222.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:13" + }, + { + "key": "SODA_PROCESSED--train--708040", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--708040.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--1059254", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1059254.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--852467", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--852467.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--819618", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--819618.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--65367", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--65367.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--541347", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--541347.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--994948", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--994948.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--1049130", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1049130.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--991838", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--991838.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:12" + }, + { + "key": "SODA_PROCESSED--train--1070688", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1070688.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--385362", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--385362.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:21" + }, + { + "key": "SODA_PROCESSED--train--934119", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--934119.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--31287", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--31287.wav", + "model_output": "Multiple speakers talk simultaneously from 00:31-00:37" + }, + { + "key": "SODA_PROCESSED--train--1073790", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1073790.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--1066203", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1066203.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--895260", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--895260.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--596356", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--596356.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--385591", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--385591.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--481276", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--481276.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--304811", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--304811.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--692789", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--692789.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:18" + }, + { + "key": "SODA_PROCESSED--train--41116", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--41116.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--58199", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--58199.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:25" + }, + { + "key": "SODA_PROCESSED--train--951661", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--951661.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:09" + }, + { + "key": "SODA_PROCESSED--train--181032", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--181032.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--58019", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--58019.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--90720", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--90720.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--389182", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--389182.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:12" + }, + { + "key": "SODA_PROCESSED--train--315768", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--315768.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:17" + }, + { + "key": "SODA_PROCESSED--train--860576", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--860576.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:17" + }, + { + "key": "SODA_PROCESSED--train--649458", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--649458.wav", + "model_output": "Multiple speakers talk simultaneously from 00:20-00:27" + }, + { + "key": "SODA_PROCESSED--train--1117467", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1117467.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--967919", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--967919.wav", + "model_output": "Multiple speakers talk simultaneously from 00:29-00:34" + }, + { + "key": "SODA_PROCESSED--train--154340", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--154340.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:26" + }, + { + "key": "SODA_PROCESSED--train--105890", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--105890.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:20" + }, + { + "key": "SODA_PROCESSED--train--660884", + 
"audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--660884.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--1020087", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1020087.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:13" + }, + { + "key": "SODA_PROCESSED--train--604161", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--604161.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--674832", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--674832.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--672051", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--672051.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--1011922", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1011922.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:18" + }, + { + "key": "SODA_PROCESSED--train--228608", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--228608.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:23" + }, + { + "key": "SODA_PROCESSED--train--943593", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--943593.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:25" + }, + { + "key": "SODA_PROCESSED--train--1130331", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1130331.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--1188975", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1188975.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--27446", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--27446.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:23" + }, + { + "key": "SODA_PROCESSED--train--748822", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--748822.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--221358", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--221358.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--1182464", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1182464.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--720445", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--720445.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:17" + }, + { + "key": "SODA_PROCESSED--train--206574", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--206574.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:22" + }, + { + "key": "SODA_PROCESSED--train--1174912", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1174912.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:17" + }, + { + "key": "SODA_PROCESSED--train--609826", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--609826.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--781246", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--781246.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--876226", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--876226.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--187120", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--187120.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--287169", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--287169.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--49462", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--49462.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--29858", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--29858.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--371354", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--371354.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:18" + }, + { + "key": "SODA_PROCESSED--train--28766", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--28766.wav", + "model_output": "Multiple speakers talk simultaneously from 00:27-00:32" + }, + { + "key": "SODA_PROCESSED--train--596349", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--596349.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--596068", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--596068.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--366333", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--366333.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--717045", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--717045.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--4948", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--4948.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--835488", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--835488.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:10" + }, + { + "key": "SODA_PROCESSED--train--466262", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--466262.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--535368", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--535368.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--831005", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--831005.wav", + "model_output": "Multiple speakers talk simultaneously from 00:33-00:41" + }, + { + "key": "SODA_PROCESSED--train--419812", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--419812.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--674667", + 
"audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--674667.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--731416", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--731416.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:17" + }, + { + "key": "SODA_PROCESSED--train--341205", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--341205.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:20" + }, + { + "key": "SODA_PROCESSED--train--962013", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--962013.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:17" + }, + { + "key": "SODA_PROCESSED--train--338268", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--338268.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--923496", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--923496.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:18" + }, + { + "key": "SODA_PROCESSED--train--263928", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--263928.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:18" + }, + { + "key": "SODA_PROCESSED--train--179972", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--179972.wav", + "model_output": "Multiple speakers talk simultaneously from 00:29-00:36" + }, + { + "key": "SODA_PROCESSED--train--1050427", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1050427.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--406352", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--406352.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:11" + }, + { + "key": "SODA_PROCESSED--train--791383", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--791383.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--604536", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--604536.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:22" + }, + { + "key": "SODA_PROCESSED--train--984123", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--984123.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:22" + }, + { + "key": "SODA_PROCESSED--train--690063", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--690063.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:12" + }, + { + "key": "SODA_PROCESSED--train--201044", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--201044.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:15" + }, + { + "key": "SODA_PROCESSED--train--565509", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--565509.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--1123711", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1123711.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:07" + }, + { + "key": "SODA_PROCESSED--train--322914", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--322914.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:16" + }, + { + "key": "SODA_PROCESSED--train--679971", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--679971.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:21" + }, + { + "key": "SODA_PROCESSED--train--334612", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--334612.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--316554", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--316554.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:22" + }, + { + "key": "SODA_PROCESSED--train--511668", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--511668.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:27" + }, + { + "key": "SODA_PROCESSED--train--526278", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--526278.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:10" + }, + { + "key": "SODA_PROCESSED--train--821468", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--821468.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--412543", + 
"audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--412543.wav", + "model_output": "Multiple speakers talk simultaneously from 00:26-00:35" + }, + { + "key": "SODA_PROCESSED--train--1010433", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1010433.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:29" + }, + { + "key": "SODA_PROCESSED--train--299895", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--299895.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--645254", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--645254.wav", + "model_output": "Multiple speakers talk simultaneously from 00:30-00:34" + }, + { + "key": "SODA_PROCESSED--train--677446", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--677446.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1107765", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1107765.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--346041", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--346041.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--1146016", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1146016.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--1123691", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1123691.wav", + "model_output": "Multiple speakers talk simultaneously from 00:24-00:32" + }, + { + "key": "SODA_PROCESSED--train--205413", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--205413.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--69581", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--69581.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--435477", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--435477.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--716169", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--716169.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:22" + }, + { + "key": "SODA_PROCESSED--train--1113559", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1113559.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--873625", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--873625.wav", + "model_output": "Multiple speakers talk simultaneously from 00:45-00:52" + }, + { + "key": "SODA_PROCESSED--train--1087723", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1087723.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--606362", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--606362.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--559369", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--559369.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--115102", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--115102.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:15" + }, + { + "key": "SODA_PROCESSED--train--805520", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--805520.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--180962", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--180962.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:18" + }, + { + "key": "SODA_PROCESSED--train--249372", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--249372.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--824468", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--824468.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--1175954", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1175954.wav", + "model_output": "Multiple speakers talk simultaneously from 00:02-00:07" + }, + { + "key": "SODA_PROCESSED--train--571406", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--571406.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--439119", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--439119.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--1051467", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1051467.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:16" + }, + { + "key": "SODA_PROCESSED--train--1140564", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1140564.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--619961", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--619961.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--41123", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--41123.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--928982", 
+ "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--928982.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--142496", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--142496.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--616846", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--616846.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--1079940", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1079940.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--896752", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--896752.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:13" + }, + { + "key": "SODA_PROCESSED--train--233660", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--233660.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--564472", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--564472.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--977126", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--977126.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:24" + }, + { + "key": "SODA_PROCESSED--train--142004", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--142004.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:10" + }, + { + "key": "SODA_PROCESSED--train--1113674", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1113674.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:25" + }, + { + "key": "SODA_PROCESSED--train--16779", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--16779.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--98947", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--98947.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--1080342", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1080342.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--29039", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--29039.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:15" + }, + { + "key": "SODA_PROCESSED--train--488132", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--488132.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--650705", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--650705.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--562877", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--562877.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:24" + }, + { + "key": "SODA_PROCESSED--train--25283", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--25283.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--787888", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--787888.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1001071", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1001071.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--635774", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--635774.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:09" + }, + { + "key": "SODA_PROCESSED--train--282928", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--282928.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--463322", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--463322.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:22" + }, + { + "key": "SODA_PROCESSED--train--148115", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--148115.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:21" + }, + { + "key": "SODA_PROCESSED--train--746047", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--746047.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:25" + }, + { + "key": "SODA_PROCESSED--train--404560", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--404560.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--63072", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--63072.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--81191", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--81191.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:13" + }, + { + "key": "SODA_PROCESSED--train--905170", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--905170.wav", + "model_output": "Multiple speakers talk simultaneously from 00:25-00:32" + }, + { + "key": "SODA_PROCESSED--train--1108323", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1108323.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--188417", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--188417.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:21" + }, + { + "key": "SODA_PROCESSED--train--526216", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--526216.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:23" + }, + { + "key": "SODA_PROCESSED--train--276032", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--276032.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1030006", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1030006.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--953260", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--953260.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--241883", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--241883.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--186110", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--186110.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--828152", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--828152.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--1007617", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1007617.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:20" + }, + { + "key": "SODA_PROCESSED--train--254497", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--254497.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:14" + }, + { + "key": "SODA_PROCESSED--train--999278", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--999278.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--627283", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--627283.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:14" + }, + { + "key": "SODA_PROCESSED--train--217814", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--217814.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--352805", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--352805.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:20" + }, + { + "key": "SODA_PROCESSED--train--714054", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--714054.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--1004891", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1004891.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:28" + }, + { + "key": "SODA_PROCESSED--train--954404", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--954404.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:18" + }, + { + "key": "SODA_PROCESSED--train--32633", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--32633.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--715956", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--715956.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:16" + }, + { + "key": "SODA_PROCESSED--train--447088", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--447088.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:21" + }, + { + "key": "SODA_PROCESSED--train--846507", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--846507.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--840566", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--840566.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--22719", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--22719.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--727873", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--727873.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:15" + }, + { + "key": "SODA_PROCESSED--train--556475", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--556475.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--762740", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--762740.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--368483", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--368483.wav", + "model_output": "Multiple speakers talk simultaneously from 00:43-00:50" + }, + { + "key": "SODA_PROCESSED--train--921984", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--921984.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--813478", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--813478.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--158293", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--158293.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:13" + }, + { + "key": "SODA_PROCESSED--train--468879", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--468879.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:16" + }, + { + "key": "SODA_PROCESSED--train--277322", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--277322.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--57082", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--57082.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:09" + }, + { + "key": "SODA_PROCESSED--train--798455", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--798455.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--559292", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--559292.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:12" + }, + { + "key": "SODA_PROCESSED--train--990528", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--990528.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:19" + }, + { + "key": "SODA_PROCESSED--train--27924", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--27924.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--193968", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--193968.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--857144", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--857144.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:25" + }, + { + "key": "SODA_PROCESSED--train--776571", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--776571.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:10" + }, + { + "key": "SODA_PROCESSED--train--980776", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--980776.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:09" + }, + { + "key": "SODA_PROCESSED--train--188315", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--188315.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--471264", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--471264.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:15" + }, + { + "key": "SODA_PROCESSED--train--876910", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--876910.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--608672", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--608672.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--1084179", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1084179.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1101616", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1101616.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--233562", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--233562.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:19" + }, + { + "key": "SODA_PROCESSED--train--273875", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--273875.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--296467", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--296467.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--193891", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--193891.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:22" + }, + { + "key": "SODA_PROCESSED--train--986089", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--986089.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--39376", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--39376.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--316553", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--316553.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--630141", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--630141.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--531935", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--531935.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--690452", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--690452.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:26" + }, + { + "key": "SODA_PROCESSED--train--1052554", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1052554.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--538365", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--538365.wav", + 
"model_output": "Multiple speakers talk simultaneously from 00:18-00:25" + }, + { + "key": "SODA_PROCESSED--train--7207", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--7207.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--729972", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--729972.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:17" + }, + { + "key": "SODA_PROCESSED--train--966021", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--966021.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--514047", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--514047.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:23" + }, + { + "key": "SODA_PROCESSED--train--891432", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--891432.wav", + "model_output": "Multiple speakers talk simultaneously from 00:02-00:07" + }, + { + "key": "SODA_PROCESSED--train--465565", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--465565.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:22" + }, + { + "key": "SODA_PROCESSED--train--208819", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--208819.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:14" + }, + { + "key": "SODA_PROCESSED--train--903126", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--903126.wav", + "model_output": "Multiple speakers talk simultaneously from 
00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--719833", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--719833.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--514230", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--514230.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--297496", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--297496.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--713730", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--713730.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--271652", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--271652.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--456190", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--456190.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:19" + }, + { + "key": "SODA_PROCESSED--train--778927", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--778927.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--391765", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--391765.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:20" + }, + { + "key": 
"SODA_PROCESSED--train--905725", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--905725.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--571413", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--571413.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:22" + }, + { + "key": "SODA_PROCESSED--train--120698", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--120698.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--655306", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--655306.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:28" + }, + { + "key": "SODA_PROCESSED--train--8155", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--8155.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--957212", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--957212.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--477747", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--477747.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:13" + }, + { + "key": "SODA_PROCESSED--train--115625", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--115625.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--1177869", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1177869.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:18" + }, + { + "key": "SODA_PROCESSED--train--1051089", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1051089.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:30" + }, + { + "key": "SODA_PROCESSED--train--1169363", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1169363.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:10" + }, + { + "key": "SODA_PROCESSED--train--19531", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--19531.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:10" + }, + { + "key": "SODA_PROCESSED--train--156618", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--156618.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--769683", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--769683.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--1092370", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1092370.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:15" + }, + { + "key": "SODA_PROCESSED--train--778704", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--778704.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": 
"SODA_PROCESSED--train--908191", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--908191.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1112132", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1112132.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--417260", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--417260.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:15" + }, + { + "key": "SODA_PROCESSED--train--994009", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--994009.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--415948", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--415948.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:17" + }, + { + "key": "SODA_PROCESSED--train--30336", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--30336.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:07" + }, + { + "key": "SODA_PROCESSED--train--269886", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--269886.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:17" + }, + { + "key": "SODA_PROCESSED--train--49720", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--49720.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--82238", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--82238.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:22" + }, + { + "key": "SODA_PROCESSED--train--231370", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--231370.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:18" + }, + { + "key": "SODA_PROCESSED--train--277060", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--277060.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:07" + }, + { + "key": "SODA_PROCESSED--train--421624", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--421624.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--191104", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--191104.wav", + "model_output": "Multiple speakers talk simultaneously from 00:38-00:41" + }, + { + "key": "SODA_PROCESSED--train--262975", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--262975.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--104948", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--104948.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--475793", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--475793.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--1129671", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1129671.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--803822", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--803822.wav", + "model_output": "Multiple speakers talk simultaneously from 00:24-00:30" + }, + { + "key": "SODA_PROCESSED--train--638647", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--638647.wav", + "model_output": "Multiple speakers talk simultaneously from 00:59-01:05" + }, + { + "key": "SODA_PROCESSED--train--460378", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--460378.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:10" + }, + { + "key": "SODA_PROCESSED--train--98281", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--98281.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--590679", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--590679.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:22" + }, + { + "key": "SODA_PROCESSED--train--449068", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--449068.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:25" + }, + { + "key": "SODA_PROCESSED--train--581770", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--581770.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--437038", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--437038.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:10" + }, + { + "key": "SODA_PROCESSED--train--1076109", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1076109.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:27" + }, + { + "key": "SODA_PROCESSED--train--132857", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--132857.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--1041859", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1041859.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:23" + }, + { + "key": "SODA_PROCESSED--train--580598", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--580598.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--43736", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--43736.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:20" + }, + { + "key": "SODA_PROCESSED--train--12295", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--12295.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:20" + }, + { + "key": "SODA_PROCESSED--train--84371", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--84371.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--40901", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--40901.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:22" + }, + { + "key": "SODA_PROCESSED--train--811940", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--811940.wav", + "model_output": "Multiple speakers talk simultaneously from 00:20-00:25" + }, + { + "key": "SODA_PROCESSED--train--698246", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--698246.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:22" + }, + { + "key": "SODA_PROCESSED--train--1188579", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1188579.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--752118", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--752118.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:13" + }, + { + "key": "SODA_PROCESSED--train--251891", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--251891.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--601727", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--601727.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--437704", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--437704.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:20" + }, + { + "key": "SODA_PROCESSED--train--938056", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--938056.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--952835", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--952835.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--648176", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--648176.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--311173", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--311173.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--24058", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--24058.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:16" + }, + { + "key": "SODA_PROCESSED--train--220023", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--220023.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--475039", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--475039.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:16" + }, + { + "key": "SODA_PROCESSED--train--875462", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--875462.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:28" + }, + { + "key": "SODA_PROCESSED--train--156744", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--156744.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--471036", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--471036.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--82370", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--82370.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--538753", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--538753.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:11" + }, + { + "key": "SODA_PROCESSED--train--520823", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--520823.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--933257", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--933257.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:24" + }, + { + "key": "SODA_PROCESSED--train--494198", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--494198.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--33171", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--33171.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:15" + }, + { + "key": "SODA_PROCESSED--train--631363", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--631363.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--246434", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--246434.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--420707", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--420707.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:18" + }, + { + "key": "SODA_PROCESSED--train--104984", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--104984.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:18" + }, + { + "key": "SODA_PROCESSED--train--324306", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--324306.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--1180329", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1180329.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--8820", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--8820.wav", + "model_output": "Multiple speakers talk simultaneously from 00:20-00:27" + }, + { + "key": "SODA_PROCESSED--train--578559", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--578559.wav", + "model_output": "Multiple speakers talk simultaneously from 00:55-01:07" + }, + { + "key": "SODA_PROCESSED--train--76363", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--76363.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--872171", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--872171.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:20" + }, + { + "key": "SODA_PROCESSED--train--761001", + 
"audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--761001.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:10" + }, + { + "key": "SODA_PROCESSED--train--927063", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--927063.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--431708", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--431708.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--244490", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--244490.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:23" + }, + { + "key": "SODA_PROCESSED--train--1186756", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1186756.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:10" + }, + { + "key": "SODA_PROCESSED--train--338832", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--338832.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--1050100", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1050100.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:07" + }, + { + "key": "SODA_PROCESSED--train--566903", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--566903.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:12" + }, + { + "key": "SODA_PROCESSED--train--258235", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--258235.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--412246", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--412246.wav", + "model_output": "Multiple speakers talk simultaneously from 00:27-00:32" + }, + { + "key": "SODA_PROCESSED--train--860535", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--860535.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:22" + }, + { + "key": "SODA_PROCESSED--train--584031", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--584031.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:15" + }, + { + "key": "SODA_PROCESSED--train--925277", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--925277.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--243573", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--243573.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--633173", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--633173.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--1088159", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1088159.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:18" + }, + { + "key": "SODA_PROCESSED--train--706924", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--706924.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:24" + }, + { + "key": "SODA_PROCESSED--train--1166623", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1166623.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--366989", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--366989.wav", + "model_output": "Multiple speakers talk simultaneously from 00:36-00:40" + }, + { + "key": "SODA_PROCESSED--train--153751", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--153751.wav", + "model_output": "Multiple speakers talk simultaneously from 00:28-00:34" + }, + { + "key": "SODA_PROCESSED--train--101351", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--101351.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:14" + }, + { + "key": "SODA_PROCESSED--train--514225", 
+ "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--514225.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:20" + }, + { + "key": "SODA_PROCESSED--train--194829", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--194829.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:09" + }, + { + "key": "SODA_PROCESSED--train--1085362", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1085362.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--419304", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--419304.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--207527", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--207527.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--1131334", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1131334.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:15" + }, + { + "key": "SODA_PROCESSED--train--214477", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--214477.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:22" + }, + { + "key": "SODA_PROCESSED--train--203528", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--203528.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--1010589", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1010589.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--956648", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--956648.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--559740", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--559740.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--603030", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--603030.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:19" + }, + { + "key": "SODA_PROCESSED--train--934138", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--934138.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:17" + }, + { + "key": "SODA_PROCESSED--train--387024", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--387024.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:08" + }, + { + "key": "SODA_PROCESSED--train--44625", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--44625.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--833014", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--833014.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--243315", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--243315.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--108309", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--108309.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--595180", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--595180.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:20" + }, + { + "key": "SODA_PROCESSED--train--556505", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--556505.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:25" + }, + { + "key": "SODA_PROCESSED--train--727552", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--727552.wav", + "model_output": "Multiple speakers talk simultaneously from 00:34-00:39" + }, + { + "key": "SODA_PROCESSED--train--524306", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--524306.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:20" + }, + { + "key": "SODA_PROCESSED--train--762905", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--762905.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:22" + }, + { + "key": "SODA_PROCESSED--train--757426", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--757426.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:15" + }, + { + "key": "SODA_PROCESSED--train--935998", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--935998.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--179376", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--179376.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--951487", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--951487.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:10" + }, + { + "key": "SODA_PROCESSED--train--289733", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--289733.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:14" + }, + { + "key": "SODA_PROCESSED--train--676747", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--676747.wav", + "model_output": "Multiple speakers talk simultaneously from 00:24-00:28" + }, + { + "key": "SODA_PROCESSED--train--974933", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--974933.wav", + "model_output": "Multiple speakers talk simultaneously from 00:25-00:33" + }, + { + "key": "SODA_PROCESSED--train--1074077", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1074077.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:15" + }, + { + "key": "SODA_PROCESSED--train--740576", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--740576.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--413649", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--413649.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:21" + }, + { + "key": "SODA_PROCESSED--train--209436", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--209436.wav", + "model_output": "Multiple speakers talk simultaneously from 00:36-00:44" + }, + { + "key": "SODA_PROCESSED--train--1028263", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1028263.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:18" + }, + { + "key": "SODA_PROCESSED--train--1574", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1574.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:22" + }, + { + "key": "SODA_PROCESSED--train--977434", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--977434.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--1096861", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1096861.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--1029082", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1029082.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--1020068", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1020068.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--937978", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--937978.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:27" + }, + { + "key": "SODA_PROCESSED--train--985415", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--985415.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--476626", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--476626.wav", + "model_output": "Multiple speakers talk simultaneously from 00:40-00:45" + }, + { + "key": "SODA_PROCESSED--train--1022590", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1022590.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--153526", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--153526.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:22" + }, + { + "key": "SODA_PROCESSED--train--560596", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--560596.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--41171", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--41171.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--926731", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--926731.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:10" + }, + { + "key": "SODA_PROCESSED--train--15103", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--15103.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:17" + }, + { + "key": "SODA_PROCESSED--train--1124666", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1124666.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--737676", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--737676.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--682132", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--682132.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:13" + }, + { + "key": "SODA_PROCESSED--train--310941", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--310941.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--617278", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--617278.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:20" + }, + { + "key": "SODA_PROCESSED--train--836018", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--836018.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--894199", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--894199.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--218746", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--218746.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:22" + }, + { + "key": "SODA_PROCESSED--train--218634", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--218634.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:10" + }, + { + "key": "SODA_PROCESSED--train--508884", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--508884.wav", + "model_output": "Multiple speakers talk simultaneously from 00:30-00:37" + }, + { + "key": "SODA_PROCESSED--train--667784", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--667784.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--700208", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--700208.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--767328", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--767328.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--571155", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--571155.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--633328", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--633328.wav", + "model_output": "Multiple speakers talk simultaneously from 00:24-00:32" + }, + { + "key": "SODA_PROCESSED--train--1001007", + 
"audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1001007.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:09" + }, + { + "key": "SODA_PROCESSED--train--843172", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--843172.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:10" + }, + { + "key": "SODA_PROCESSED--train--100933", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--100933.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--883174", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--883174.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:25" + }, + { + "key": "SODA_PROCESSED--train--252183", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--252183.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:22" + }, + { + "key": "SODA_PROCESSED--train--634390", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--634390.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--1031234", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1031234.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--876642", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--876642.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:15" + }, + { + "key": "SODA_PROCESSED--train--55746", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--55746.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--171463", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--171463.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--159893", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--159893.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--535550", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--535550.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:21" + }, + { + "key": "SODA_PROCESSED--train--237231", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--237231.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--1185164", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1185164.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--719372", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--719372.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--726133", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--726133.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--730476", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--730476.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:16" + }, + { + "key": "SODA_PROCESSED--train--1025535", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1025535.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:15, 00:42-00:47" + }, + { + "key": "SODA_PROCESSED--train--302394", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--302394.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--967872", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--967872.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--356688", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--356688.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--169891", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--169891.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--486837", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--486837.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:28" + }, + { + "key": "SODA_PROCESSED--train--1104244", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1104244.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:15" + }, + { + "key": "SODA_PROCESSED--train--760966", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--760966.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:23" + }, + { + "key": "SODA_PROCESSED--train--453454", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--453454.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1031152", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1031152.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--1097788", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1097788.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--532492", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--532492.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:25" + }, + { + "key": "SODA_PROCESSED--train--331396", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--331396.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--330048", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--330048.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:17" + }, + { + "key": "SODA_PROCESSED--train--1095086", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1095086.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:14" + }, + { + "key": "SODA_PROCESSED--train--286623", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--286623.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--295395", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--295395.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--302689", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--302689.wav", + "model_output": "Multiple speakers talk simultaneously from 00:30-00:35" + }, + { + "key": "SODA_PROCESSED--train--826028", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--826028.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--179580", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--179580.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:09" + }, + { + "key": "SODA_PROCESSED--train--219689", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--219689.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:17" + }, + { + "key": "SODA_PROCESSED--train--4955", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--4955.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--1007416", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1007416.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--28408", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--28408.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:25" + }, + { + "key": "SODA_PROCESSED--train--888611", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--888611.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--1013581", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1013581.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--472748", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--472748.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:19" + }, + { + "key": "SODA_PROCESSED--train--473100", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--473100.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:22" + }, + { + "key": "SODA_PROCESSED--train--1022129", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1022129.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--285043", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--285043.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--168398", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--168398.wav", + "model_output": "Multiple speakers talk simultaneously from 00:49-00:59" + }, + { + "key": "SODA_PROCESSED--train--774546", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--774546.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--1055385", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1055385.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--42187", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--42187.wav", + "model_output": "Multiple speakers talk simultaneously from 00:01-00:08" + }, + { + "key": "SODA_PROCESSED--train--125527", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--125527.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--419679", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--419679.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--193134", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--193134.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--903704", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--903704.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--848051", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--848051.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:11" + }, + { + "key": "SODA_PROCESSED--train--797399", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--797399.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--1050248", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1050248.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--810606", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--810606.wav", + "model_output": "Multiple speakers talk simultaneously from 00:43-00:51" + }, + { + "key": "SODA_PROCESSED--train--420178", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--420178.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:25" + }, + { + "key": "SODA_PROCESSED--train--748077", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--748077.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:17" + }, + { + "key": "SODA_PROCESSED--train--911067", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--911067.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--901379", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--901379.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--144310", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--144310.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:11" + }, + { + "key": "SODA_PROCESSED--train--280675", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--280675.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--378283", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--378283.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:25" + }, + { + "key": "SODA_PROCESSED--train--187351", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--187351.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--327822", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--327822.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:19" + }, + { + "key": "SODA_PROCESSED--train--68508", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--68508.wav", + "model_output": "Multiple speakers talk simultaneously from 00:22-00:29" + }, + { + "key": "SODA_PROCESSED--train--609913", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--609913.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--258272", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--258272.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--662948", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--662948.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--140026", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--140026.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:12" + }, + { + "key": "SODA_PROCESSED--train--1131940", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1131940.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:22" + }, + { + "key": "SODA_PROCESSED--train--317784", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--317784.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:22" + }, + { + "key": "SODA_PROCESSED--train--109817", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--109817.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--588465", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--588465.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--126878", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--126878.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--770919", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--770919.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--73764", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--73764.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--605295", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--605295.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--258280", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--258280.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:10" + }, + { + "key": "SODA_PROCESSED--train--165189", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--165189.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:26" + }, + { + "key": "SODA_PROCESSED--train--70224", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--70224.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--708343", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--708343.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--214621", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--214621.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:17" + }, + { + "key": "SODA_PROCESSED--train--205208", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--205208.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--1142459", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1142459.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:22" + }, + { + "key": "SODA_PROCESSED--train--164800", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--164800.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:14" + }, + { + "key": "SODA_PROCESSED--train--76986", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--76986.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--940934", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--940934.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:14" + }, + { + "key": "SODA_PROCESSED--train--640525", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--640525.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:20" + }, + { + "key": "SODA_PROCESSED--train--869455", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--869455.wav", + "model_output": "Multiple speakers talk simultaneously from 00:42-00:51" + }, + { + "key": "SODA_PROCESSED--train--836452", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--836452.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--842885", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--842885.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--1182226", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1182226.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--456887", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--456887.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--118976", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--118976.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:19" + }, + { + "key": "SODA_PROCESSED--train--748910", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--748910.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--152375", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--152375.wav", + "model_output": "Multiple speakers talk simultaneously from 00:30-00:35" + }, + { + "key": "SODA_PROCESSED--train--815822", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--815822.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--766305", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--766305.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--65045", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--65045.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:23" + }, + { + "key": "SODA_PROCESSED--train--268426", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--268426.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--221517", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--221517.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--869501", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--869501.wav", + "model_output": "Multiple speakers talk simultaneously from 00:22-00:29" + }, + { + "key": "SODA_PROCESSED--train--718092", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--718092.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--201813", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--201813.wav", + "model_output": "Multiple speakers talk simultaneously from 00:48-00:55" + }, + { + "key": "SODA_PROCESSED--train--915430", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--915430.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:12" + }, + { + "key": "SODA_PROCESSED--train--1107341", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1107341.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:22" + }, + { + "key": "SODA_PROCESSED--train--903574", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--903574.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:09" + }, + { + "key": "SODA_PROCESSED--train--741600", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--741600.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:24" + }, + { + "key": "SODA_PROCESSED--train--836740", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--836740.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--463700", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--463700.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:15" + }, + { + "key": "SODA_PROCESSED--train--414445", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--414445.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--617839", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--617839.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--846418", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--846418.wav", + "model_output": "Multiple speakers talk simultaneously from 00:20-00:28" + }, + { + "key": "SODA_PROCESSED--train--11862", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--11862.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + }, + { + "key": "SODA_PROCESSED--train--146698", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--146698.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:07" + }, + { + "key": "SODA_PROCESSED--train--743500", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--743500.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:09" + }, + { + "key": "SODA_PROCESSED--train--185821", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--185821.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--585968", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--585968.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:14" + }, + { + "key": "SODA_PROCESSED--train--487317", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--487317.wav", + "model_output": "Multiple speakers talk simultaneously from 00:23-00:30" + }, + { + "key": "SODA_PROCESSED--train--545009", + 
"audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--545009.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--75062", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--75062.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:15" + }, + { + "key": "SODA_PROCESSED--train--343780", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--343780.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:14" + }, + { + "key": "SODA_PROCESSED--train--900948", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--900948.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:20" + }, + { + "key": "SODA_PROCESSED--train--1144076", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1144076.wav", + "model_output": "Multiple speakers talk simultaneously from 00:19-00:28" + }, + { + "key": "SODA_PROCESSED--train--719199", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--719199.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--78189", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--78189.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:21" + }, + { + "key": "SODA_PROCESSED--train--490986", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--490986.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--218430", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--218430.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:11" + }, + { + "key": "SODA_PROCESSED--train--782660", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--782660.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:21" + }, + { + "key": "SODA_PROCESSED--train--14913", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--14913.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:17" + }, + { + "key": "SODA_PROCESSED--train--861085", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--861085.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:21" + }, + { + "key": "SODA_PROCESSED--train--908444", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--908444.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:09" + }, + { + "key": "SODA_PROCESSED--train--1007774", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1007774.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:16" + }, + { + "key": "SODA_PROCESSED--train--399572", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--399572.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--930750", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--930750.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--4814", + 
"audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--4814.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--532510", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--532510.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:12" + }, + { + "key": "SODA_PROCESSED--train--61606", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--61606.wav", + "model_output": "No significant overlaps found." + }, + { + "key": "SODA_PROCESSED--train--303363", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--303363.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:17" + }, + { + "key": "SODA_PROCESSED--train--999053", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--999053.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--33760", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--33760.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:24" + }, + { + "key": "SODA_PROCESSED--train--226853", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--226853.wav", + "model_output": "Multiple speakers talk simultaneously from 00:13-00:18" + }, + { + "key": "SODA_PROCESSED--train--913166", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--913166.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:26" + }, + { + "key": "SODA_PROCESSED--train--795559", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--795559.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--933043", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--933043.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:15" + }, + { + "key": "SODA_PROCESSED--train--932576", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--932576.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:18" + }, + { + "key": "SODA_PROCESSED--train--775321", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--775321.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:13" + }, + { + "key": "SODA_PROCESSED--train--795181", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--795181.wav", + "model_output": "Multiple speakers talk simultaneously from 00:16-00:22" + }, + { + "key": "SODA_PROCESSED--train--1030451", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1030451.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--1023331", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1023331.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:26" + }, + { + "key": "SODA_PROCESSED--train--961025", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--961025.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:19" + }, + { + "key": "SODA_PROCESSED--train--962210", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--962210.wav", + "model_output": "Multiple speakers talk simultaneously from 00:14-00:20" + }, + { + "key": "SODA_PROCESSED--train--906269", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--906269.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:27" + }, + { + "key": "SODA_PROCESSED--train--385442", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--385442.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:11" + }, + { + "key": "SODA_PROCESSED--train--109428", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--109428.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--197137", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--197137.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:27" + }, + { + "key": "SODA_PROCESSED--train--523646", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--523646.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:08" + }, + { + "key": "SODA_PROCESSED--train--98673", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--98673.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:12" + }, + { + "key": "SODA_PROCESSED--train--317167", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--317167.wav", + "model_output": "Multiple speakers talk simultaneously from 00:04-00:07" + }, + { + "key": "SODA_PROCESSED--train--90368", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--90368.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:18" + }, + { + "key": "SODA_PROCESSED--train--20810", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--20810.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:10" + }, + { + "key": "SODA_PROCESSED--train--301485", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--301485.wav", + "model_output": "Multiple speakers talk simultaneously from 00:12-00:19" + }, + { + "key": "SODA_PROCESSED--train--372789", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--372789.wav", + "model_output": "Multiple speakers talk simultaneously from 00:03-00:08" + }, + { + "key": "SODA_PROCESSED--train--744708", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--744708.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--874990", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--874990.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--369090", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--369090.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--894939", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--894939.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--1186623", + "audio_url": 
"/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1186623.wav", + "model_output": "Multiple speakers talk simultaneously from 00:06-00:13" + }, + { + "key": "SODA_PROCESSED--train--1092169", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--1092169.wav", + "model_output": "Multiple speakers talk simultaneously from 00:18-00:23" + }, + { + "key": "SODA_PROCESSED--train--113543", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--113543.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:13" + }, + { + "key": "SODA_PROCESSED--train--888565", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--888565.wav", + "model_output": "Multiple speakers talk simultaneously from 00:11-00:16" + }, + { + "key": "SODA_PROCESSED--train--322068", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--322068.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:14" + }, + { + "key": "SODA_PROCESSED--train--970059", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--970059.wav", + "model_output": "Multiple speakers talk simultaneously from 00:09-00:13" + }, + { + "key": "SODA_PROCESSED--train--334902", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--334902.wav", + "model_output": "No significant overlaps found." 
+ }, + { + "key": "SODA_PROCESSED--train--152172", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--152172.wav", + "model_output": "Multiple speakers talk simultaneously from 00:10-00:16" + }, + { + "key": "SODA_PROCESSED--train--855653", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--855653.wav", + "model_output": "Multiple speakers talk simultaneously from 00:05-00:11" + }, + { + "key": "SODA_PROCESSED--train--202914", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--202914.wav", + "model_output": "Multiple speakers talk simultaneously from 00:07-00:16" + }, + { + "key": "SODA_PROCESSED--train--527126", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--527126.wav", + "model_output": "Multiple speakers talk simultaneously from 00:21-00:27" + }, + { + "key": "SODA_PROCESSED--train--480349", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--480349.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:11" + }, + { + "key": "SODA_PROCESSED--train--784738", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--784738.wav", + "model_output": "Multiple speakers talk simultaneously from 00:15-00:21" + }, + { + "key": "SODA_PROCESSED--train--418520", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--418520.wav", + "model_output": "Multiple speakers talk simultaneously from 00:17-00:23" + }, + { + "key": "SODA_PROCESSED--train--159547", + "audio_url": "/root/autodl-tmp/output_overlapslong/newoverlapjson/overlap5s700/SODA_PROCESSED--train--159547.wav", + "model_output": "Multiple speakers talk simultaneously from 00:08-00:13" + } +] \ No newline at end of file diff --git 
a/ms-swift/swift/tuners/__pycache__/lora.cpython-310.pyc b/ms-swift/swift/tuners/__pycache__/lora.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..9a84171d197e6e2b2939e5e82d99cb82d1d3881d Binary files /dev/null and b/ms-swift/swift/tuners/__pycache__/lora.cpython-310.pyc differ diff --git a/ms-swift/swift/tuners/__pycache__/mapping.cpython-310.pyc b/ms-swift/swift/tuners/__pycache__/mapping.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..8e525518b983fa4eb731f8aaf027ebe45f24cbc8 Binary files /dev/null and b/ms-swift/swift/tuners/__pycache__/mapping.cpython-310.pyc differ diff --git a/ms-swift/swift/tuners/__pycache__/part.cpython-310.pyc b/ms-swift/swift/tuners/__pycache__/part.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..95b0f18b0197792a6df6536f3195526013dff0b5 Binary files /dev/null and b/ms-swift/swift/tuners/__pycache__/part.cpython-310.pyc differ diff --git a/ms-swift/swift/tuners/__pycache__/restuning.cpython-310.pyc b/ms-swift/swift/tuners/__pycache__/restuning.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..099e3a469d2d1f9218c31e7d099c1841e7f6a034 Binary files /dev/null and b/ms-swift/swift/tuners/__pycache__/restuning.cpython-310.pyc differ diff --git a/ms-swift/swift/tuners/__pycache__/restuning_components.cpython-310.pyc b/ms-swift/swift/tuners/__pycache__/restuning_components.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..d6cecb67629246f39dd0443f9b84f20891bff238 Binary files /dev/null and b/ms-swift/swift/tuners/__pycache__/restuning_components.cpython-310.pyc differ diff --git a/ms-swift/swift/tuners/__pycache__/side.cpython-310.pyc b/ms-swift/swift/tuners/__pycache__/side.cpython-310.pyc new file mode 100644 index 0000000000000000000000000000000000000000..01bbb3202a3c31d85c27b67fa37703698402a1c9 Binary files /dev/null and 
# Copyright (c) Alibaba, Inc. and its affiliates.
import inspect
import re
import types
from dataclasses import dataclass, field
from typing import List, Union

import torch
from torch import nn
from transformers.activations import ACT2CLS

from swift.utils.torch_utils import find_sub_module, get_logger
from .utils import ActivationMixin, SwiftAdapter, SwiftConfig, SwiftOutput

logger = get_logger()


@dataclass
class AdapterConfig(SwiftConfig):
    """
    The configuration class for the adapter module.

    Adapters project input tokens by an MLP layer.
    'Parameter-Efficient Transfer Learning for NLP' by Houlsby et al.(2019)
    See http://arxiv.org/abs/1902.00751

    Args:
        dim(`int`): The dimension of the hidden states
        target_modules(`Union[str, List[str]]`): The feedforward module to be replaced.
            in regex format if this argument is str, else will match with `end with` if List[str].
        hidden_pos(`Union[str, int]`): The position of the hidden state to be passed into the adapter,
            can be int (args) or str (kwargs)
        method_name(`str`): The method to be replaced, default is `forward`
        adapter_length: The intermediate (bottleneck) width of the adapter
        act_layer: The activation layer of the adapter, used as a key into `ACT2CLS`
    """

    dim: int = field(default=None, metadata={'help': 'The dimension of the hidden states'})

    target_modules: Union[str, List[str]] = field(
        default=None,
        metadata={
            'help':
            'The feedforward module to be replaced. in regex format if this argument is str, '
            'else will match with `end with` if List[str].'
        })

    hidden_pos: Union[str, int] = field(
        default=None,
        metadata={
            'help': 'The position of the hidden state to be passed into the adapter, can be int (args) or str (kwargs)'
        })

    method_name: str = field(default='forward', metadata={'help': 'The method to be replaced, default is `forward`'})

    adapter_length: int = field(
        default=128, metadata={'help': 'The length of the adapter length (intermediate length)'})

    act_layer: str = field(default='gelu', metadata={'help': 'The activation layer of the adapter'})

    def __post_init__(self):
        # Imported lazily, as in the original code (presumably to avoid an import cycle with `.mapping`).
        from .mapping import SwiftTuners
        self.swift_type = SwiftTuners.ADAPTER


class Adapter(SwiftAdapter):
    """Tuner that wraps a method of the matched sub-modules and post-processes its output with an adapter."""

    @staticmethod
    def prepare_model(model: nn.Module, config: AdapterConfig, adapter_name: str) -> SwiftOutput:
        """Prepare a model with `AdapterConfig`

        For every sub-module whose key matches `config.target_modules`, the method named
        `config.method_name` is saved as `forward_origin_{adapter_name}` and replaced by a wrapper
        that feeds the selected hidden state through a new `AdapterModule` stored as
        `adapter_{adapter_name}` on that sub-module.

        Args:
            model: The model to patch in place.
            config: The adapter configuration.
            adapter_name: The name used to build the attribute names on the patched sub-modules.

        Returns:
            A `SwiftOutput` carrying the config and the state-dict / trainable callbacks.
        """
        # Snapshot the keys first: adapter sub-modules are added to the model while iterating.
        module_keys = [key for key, _ in model.named_modules()]

        for module_key in module_keys:
            if isinstance(config.target_modules, str):
                target_module_found = re.fullmatch(config.target_modules, module_key)
            else:
                target_module_found = any(module_key.endswith(target_key) for target_key in config.target_modules)

            if target_module_found:  # noqa
                module = model.get_submodule(module_key)

                origin_attr = f'forward_origin_{adapter_name}'
                if hasattr(module, origin_attr):
                    # Patching twice under the same name would store the wrapper itself as the
                    # "origin" method, so the wrapper would call itself until RecursionError.
                    logger.warning(f'Adapter `{adapter_name}` is already attached to {module_key}, '
                                   f'skip replacing `{config.method_name}` again.')
                    continue

                def _forward(self, *args, **kwargs):
                    # Run the original method, then adapt either the selected entry of a
                    # container output or the output tensor itself.
                    args = getattr(self, f'forward_origin_{adapter_name}')(*args, **kwargs)
                    if isinstance(args, (tuple, list, dict)):
                        if isinstance(config.hidden_pos, int):
                            # Containers may be immutable (tuple): edit a list copy, then rebuild the type.
                            _type = type(args)
                            args = list(args)
                            args[config.hidden_pos] = getattr(self, f'adapter_{adapter_name}')(args[config.hidden_pos])
                            args = _type(args)
                        else:
                            args[config.hidden_pos] = getattr(self, f'adapter_{adapter_name}')(args[config.hidden_pos])
                    elif isinstance(args, torch.Tensor):
                        args = getattr(self, f'adapter_{adapter_name}')(args)
                    return args

                def _feed_forward_chunk(self, attention_output):
                    return _forward(self, attention_output)

                setattr(module, origin_attr, getattr(module, config.method_name))
                num_args_in_forward_chunk_fn = len(inspect.signature(getattr(module, origin_attr)).parameters)
                if config.method_name == 'feed_forward_chunk' and num_args_in_forward_chunk_fn == 1:
                    # Keep the single-argument signature of the replaced `feed_forward_chunk`.
                    setattr(module, config.method_name, types.MethodType(_feed_forward_chunk, module))
                else:
                    setattr(module, config.method_name, types.MethodType(_forward, module))
                adapter_module = AdapterModule(config.dim, adapter_name, module_key, config.adapter_length,
                                               ACT2CLS[config.act_layer])
                setattr(module, f'adapter_{adapter_name}', adapter_module)
                logger.info(f'Adapter modules(module_key): {module_key}.adapter_{adapter_name}')

        def state_dict_callback(state_dict, adapter_name: str, **kwargs):
            # Keep only the entries that belong to this adapter.
            return {key: value for key, value in state_dict.items() if f'adapter_{adapter_name}' in key}

        def mark_trainable_callback(model):
            return

        return SwiftOutput(
            config=config, state_dict_callback=state_dict_callback, mark_trainable_callback=mark_trainable_callback)

    @staticmethod
    def activate_adapter(module: torch.nn.Module, adapter_name: str, activate: bool, offload: str = None):
        """Switch the adapter named `adapter_name` on or off for every matching sub-module of `module`.

        Args:
            module: The root module to search with `find_sub_module`.
            adapter_name: The adapter whose `adapter_{adapter_name}` sub-modules are toggled.
            activate: The activation flag passed to `set_activation`.
            offload: Forwarded unchanged to `SwiftAdapter.save_memory`.
        """
        modules = find_sub_module(module, f'adapter_{adapter_name}')
        for _module in modules:
            _module: ActivationMixin
            _module: nn.Module
            _module.set_activation(adapter_name, activate)
            SwiftAdapter.save_memory(_module, adapter_name, _module.module_key, activate, offload)


class AdapterModule(nn.Module, ActivationMixin):
    """The implementation of adapter tuning method.

    Adapters project input tokens by an MLP layer.
    'Parameter-Efficient Transfer Learning for NLP' by Houlsby et al.(2019)
    See http://arxiv.org/abs/1902.00751

    Args:
        dim: An integer indicating the embedding dimension.
        adapter_name: The adapter name checked by `is_activated` in `forward`.
        module_key: The key of the patched module, passed to the `ActivationMixin` initializer.
        adapter_length: An integer indicating the length of adapter tuning. It is passed straight
            to `nn.Linear`, so the `None` default must be overridden by the caller.
        act_layer: The activation class instantiated between the two linear layers.
    """

    def __init__(
        self,
        dim,
        adapter_name,
        module_key,
        adapter_length=None,
        act_layer=nn.GELU,
    ):
        super(AdapterModule, self).__init__()
        # Start the MRO lookup after `nn.Module`, i.e. initialize `ActivationMixin` explicitly.
        super(nn.Module, self).__init__(module_key)
        self.dim = dim
        self.adapter_name = adapter_name
        self.adapter_length = adapter_length
        self.linear1 = nn.Linear(dim, adapter_length)
        self.act = act_layer()
        self.linear2 = nn.Linear(adapter_length, dim)
        self.init_weights()
        self._prepared = False
        self.mark_all_sub_modules_as_plugin()

    def init_weights(self):
        """Initialize linear weights with Xavier-uniform and biases with a tiny normal noise."""

        def _init_weights(m):
            if isinstance(m, nn.Linear):
                nn.init.xavier_uniform_(m.weight)
                nn.init.normal_(m.bias, std=1e-6)

        self.apply(_init_weights)

    def forward(self, x, identity=None):
        """Return `identity + MLP(x)` in the dtype of `x`, or `x` unchanged when the adapter is inactive.

        Args:
            x: The hidden state to adapt.
            identity: The residual branch; defaults to `x` (after casting to the adapter dtype).
        """
        if not self.is_activated(self.adapter_name):
            return x
        if not self._prepared:
            # Move the adapter to the device of the first input it sees (done once).
            self.linear1.to(x.device)
            self.act.to(x.device)
            self.linear2.to(x.device)
            self._prepared = True

        x_dtype = x.dtype
        x = x.to(self.linear1.weight.dtype)
        out = self.linear2(self.act(self.linear1(x)))
        if identity is None:
            identity = x
        identity = identity.to(out.dtype)
        out = identity + out
        return out.to(x_dtype)
# Copyright (c) Alibaba, Inc. and its affiliates.
# Copyright 2023-present the HuggingFace Inc. team.
import os.path
from dataclasses import asdict, dataclass, field
from functools import partial, reduce
from types import MethodType
from typing import Dict, Optional

import json
import peft
import torch
import torch.nn
import transformers
from modelscope import snapshot_download
from peft import (AdaLoraConfig, BOFTConfig, BOFTModel, LoftQConfig, LoHaConfig, LoKrConfig, LoraModel, OFTConfig,
                  PeftConfig, PeftModel, PeftModelForCausalLM, PeftModelForSeq2SeqLM,
                  PeftModelForSequenceClassification, PeftModelForTokenClassification, PrefixTuningConfig,
                  PromptEncoderConfig, PromptLearningConfig, PromptTuningConfig, VeraConfig, VeraModel, get_peft_config,
                  get_peft_model, get_peft_model_state_dict)
from peft.config import PeftConfigMixin
from peft.tuners import lora
from peft.tuners.adalora import AdaLoraModel, RankAllocator
from peft.tuners.lora import Embedding
from transformers import Trainer

from swift.utils import get_logger

try:
    from peft import FourierFTModel
except ImportError:
    FourierFTModel = None

try:
    from peft import BoneModel
except ImportError:
    BoneModel = None

logger = get_logger()
dispatchers = []


@dataclass
class LoraConfig(peft.LoraConfig):
    """`peft.LoraConfig` extended with three extra fields that are stored in `additional_config.json`."""

    lora_dtype: Optional[str] = field(
        default=None, metadata={'help': 'The lora dtype, default None means following the original layer\'s dtype'})

    lorap_lr_ratio: Optional[float] = field(default=None, metadata={'help': 'The lr ratio of lora_B in lora+'})

    lorap_emb_lr: float = field(default=1e-6, metadata={'help': 'The lr for embedding in lora+'})

    def to_peft_config(self) -> peft.LoraConfig:
        """Return a plain `peft.LoraConfig` built from this config without the extra fields."""
        _dict = asdict(self)
        _dict.pop('lora_dtype')
        _dict.pop('lorap_lr_ratio')
        _dict.pop('lorap_emb_lr')
        return peft.LoraConfig(**_dict)

    def save_pretrained(self, save_directory: str, **kwargs) -> None:
        """Save the peft part via peft and the extra fields to `additional_config.json` in `save_directory`."""
        self.to_peft_config().save_pretrained(save_directory, **kwargs)
        additional_args = {
            'lora_dtype': self.lora_dtype,
            'lorap_lr_ratio': self.lorap_lr_ratio,
            'lorap_emb_lr': self.lorap_emb_lr,
        }
        with open(os.path.join(save_directory, 'additional_config.json'), 'w', encoding='utf-8') as f:
            json.dump(additional_args, f)

    @classmethod
    def from_pretrained(cls, pretrained_model_name_or_path: str, subfolder: Optional[str] = None, **kwargs):
        """Load a config and, when `additional_config.json` exists, set its entries on the result.

        Args:
            pretrained_model_name_or_path: The directory (or id) handed to the underlying peft loader.
            subfolder: Forwarded to the underlying loader.
                NOTE(review): `additional_config.json` is looked up without `subfolder` - confirm intended.

        Returns:
            The loaded config; an exact `peft.LoraConfig` is upgraded to `LoraConfig`.
        """
        if hasattr(PeftConfigMixin, 'from_pretrained_origin'):
            # `hot_patch_peft_module` stored the original loader under this name.
            self = PeftConfigMixin.from_pretrained_origin(pretrained_model_name_or_path, subfolder, **kwargs)
        else:
            self = super(LoraConfig, cls).from_pretrained(pretrained_model_name_or_path, subfolder, **kwargs)

        # Exact type check on purpose: subclasses (including this one) must not be rebuilt.
        if type(self) is peft.LoraConfig:
            self = LoraConfig(**self.to_dict())

        additional_config_path = os.path.join(pretrained_model_name_or_path, 'additional_config.json')
        if os.path.isfile(additional_config_path):
            with open(additional_config_path, 'r', encoding='utf-8') as f:
                _json = json.load(f)
                for key, value in _json.items():
                    setattr(self, key, value)

        return self


def _create_and_replace_hook(self, peft_config, adapter_name, target, *args, **kwargs):
    """Replacement for `_create_and_replace` that skips targets which should not be wrapped.

    Nothing is done (returns `None`) when `target` is `None`, when `target_modules` is a string and
    `target` is neither a "linear"-named class nor one of the supported layer types, or when
    `target` is a `NonDynamicallyQuantizableLinear`. Otherwise the original
    `_create_and_replace_origin` is called with the same arguments.
    """
    all_supported_names = ('linear', )
    all_supported_types = (torch.nn.Embedding, torch.nn.Conv2d, transformers.pytorch_utils.Conv1D, lora.Linear)
    target_modules = getattr(peft_config, 'target_modules', None)
    if target is None:
        return

    if isinstance(target_modules, str):
        target_class_name = target.__class__.__name__.lower()
        name_supported = any(name in target_class_name for name in all_supported_names)
        if not name_supported and not isinstance(target, all_supported_types):
            return

    if target.__class__.__name__ == 'NonDynamicallyQuantizableLinear':
        return

    return self._create_and_replace_origin(peft_config, adapter_name, target, *args, **kwargs)


def _convert_dtype(target: torch.nn.Module, adapter_name: str, lora_dtype: str):
    """Call `.to(torch.<lora_dtype>)` on the LoRA weights of `adapter_name` held by `target`.

    Args:
        target: A module that may own `lora_A`/`lora_B` and `lora_embedding_A`/`lora_embedding_B`.
        adapter_name: The adapter key inside those containers.
        lora_dtype: The attribute name of the dtype on `torch` (e.g. `float16`); `None` is a no-op.
    """
    if lora_dtype is not None:
        # Attribute lookup instead of `eval`: the value comes from a config file.
        torch_dtype = getattr(torch, lora_dtype)
        if hasattr(target, 'lora_A') and adapter_name in target.lora_A:
            target.lora_A[adapter_name].to(torch_dtype)
            target.lora_B[adapter_name].to(torch_dtype)
        if hasattr(target, 'lora_embedding_A') and adapter_name in target.lora_embedding_A:
            # NOTE(review): if these entries are plain parameters, `.to` returns a new tensor and
            # this is a no-op - verify against peft's LoraLayer.
            target.lora_embedding_A[adapter_name].to(torch_dtype)
            target.lora_embedding_B[adapter_name].to(torch_dtype)


def create_optimizer_param_groups(self: PeftModel, **defaults):
    """Build LoRA+ optimizer parameter groups for the active adapter.

    Args:
        **defaults: Must contain `lr`; `weight_decay` is optional and defaults to 0.0.

    Returns:
        `None` when the active adapter config is not a `LoraConfig` or has no `lorap_lr_ratio`;
        otherwise four groups in this order: groupA (base lr), embedding (`lorap_emb_lr`),
        groupB (lr * ratio) and groupB without weight decay (lr * ratio).
    """
    active_config = self.peft_config[self.active_adapter]
    if not isinstance(active_config, LoraConfig) or active_config.lorap_lr_ratio is None:
        return None

    def get_module(name):
        # Drop the trailing name parts to reach the module owning the parameter
        # (two parts for names containing 'lora', one otherwise).
        parent_idx = 2 if 'lora' in name else 1
        module_names = name.split(sep='.')[:-parent_idx]
        module = reduce(getattr, module_names, self.base_model)
        return module

    param_groups = {
        'groupA': {},
        'groupB': {},
        'groupB_no_decay': {},
        'embedding': {},
    }

    decay_parameters = Trainer.get_decay_parameter_names(None, self.base_model)
    for name, param in self.base_model.named_parameters():
        if not param.requires_grad:
            continue

        module = get_module(name)
        if isinstance(module, Embedding):
            param_groups['embedding'][name] = param
        elif 'lora_B' in name or param.ndim == 1:
            if name in decay_parameters:
                param_groups['groupB'][name] = param
            else:
                param_groups['groupB_no_decay'][name] = param
        else:
            param_groups['groupA'][name] = param

    lr = defaults['lr']
    weight_decay = defaults.get('weight_decay', 0.0)

    param_groups = [
        {
            'params': list(param_groups['groupA'].values()),
            'weight_decay': weight_decay,
            'lr': lr,
        },
        {
            'params': list(param_groups['embedding'].values()),
            'weight_decay': weight_decay,
            'lr': active_config.lorap_emb_lr,
        },
        {
            'params': list(param_groups['groupB'].values()),
            'weight_decay': weight_decay,
            'lr': lr * active_config.lorap_lr_ratio,
        },
        {
            'params': list(param_groups['groupB_no_decay'].values()),
            'weight_decay': 0.0,
            'lr': lr * active_config.lorap_lr_ratio,
        },
    ]
    return param_groups


def adalora_forward(self, *args, **kwargs):
    """Forward pass that adds the orthogonal regularization term to `outputs.loss`.

    The running regularization loss is moved to the device of each parameter covariance and
    finally to the device of the loss, so parameters on different devices can be combined.

    Raises:
        ValueError: If `orth_reg_weight` of the trainable adapter is not positive.
    """
    from peft.utils.integrations import gather_params_ctx
    outputs = self.model.forward(*args, **kwargs)

    if (getattr(outputs, 'loss', None) is not None) and isinstance(outputs.loss, torch.Tensor):
        # Calculate the orthogonal regularization
        orth_reg_weight = self.peft_config[self.trainable_adapter_name].orth_reg_weight

        if orth_reg_weight <= 0:
            raise ValueError('orth_reg_weight should be greater than 0. ')

        regu_loss = 0
        num_param = 0
        for n, p in self.model.named_parameters():
            if ('lora_A' in n or 'lora_B' in n) and self.trainable_adapter_name in n:
                if p.shape == torch.Size([0]):
                    # An empty shape here means the parameter has to be gathered before use.
                    with gather_params_ctx(p, fwd_module=self):
                        para_cov = p @ p.T if 'lora_A' in n else p.T @ p
                else:
                    para_cov = p @ p.T if 'lora_A' in n else p.T @ p
                I = torch.eye(*para_cov.size(), out=torch.empty_like(para_cov))  # noqa: E741
                I.requires_grad = False
                num_param += 1
                if isinstance(regu_loss, torch.Tensor):
                    regu_loss = regu_loss.to(para_cov.device)
                regu_loss += torch.norm(para_cov - I, p='fro')
        if num_param > 0:
            regu_loss = regu_loss / num_param
        else:
            regu_loss = 0
        if isinstance(regu_loss, torch.Tensor) and isinstance(outputs.loss, torch.Tensor):
            regu_loss = regu_loss.to(outputs.loss.device)
        outputs.loss += orth_reg_weight * regu_loss
    return outputs


def adalora_mask_to_budget(self, model, budget):
    """Mask the least important `lora_E` entries so that only `budget` of them stay non-zero.

    Args:
        model: The model whose `lora_A`/`lora_B`/`lora_E` parameters of `self.adapter_name` are scored.
        budget: The number of entries to keep; `self.init_bgt - budget` is the rank of the threshold.

    Returns:
        A dict mapping each `lora_E` parameter name to a list of booleans (True = kept).
    """
    value_ipt = {}
    vector_ipt = {}
    triplet_ipt = {}
    # Get the importance score for A, E, B
    for n, p in model.named_parameters():
        if f'lora_A.{self.adapter_name}' in n:
            entry_ipt = self._element_score(n)
            comb_ipt = torch.mean(entry_ipt, dim=1, keepdim=True)
            name_m = n.replace('lora_A', '%s')
            if name_m not in vector_ipt:
                vector_ipt[name_m] = [comb_ipt]
            else:
                vector_ipt[name_m].append(comb_ipt)
        if f'lora_B.{self.adapter_name}' in n:
            entry_ipt = self._element_score(n)
            comb_ipt = torch.mean(entry_ipt, dim=0, keepdim=False).view(-1, 1)
            name_m = n.replace('lora_B', '%s')
            if name_m not in vector_ipt:
                vector_ipt[name_m] = [comb_ipt]
            else:
                vector_ipt[name_m].append(comb_ipt)
        if f'lora_E.{self.adapter_name}' in n:
            entry_ipt = self._element_score(n)
            name_m = n.replace('lora_E', '%s')
            value_ipt[name_m] = entry_ipt

    all_score = []
    # Calculate the score for each triplet
    for name_m in vector_ipt:
        ipt_E = value_ipt[name_m]
        ipt_AB = torch.cat(vector_ipt[name_m], dim=1)
        sum_ipt = self._combine_ipt(ipt_E, ipt_AB)
        name_E = name_m % 'lora_E'
        triplet_ipt[name_E] = sum_ipt.view(-1, 1)
        sum_ipt = sum_ipt.view(-1)
        if all_score:
            # `torch.cat` below needs every score on one device: follow the first one.
            sum_ipt = sum_ipt.to(all_score[0].device)
        all_score.append(sum_ipt)

    # Get the threshold by ranking ipt
    mask_threshold = torch.kthvalue(
        torch.cat(all_score),
        k=self.init_bgt - budget,
    )[0].item()

    rank_pattern = {}
    # Mask the unimportant triplets
    with torch.no_grad():
        for n, p in model.named_parameters():
            if f'lora_E.{self.adapter_name}' in n:
                p.masked_fill_(triplet_ipt[n] <= mask_threshold, 0.0)
                rank_pattern[n] = (~(triplet_ipt[n] <= mask_threshold)).view(-1).tolist()
    return rank_pattern


def keep_device_forward(self, *args, **kwargs):
    """Call `forward_origin`, first moving the first positional input to the device of `self.weight`."""
    x = args[0]
    if self.weight.device != x.device:
        return self.forward_origin(x.to(self.weight.device), *args[1:], **kwargs)
    else:
        return self.forward_origin(*args, **kwargs)


def hot_patch_peft_module():
    """Monkey-patch peft classes in place; a second call is a no-op.

    Patches applied: `_create_and_replace` hooks on the tuner models, dtype conversion and device
    alignment in `LoraModel.__init__`, LoRA+ parameter groups on `PeftModel`, config loading through
    `LoraConfig.from_pretrained`, SwiftModel-compatible method names, and the AdaLoRA forward /
    `mask_to_budget` replacements.
    """
    from peft.tuners.lora import LoraLayer
    # Check the class, not the string 'LoraModel': patching twice would make the "origin"
    # attributes point at the hooks themselves.
    if hasattr(LoraModel, '_create_and_replace_origin'):
        return

    # Fix Lora does not support NonDynamicallyQuantizableLinear
    LoraModel._create_and_replace_origin = LoraModel._create_and_replace
    LoraModel._create_and_replace = _create_and_replace_hook
    AdaLoraModel._create_and_replace_origin = AdaLoraModel._create_and_replace
    AdaLoraModel._create_and_replace = _create_and_replace_hook
    VeraModel._create_and_replace_origin = VeraModel._create_and_replace
    VeraModel._create_and_replace = _create_and_replace_hook
    BOFTModel._create_and_replace_origin = BOFTModel._create_and_replace
    BOFTModel._create_and_replace = _create_and_replace_hook
    if FourierFTModel is not None:
        FourierFTModel._create_and_replace_origin = FourierFTModel._create_and_replace
        FourierFTModel._create_and_replace = _create_and_replace_hook
    if BoneModel is not None:
        BoneModel._create_and_replace_origin = BoneModel._create_and_replace
        BoneModel._create_and_replace = _create_and_replace_hook

    # Support type conversion
    def __new_init__(self, model: torch.nn.Module, config: Dict[str, LoraConfig], adapter_name: str):

        self.__init_origin__(model, config, adapter_name)
        active_adapters = self.active_adapter
        if isinstance(active_adapters, str):
            active_adapters = [active_adapters]
        for active_adapter in active_adapters:
            active_config = config[active_adapter] if isinstance(config, dict) else config
            if hasattr(active_config, 'lora_dtype'):
                for name, module in model.named_modules():
                    if isinstance(module, LoraLayer):
                        _convert_dtype(module, active_adapter, active_config.lora_dtype)
                        # Wrap each LoRA sub-layer once so inputs follow the layer's device.
                        for lora_layer in list(module.lora_A.values()) + list(module.lora_B.values()):
                            if not hasattr(lora_layer, 'forward_origin'):
                                lora_layer.forward_origin = lora_layer.forward
                                lora_layer.forward = MethodType(keep_device_forward, lora_layer)

    LoraModel.__init_origin__ = LoraModel.__init__
    LoraModel.__init__ = __new_init__

    # Support LoRA+
    PeftModel.create_optimizer_param_groups = create_optimizer_param_groups

    PeftConfigMixin.from_pretrained_origin = PeftConfigMixin.from_pretrained
    PeftConfigMixin.from_pretrained = LoraConfig.from_pretrained

    # Compatible with SwiftModel
    def dummy_function(*args, **kwargs):
        logger.warning(f'The function {kwargs["func"]} has no effects, consider using other functions.')

    PeftModel.activate_adapter = PeftModel.set_adapter
    PeftModel.deactivate_adapter = partial(dummy_function, func='deactivate_adapter')
    PeftModel.set_active_adapters = partial(dummy_function, func='set_active_adapters')

    # Fix adalora does not support device_map
    AdaLoraModel.forward = adalora_forward
    RankAllocator.mask_to_budget = adalora_mask_to_budget


def get_wrapped_class(module_class):
    """Get a custom wrapper class for peft classes to download the models from the ModelScope hub

    Args:
        module_class: The actual module class

    Returns:
        The wrapper
    """

    class PeftWrapper(module_class):

        @classmethod
        def from_pretrained(cls, model, model_id, *args, revision: Optional[str] = None, **kwargs):
            # A non-existing local path is treated as a hub id and downloaded first;
            # `revision` is consumed here and not forwarded to peft.
            if not os.path.exists(model_id):
                model_id = snapshot_download(model_id, revision=revision)
            return module_class.from_pretrained(model, model_id, *args, **kwargs)

    PeftWrapper.__name__ = module_class.__name__
    PeftWrapper.__qualname__ = module_class.__qualname__
    return PeftWrapper


def wrap_module(module):
    """Return the ModelScope-aware wrapper of `module`, or `module` itself if it has no `from_pretrained`."""
    if not hasattr(module, 'from_pretrained'):
        return module

    return get_wrapped_class(module)


hot_patch_peft_module()
PeftModel = wrap_module(PeftModel)
PeftConfig = wrap_module(PeftConfig)
PeftModelForSeq2SeqLM = wrap_module(PeftModelForSeq2SeqLM)
PeftModelForSequenceClassification = wrap_module(PeftModelForSequenceClassification)
PeftModelForTokenClassification = wrap_module(PeftModelForTokenClassification)
PeftModelForCausalLM = wrap_module(PeftModelForCausalLM)
PromptEncoderConfig = wrap_module(PromptEncoderConfig)
PromptTuningConfig = wrap_module(PromptTuningConfig)
PrefixTuningConfig = wrap_module(PrefixTuningConfig)
PromptLearningConfig = wrap_module(PromptLearningConfig)
LoraConfig = wrap_module(LoraConfig)
AdaLoraConfig = wrap_module(AdaLoraConfig)
LoHaConfig = wrap_module(LoHaConfig)
LoKrConfig = wrap_module(LoKrConfig)
LoftQConfig = wrap_module(LoftQConfig)
# Wrapped exactly once: a second wrap only stacks another identical wrapper on top.
OFTConfig = wrap_module(OFTConfig)
BOFTConfig = wrap_module(BOFTConfig)
VeraConfig = wrap_module(VeraConfig)
get_peft_config = get_peft_config
get_peft_model_state_dict = get_peft_model_state_dict
get_peft_model = get_peft_model
import math

import torch
import torch.nn as nn

from swift.utils.logger import get_logger

logger = get_logger()


def detach_tensors(feats):
    """Recursively detach the tensors found in `feats`.

    Lists and tuples come back as lists and dicts as dicts, with every element processed
    recursively. `None` and objects without a `detach` method are returned unchanged instead of
    raising `AttributeError`.
    """
    if feats is None:
        return None
    if isinstance(feats, (list, tuple)):
        return [detach_tensors(feat) for feat in feats]
    if isinstance(feats, dict):
        return {key: detach_tensors(val) for key, val in feats.items()}
    if isinstance(feats, torch.Tensor) or hasattr(feats, 'detach'):
        return feats.detach()
    return feats


def probe_tensors(module, feats, name):
    """Store a detached copy of `feats` on `module` under the attribute `name`."""
    feats = detach_tensors(feats)
    setattr(module, name, feats)


def probe_input_pre_hook(self, args):
    """Forward pre-hook: record the first positional input as `probe_input_data`; `args` is returned as is."""
    first_input = args[0]
    probe_tensors(self, first_input, 'probe_input_data')
    return args


def probe_output_hook(self, args, result):
    """Forward hook: record the module output as `probe_output_data` and return it unchanged."""
    output = result
    probe_tensors(self, output, 'probe_output_data')
    return output


def choose_weight_type(weight_type, dim):
    """Create the scaling object for the given `weight_type`.

    Args:
        weight_type: 'gate' (a `dim -> 1` linear layer), 'scale' (one learnable scalar),
            'scale_channel' (`dim` learnable scalars), 'scalar_<value>' (a fixed float),
            anything else (including `None`) gives `None`.
        dim: The channel dimension used by 'gate' and 'scale_channel'.
    """
    if weight_type == 'gate':
        scaling = nn.Linear(dim, 1)
    elif weight_type == 'scale':
        scaling = nn.Parameter(torch.ones(1))
    elif weight_type == 'scale_channel':
        scaling = nn.Parameter(torch.ones(dim))
    elif weight_type and weight_type.startswith('scalar'):
        scaling = float(weight_type.split('_')[-1])
    else:
        scaling = None
    return scaling


def get_weight_value(weight_type, scaling, x):
    """Return the multiplier to apply to `x` for the given `weight_type`.

    For 'gate', `scaling` is applied to `x`, passed through a sigmoid, averaged over dim 1 and
    reshaped to `(-1, 1, 1)`. For 'scale', 'scale_channel' and 'scalar*', `scaling` is returned as
    is. Any other value (including `None`) gives `None`.
    """
    if weight_type == 'gate':
        return torch.mean(torch.sigmoid(scaling(x)), dim=1).view(-1, 1, 1)
    # Guard against None like `choose_weight_type` does, instead of failing on `.startswith`.
    if weight_type in ['scale', 'scale_channel'] or (weight_type and weight_type.startswith('scalar')):
        return scaling
    return None


class SCEAdapter(nn.Module):
    """Bottleneck adapter: `ln1 -> activation -> ln2`, optionally scaled and added to a shortcut.

    Args:
        dim: The channel dimension of the input and output.
        adapter_length: The width of the bottleneck.
        adapter_type: Stored on the instance; not used by the code in this class.
        adapter_weight: The weight type handed to `choose_weight_type` / `get_weight_value`.
        act_layer: The activation class instantiated between the two linear layers.
        zero_init_last: Zero-initialize `ln2` when True, otherwise use Kaiming-uniform.
        use_bias: Whether the two linear layers have a bias.
    """

    def __init__(self,
                 dim,
                 adapter_length,
                 adapter_type=None,
                 adapter_weight=None,
                 act_layer=nn.GELU,
                 zero_init_last=True,
                 use_bias=True):
        super(SCEAdapter, self).__init__()
        self.dim = dim
        self.adapter_length = adapter_length
        self.adapter_type = adapter_type
        self.adapter_weight = adapter_weight
        self.zero_init_last = zero_init_last
        self.ln1 = nn.Linear(dim, adapter_length, bias=use_bias)
        self.activate = act_layer()
        self.ln2 = nn.Linear(adapter_length, dim, bias=use_bias)
        self.init_weights()
        self.init_scaling()

    def _zero_init_weights(self, m):
        if isinstance(m, nn.Linear):
            nn.init.zeros_(m.weight)
            # With `use_bias=False` the layer has no bias tensor to initialize.
            if m.bias is not None:
                nn.init.zeros_(m.bias)

    def _kaiming_init_weights(self, m):
        if isinstance(m, nn.Linear):
            nn.init.kaiming_uniform_(m.weight, a=math.sqrt(5))

    def init_weights(self):
        """Initialize `ln1` with Kaiming-uniform and `ln2` according to `zero_init_last`."""
        self._kaiming_init_weights(self.ln1)
        if self.zero_init_last:
            self._zero_init_weights(self.ln2)
        else:
            self._kaiming_init_weights(self.ln2)

    def init_scaling(self):
        """Create `self.scaling` from `adapter_weight`, or set it to `None` when no weight type is given."""
        if self.adapter_weight:
            self.scaling = choose_weight_type(self.adapter_weight, self.dim)
        else:
            self.scaling = None

    def forward(self, x, x_shortcut=None, use_shortcut=True, **kwargs):
        """Apply the adapter to `x`.

        Args:
            x: The input; a 4-dim input is unpacked as `(b, d, h, w)`, flattened to
                `(b, h * w, d)` for the linear layers and restored afterwards.
            x_shortcut: The residual branch, defaults to the original `x`.
            use_shortcut: Whether to add `x_shortcut` to the adapter output.
            **kwargs: Accepted and ignored.
        """
        if x_shortcut is None:
            x_shortcut = x
        x_shape = x.shape
        is_4d = len(x_shape) == 4
        if is_4d:
            b, d, h, w = x_shape
            x = x.permute(0, 2, 3, 1).reshape(b, h * w, d)
        out = self.ln2(self.activate(self.ln1(x)))
        if self.adapter_weight:
            scaling = get_weight_value(self.adapter_weight, self.scaling, out)
            out = out * scaling if scaling is not None else out
        if is_4d:
            out = out.reshape(b, h, w, -1).permute(0, 3, 1, 2).contiguous()
        if use_shortcut:
            out = x_shortcut + out
        return out
import copy
import re
import types
from collections import OrderedDict
from dataclasses import dataclass, field
from functools import partial
from itertools import repeat
from typing import Union

import torch
from torch import nn

from swift.utils.logger import get_logger
from swift.utils.torch_utils import find_sub_module
from .utils import ActivationMixin, SwiftAdapter, SwiftConfig, SwiftOutput

logger = get_logger()


@dataclass
class SideConfig(SwiftConfig):
    """
    The configuration class for the side module.

    Side-Tuning only needs to train one side network and
    weights the output of pre-trained model and side network.
    'Side-Tuning: A Baseline for Network Adaptation via Additive Side Networks'
    by Zhang et al.(2019)
    See https://arxiv.org/abs/1912.13503

    Args:
        target_modules: The feedforward module to be replaced, in regex format
    """

    dim: int = field(default=None, metadata={'help': 'The dimension of the hidden states'})

    target_modules: str = field(
        default=None, metadata={'help': 'The target module to be replaced, in full match format'})

    side_module_name: str = field(default='fcn4', metadata={'help': 'The name of the additive side networks'})

    source_hidden_pos: Union[str, int] = field(
        default=0,
        metadata={
            'help': 'The position of the hidden state input to the target module, can be int (args) or str (kwargs)'
        })

    target_hidden_pos: Union[str, int] = field(
        default=0,
        metadata={
            'help': 'The position of the hidden state output from the target module, can be int (args) or str (kwargs)'
        })

    def __post_init__(self):
        from .mapping import SwiftTuners
        self.swift_type = SwiftTuners.SIDE


class Side(SwiftAdapter):
    """Tuner that attaches a ``SideModule`` to every module matching ``config.target_modules``."""

    @staticmethod
    def prepare_model(model: nn.Module, config: SideConfig, adapter_name: str) -> SwiftOutput:
        """Prepare a model with `SideConfig`

        Every module whose name fully matches ``config.target_modules`` gets:
        its original forward saved as ``forward_origin_{adapter_name}``, a new
        ``side_{adapter_name}`` sub-module, and a replacement ``forward`` that
        blends the original output with the side network output.

        Raises:
            Exception: If a matched module is an ``nn.ModuleList`` or ``nn.ModuleDict``.
        """
        module_keys = [key for key, _ in model.named_modules()]

        for module_key in module_keys:
            if re.fullmatch(config.target_modules, module_key):  # noqa
                tgt_module = model.get_submodule(module_key)
                logger.info(f'Matching target module [{module_key}] of type {type(tgt_module)}')
                if isinstance(tgt_module, (nn.ModuleList, nn.ModuleDict)):
                    raise Exception(
                        f'Type of {type(tgt_module)} may not be supported because of its customized forward')

                def _forward(self, *args, **kwargs):
                    args_main = getattr(self, f'forward_origin_{adapter_name}')(*args, **kwargs)

                    if isinstance(config.source_hidden_pos, int):
                        x = args[config.source_hidden_pos]
                    else:
                        x = kwargs[config.source_hidden_pos]

                    is_container = isinstance(args_main, (tuple, list, dict))
                    x_main = args_main[config.target_hidden_pos] if is_container else args_main
                    out = getattr(self, f'side_{adapter_name}')(x, x_main)
                    if isinstance(args_main, tuple):
                        # Tuples do not support item assignment: rebuild with the slot replaced.
                        items = list(args_main)
                        items[config.target_hidden_pos] = out
                        args_main = tuple(items)
                    elif is_container:
                        args_main[config.target_hidden_pos] = out
                    else:
                        args_main = out
                    return args_main

                if isinstance(tgt_module, nn.Sequential) and not hasattr(tgt_module, 'tgt_module_keys'):
                    # Remember the children present before the side module is attached,
                    # so the original forward can skip anything added afterwards.
                    tgt_module.tgt_module_keys = copy.deepcopy(list(tgt_module._modules.keys()))

                    def forward_seq(self, input, *args, **kwargs):
                        # Read the key list from ``self``: the enclosing loop variable is
                        # rebound on later iterations and would point at another module.
                        for idx, module in enumerate(self):
                            if idx >= len(self.tgt_module_keys):
                                continue
                            input = module(input)
                        return input

                    setattr(tgt_module, f'forward_origin_{adapter_name}', types.MethodType(forward_seq, tgt_module))
                else:
                    setattr(tgt_module, f'forward_origin_{adapter_name}', tgt_module.forward)
                tgt_module.forward = types.MethodType(_forward, tgt_module)
                side_module = SideModule(config.dim, adapter_name, module_key, config.side_module_name)
                setattr(tgt_module, f'side_{adapter_name}', side_module)
                logger.info(f'Side modules(module_key): {module_key}.side_{adapter_name}')

        def state_dict_callback(state_dict, adapter_name, **kwargs):
            # Keep only the parameters that belong to this adapter's side modules.
            return {key: value for key, value in state_dict.items() if f'side_{adapter_name}' in key}

        def mark_trainable_callback(model):
            return

        return SwiftOutput(
            config=config, state_dict_callback=state_dict_callback, mark_trainable_callback=mark_trainable_callback)

    @staticmethod
    def activate_adapter(module: torch.nn.Module, adapter_name: str, activate: bool, offload: str = None):
        """Switch every ``side_{adapter_name}`` sub-module of ``module`` on or off."""
        modules = find_sub_module(module, f'side_{adapter_name}')
        for _module in modules:
            _module: ActivationMixin
            _module: nn.Module
            _module.set_activation(adapter_name, activate)
            SwiftAdapter.save_memory(_module, adapter_name, _module.module_key, activate, offload)


class SideModule(nn.Module, ActivationMixin):
    """The implementation of vision side-tuning method.

    Side-Tuning only needs to train one side network and
    weights the output of pre-trained model and side network.
    'Side-Tuning: A Baseline for Network Adaptation via Additive Side Networks'
    by Zhang et al.(2019)
    See https://arxiv.org/abs/1912.13503

    Args:
        side_module_name: The name of the additive side networks.
    """

    def __init__(self, dim, adapter_name, module_key, side_module_name='fcn4'):
        super(SideModule, self).__init__()
        # Runs the next initialiser after nn.Module in the MRO with ``module_key``
        # (presumably ActivationMixin's -- confirm against .utils).
        super(nn.Module, self).__init__(module_key)
        self.adapter_name = adapter_name

        side_module_name = side_module_name.lower()
        if side_module_name == 'fcn4':
            self.side_net = FCN4(out_dims=dim)
        elif side_module_name == 'mlp':
            self.side_net = Mlp(dim)
        elif side_module_name == 'alexnet':
            import torchvision
            mm = torchvision.models.alexnet(pretrained=True)
            self.side_net = nn.Sequential(
                OrderedDict([('features', mm.features), ('avgpool', mm.avgpool), ('flatten', nn.Flatten()),
                             ('fc', nn.Linear(9216, dim, bias=False))]))
        else:
            raise ValueError(f'Unsupported side_module_name: {side_module_name}')
        self.alpha = nn.Parameter(torch.tensor(0.0))
        self.mark_all_sub_modules_as_plugin()

    def forward(self, x, x_main):
        """Blend ``x_main`` with ``side_net(x)`` using ``sigmoid(alpha)`` as the mixing weight.

        Returns ``x_main`` untouched when the adapter is not activated.
        """
        if not self.is_activated(self.adapter_name):
            return x_main
        alpha_squashed = torch.sigmoid(self.alpha)
        x_side = self.side_net(x)
        x_out = alpha_squashed * x_main + (1 - alpha_squashed) * x_side
        return x_out


class FCN4(nn.Module):
    """The implementation of simple FCN4 network for side network.

    Four Conv2d + GroupNorm + ReLU stages (3 input channels, 64 output channels),
    global average pooling, and an optional linear head when ``out_dims > 0``.
    """

    def __init__(self, out_dims=-1, **kwargs):
        super(FCN4, self).__init__(**kwargs)

        self.conv1 = nn.Sequential(
            nn.Conv2d(3, 16, kernel_size=3, stride=1, padding=1, bias=False, dilation=1), nn.GroupNorm(2, 16),
            nn.ReLU())
        self.conv2 = nn.Sequential(
            nn.Conv2d(16, 16, kernel_size=3, stride=2, padding=0, bias=False, dilation=1), nn.GroupNorm(2, 16),
            nn.ReLU())
        self.conv3 = nn.Sequential(
            nn.Conv2d(16, 32, kernel_size=3, stride=2, padding=0, bias=False, dilation=1), nn.GroupNorm(2, 32),
            nn.ReLU())
        self.conv4 = nn.Sequential(
            nn.Conv2d(32, 64, kernel_size=3, stride=1, padding=0, bias=False, dilation=1), nn.GroupNorm(2, 64),
            nn.ReLU())
        self.pool = nn.AdaptiveAvgPool2d((1, 1))
        if out_dims > 0:
            self.fc = nn.Linear(64, out_dims)
        else:
            self.fc = None

    def forward(self, x):
        x = self.conv1(x)
        x = self.conv2(x)
        x = self.conv3(x)
        x = self.conv4(x)
        x = self.pool(x)
        # Flatten everything after the batch dimension before the optional head.
        x = x.view(x.size(0), -1)
        if self.fc is not None:
            x = self.fc(x)
        return x


class Mlp(nn.Module):
    """ MLP as used in Vision Transformer.

    fc1 -> activation -> dropout -> optional norm -> fc2 -> dropout. With
    ``use_conv=True`` the two projections are 1x1 ``nn.Conv2d`` layers instead
    of ``nn.Linear``.
    """

    def __init__(
        self,
        in_features,
        hidden_features=None,
        out_features=None,
        act_layer=nn.GELU,
        norm_layer=None,
        bias=True,
        drop=0.,
        use_conv=False,
    ):
        super().__init__()
        out_features = out_features or in_features
        hidden_features = hidden_features or in_features
        # The same bias flag and dropout probability are used for both layers.
        bias = tuple(repeat(bias, 2))
        drop_probs = tuple(repeat(drop, 2))
        linear_layer = partial(nn.Conv2d, kernel_size=1) if use_conv else nn.Linear

        self.fc1 = linear_layer(in_features, hidden_features, bias=bias[0])
        self.act = act_layer()
        self.drop1 = nn.Dropout(drop_probs[0])
        self.norm = norm_layer(hidden_features) if norm_layer is not None else nn.Identity()
        self.fc2 = linear_layer(hidden_features, out_features, bias=bias[1])
        self.drop2 = nn.Dropout(drop_probs[1])

    def forward(self, x):
        x = self.fc1(x)
        x = self.act(x)
        x = self.drop1(x)
        x = self.norm(x)
        x = self.fc2(x)
        x = self.drop2(x)
        return x


# diff --git a/ms-swift/swift/ui/app.py b/ms-swift/swift/ui/app.py
# new file mode 100644
# index 0000000000000000000000000000000000000000..81df06f4ff32cf6e7af990980b6fd1f4a73373cb
# --- /dev/null
# +++ b/ms-swift/swift/ui/app.py
# @@ -0,0 +1,92 @@
# Copyright (c) Alibaba, Inc. and its affiliates.
+import os +from functools import partial +from typing import List, Union + +import gradio as gr +from packaging import version +from transformers.utils import strtobool + +import swift +from swift.llm import DeployArguments, EvalArguments, ExportArguments, RLHFArguments, SwiftPipeline, WebUIArguments +from swift.ui.llm_eval.llm_eval import LLMEval +from swift.ui.llm_export.llm_export import LLMExport +from swift.ui.llm_infer.llm_infer import LLMInfer +from swift.ui.llm_train.llm_train import LLMTrain + +locale_dict = { + 'title': { + 'zh': '🚀SWIFT: 轻量级大模型训练推理框架', + 'en': '🚀SWIFT: Scalable lightWeight Infrastructure for Fine-Tuning and Inference' + }, + 'sub_title': { + 'zh': + '请查看 ' + 'SWIFT 文档来查看更多功能,使用SWIFT_UI_LANG=en环境变量来切换英文界面', + 'en': + 'Please check ' + 'SWIFT Documentation for more usages, Use SWIFT_UI_LANG=zh variable to switch to Chinese UI', + }, + 'star_beggar': { + 'zh': + '喜欢SWIFT就动动手指给我们加个star吧🥺 ', + 'en': + 'If you like SWIFT, ' + 'please take a few seconds to star us🥺 ' + }, +} + + +class SwiftWebUI(SwiftPipeline): + + args_class = WebUIArguments + args: args_class + + def run(self): + lang = os.environ.get('SWIFT_UI_LANG') or self.args.lang + share_env = os.environ.get('WEBUI_SHARE') + share = strtobool(share_env) if share_env else self.args.share + server = os.environ.get('WEBUI_SERVER') or self.args.server_name + port_env = os.environ.get('WEBUI_PORT') + port = int(port_env) if port_env else self.args.server_port + LLMTrain.set_lang(lang) + LLMInfer.set_lang(lang) + LLMExport.set_lang(lang) + LLMEval.set_lang(lang) + with gr.Blocks(title='SWIFT WebUI', theme=gr.themes.Base()) as app: + try: + _version = swift.__version__ + except AttributeError: + _version = '' + gr.HTML(f"

{locale_dict['title'][lang]}({_version})

") + gr.HTML(f"

{locale_dict['sub_title'][lang]}

") + with gr.Tabs(): + LLMTrain.build_ui(LLMTrain) + LLMInfer.build_ui(LLMInfer) + LLMExport.build_ui(LLMExport) + LLMEval.build_ui(LLMEval) + + concurrent = {} + if version.parse(gr.__version__) < version.parse('4.0.0'): + concurrent = {'concurrency_count': 5} + app.load( + partial(LLMTrain.update_input_model, arg_cls=RLHFArguments), + inputs=[LLMTrain.element('model')], + outputs=[LLMTrain.element('train_record')] + list(LLMTrain.valid_elements().values())) + app.load( + partial(LLMInfer.update_input_model, arg_cls=DeployArguments, has_record=False), + inputs=[LLMInfer.element('model')], + outputs=list(LLMInfer.valid_elements().values())) + app.load( + partial(LLMExport.update_input_model, arg_cls=ExportArguments, has_record=False), + inputs=[LLMExport.element('model')], + outputs=list(LLMExport.valid_elements().values())) + app.load( + partial(LLMEval.update_input_model, arg_cls=EvalArguments, has_record=False), + inputs=[LLMEval.element('model')], + outputs=list(LLMEval.valid_elements().values())) + app.queue(**concurrent).launch(server_name=server, inbrowser=True, server_port=port, height=800, share=share) + + +def webui_main(args: Union[List[str], WebUIArguments, None] = None): + return SwiftWebUI(args).main() diff --git a/ms-swift/swift/ui/base.py b/ms-swift/swift/ui/base.py new file mode 100644 index 0000000000000000000000000000000000000000..6ca62a6fef2859964292f15e1bd4ac4fda029bbb --- /dev/null +++ b/ms-swift/swift/ui/base.py @@ -0,0 +1,388 @@ +# Copyright (c) Alibaba, Inc. and its affiliates. 
import dataclasses
import os
import sys
import time
import typing
from collections import OrderedDict
from dataclasses import fields
from datetime import datetime
from functools import wraps
from typing import Any, Dict, List, Type

import gradio as gr
import json
from gradio import Accordion, Audio, Button, Checkbox, Dropdown, File, Image, Slider, Tab, TabItem, Textbox, Video
from modelscope.hub.utils.utils import get_cache_dir

from swift.llm import TEMPLATE_MAPPING, BaseArguments, get_matched_model_meta

# Languages the UI can be rendered in; the first entry is the default.
all_langs = ['zh', 'en']
# UI class currently being built (set and restored by BaseUI.build_ui).
builder: Type['BaseUI'] = None
# Top-level tab that owns the UI being built; source of choices, defaults and argument names.
base_builder: Type['BaseUI'] = None


def update_data(fn):
    """Wrap a gradio component ``__init__`` so its kwargs are filled in from the active builder.

    The wrapper looks up the component's ``elem_id`` and injects choices, default
    value, localized info/value/label and visibility before calling ``fn``, then
    registers the component in ``builder.element_dict``.

    Args:
        fn: The original component ``__init__``.

    Returns:
        The wrapping function, to be assigned back as the component's ``__init__``.
    """

    @wraps(fn)
    def wrapper(*args, **kwargs):
        elem_id = kwargs.get('elem_id', None)
        self = args[0]

        if builder is not None:
            choices = base_builder.choice(elem_id)
            if choices:
                # Choices are passed to gradio as strings; None entries are kept as None.
                choices = [str(choice) if choice is not None else None for choice in choices]
                kwargs['choices'] = choices

        # Components are interactive unless the caller said otherwise; containers are skipped.
        if not isinstance(self, (Tab, TabItem, Accordion)) and 'interactive' not in kwargs:  # noqa
            kwargs['interactive'] = True

        # 'is_list' is removed from kwargs and kept on the instance instead of being passed to fn.
        if 'is_list' in kwargs:
            self.is_list = kwargs.pop('is_list')

        # Fall back to the registered default only when the caller gave no (truthy) value.
        if base_builder and base_builder.default(elem_id) is not None and not kwargs.get('value'):
            kwargs['value'] = base_builder.default(elem_id)

        if builder is not None:
            if elem_id in builder.locales(builder.lang):
                values = builder.locale(elem_id, builder.lang)
                # Localized entries override whatever was set above or passed by the caller.
                if 'info' in values:
                    kwargs['info'] = values['info']
                if 'value' in values:
                    kwargs['value'] = values['value']
                if 'label' in values:
                    kwargs['label'] = values['label']
                if hasattr(builder, 'visible'):
                    kwargs['visible'] = builder.visible
            argument = base_builder.argument(elem_id)
            # Append the argument name registered for this element to the label.
            if argument and 'label' in kwargs:
                kwargs['label'] = kwargs['label'] + f'({argument})'

        # NOTE(review): this replaces any 'elem_classes' the caller passed.
        kwargs['elem_classes'] = 'align'
        # NOTE(review): only ``self`` and kwargs are forwarded; extra positional args are dropped.
        ret = fn(self, **kwargs)
        self.constructor_args.update(kwargs)

        if builder is not None:
            builder.element_dict[elem_id] = self
        return ret

    return wrapper
# Patch the gradio component constructors so every component built inside a
# BaseUI gets its choices, defaults and localized labels filled in automatically.
Textbox.__init__ = update_data(Textbox.__init__)
Dropdown.__init__ = update_data(Dropdown.__init__)
Checkbox.__init__ = update_data(Checkbox.__init__)
Slider.__init__ = update_data(Slider.__init__)
TabItem.__init__ = update_data(TabItem.__init__)
Accordion.__init__ = update_data(Accordion.__init__)
Button.__init__ = update_data(Button.__init__)
File.__init__ = update_data(File.__init__)
Image.__init__ = update_data(Image.__init__)
Video.__init__ = update_data(Video.__init__)
Audio.__init__ = update_data(Audio.__init__)


class BaseUI:
    """Base class for web-UI sections: holds per-class element, locale, choice and default registries."""

    choice_dict: Dict[str, List] = {}
    default_dict: Dict[str, Any] = {}
    locale_dict: Dict[str, Dict] = {}
    element_dict: Dict[str, Dict] = {}
    arguments: Dict[str, str] = {}
    sub_ui: List[Type['BaseUI']] = []
    group: str = None
    lang: str = all_langs[0]
    int_regex = r'^[-+]?[0-9]+$'
    float_regex = r'[-+]?(?:\d*\.*\d+)'
    bool_regex = r'^(T|t)rue$|^(F|f)alse$'
    cache_dir = os.path.join(get_cache_dir(), 'swift-web-ui')
    os.makedirs(cache_dir, exist_ok=True)
    # Quote character used when building shell commands.
    quote = '\'' if sys.platform != 'win32' else '"'
    visible = True
    _locale = {
        'local_dir_alert': {
            'value': {
                'zh': '无法识别model_type和template,请手动选择',
                'en': 'Cannot recognize the model_type and template, please choose manually'
            }
        },
    }

    @classmethod
    def build_ui(cls, base_tab: Type['BaseUI']):
        """Build UI

        Makes ``cls`` / ``base_tab`` the active builders while ``do_build_ui`` runs,
        restores the previous ones afterwards (also on error), and finally runs
        ``after_build_ui`` on every sub UI when ``cls`` is the base tab itself.
        """
        global builder, base_builder
        cls.element_dict = {}
        old_builder = builder
        old_base_builder = base_builder
        builder = cls
        base_builder = base_tab
        try:
            cls.do_build_ui(base_tab)
        finally:
            builder = old_builder
            base_builder = old_base_builder
        if cls is base_tab:
            for ui in cls.sub_ui:
                ui.after_build_ui(base_tab)

    @classmethod
    def after_build_ui(cls, base_tab: Type['BaseUI']):
        """Hook called once the whole base tab is built; no-op by default."""
        pass

    @classmethod
    def do_build_ui(cls, base_tab: Type['BaseUI']):
        """Build UI"""
        pass

    @classmethod
    def save_cache(cls, key, value):
        """Dump ``value`` as JSON to ``<cache_dir>/<key>-<unix timestamp>`` ('/' in key becomes '-')."""
        timestamp = str(int(time.time()))
        key = key.replace('/', '-')
        filename = os.path.join(cls.cache_dir, key + '-' + timestamp)
        with open(filename, 'w', encoding='utf-8') as f:
            json.dump(value, f)

    @classmethod
    def list_cache(cls, key):
        """Return the save times of all cache files for ``key``, newest first.

        Only files named exactly ``<key>-<digits>`` are listed, so the returned
        timestamps can always be passed back to ``load_cache`` with the same key.
        """
        files = []
        key = key.replace('/', '-')
        for _, _, filenames in os.walk(cls.cache_dir):
            for filename in filenames:
                # Split on the last '-' and keep ``key`` itself untouched for later files.
                prefix, sep, ts = filename.rpartition('-')
                if not sep or prefix != key or not ts.isdigit():
                    continue
                dt_object = datetime.fromtimestamp(int(ts))
                formatted_time = dt_object.strftime('%Y/%m/%d %H:%M:%S')
                files.append(formatted_time)
        return sorted(files, reverse=True)

    @classmethod
    def load_cache(cls, key, timestamp) -> Dict[str, Any]:
        """Load the JSON cache saved for ``key`` at ``timestamp`` ('%Y/%m/%d %H:%M:%S')."""
        dt_object = datetime.strptime(timestamp, '%Y/%m/%d %H:%M:%S')
        timestamp = int(dt_object.timestamp())
        key = key.replace('/', '-')
        filename = key + '-' + str(timestamp)
        with open(os.path.join(cls.cache_dir, filename), 'r', encoding='utf-8') as f:
            return json.load(f)

    @classmethod
    def clear_cache(cls, key):
        """Delete every cache file whose name starts with ``key``."""
        key = key.replace('/', '-')
        # NOTE(review): prefix match also removes caches of keys that merely start with ``key``.
        for _, _, filenames in os.walk(cls.cache_dir):
            for filename in filenames:
                if filename.startswith(key):
                    os.remove(os.path.join(cls.cache_dir, filename))

    @classmethod
    def choice(cls, elem_id):
        """Get choice by elem_id"""
        # NOTE(review): iterates BaseUI.sub_ui (not cls.sub_ui) -- confirm this is intended.
        for sub_ui in BaseUI.sub_ui:
            _choice = sub_ui.choice(elem_id)
            if _choice:
                return _choice
        return cls.choice_dict.get(elem_id, [])

    @classmethod
    def default(cls, elem_id):
        """Get default value by elem_id, or None when nothing is registered"""
        if elem_id in cls.default_dict:
            return cls.default_dict.get(elem_id)
        # NOTE(review): iterates BaseUI.sub_ui (not cls.sub_ui) -- confirm this is intended.
        for sub_ui in BaseUI.sub_ui:
            _choice = sub_ui.default(elem_id)
            if _choice:
                return _choice
        return None

    @classmethod
    def locale(cls, elem_id, lang):
        """Get locale by elem_id"""
        return cls.locales(lang)[elem_id]

    @classmethod
    def locales(cls, lang):
        """Get locale by lang"""
        locales = OrderedDict()
        for sub_ui in cls.sub_ui:
            _locales = sub_ui.locales(lang)
            locales.update(_locales)
        # Entries of this class are applied last, so they win over the sub UIs'.
        for key, value in cls.locale_dict.items():
            locales[key] = {k: v[lang] for k, v in value.items()}
        return locales

    @classmethod
    def elements(cls):
        """Get all elements"""
        elements = OrderedDict()
        elements.update(cls.element_dict)
        for sub_ui in cls.sub_ui:
            _elements = sub_ui.elements()
            elements.update(_elements)
        return elements

    @classmethod
    def valid_elements(cls):
        """Get the value-carrying elements (Textbox/Dropdown/Slider/Checkbox), excluding 'train_record'"""
        valid_elements = OrderedDict()
        elements = cls.elements()
        for key, value in elements.items():
            if isinstance(value, (Textbox, Dropdown, Slider, Checkbox)) and key != 'train_record':
                valid_elements[key] = value
        return valid_elements

    @classmethod
    def element_keys(cls):
        """Get the elem_ids of all elements"""
        return list(cls.elements().keys())

    @classmethod
    def valid_element_keys(cls):
        """Get the elem_ids of ``valid_elements``, in the same order"""
        return [
            key for key, value in cls.elements().items()
            if isinstance(value, (Textbox, Dropdown, Slider, Checkbox)) and key != 'train_record'
        ]

    @classmethod
    def element(cls, elem_id):
        """Get element by elem_id"""
        elements = cls.elements()
        return elements[elem_id]

    @classmethod
    def argument(cls, elem_id):
        """Get argument by elem_id"""
        return cls.arguments.get(elem_id)

    @classmethod
    def set_lang(cls, lang):
        """Set the UI language on this class and its direct sub UIs"""
        cls.lang = lang
        for sub_ui in cls.sub_ui:
            sub_ui.lang = lang

    @staticmethod
    def get_choices_from_dataclass(dataclass):
        """Collect per-field choices from ``choices`` metadata or ``Literal`` annotations.

        The field default is inserted at the front of its choice list when missing
        from it (``None`` is used for fields without a plain default).
        """
        choice_dict = {}
        for f in fields(dataclass):
            default_value = f.default
            if default_value is dataclasses.MISSING:
                default_value = None
            if 'choices' in f.metadata:
                choice_dict[f.name] = list(f.metadata['choices'])
            if 'Literal' in str(f.type) and typing.get_args(f.type):
                choice_dict[f.name] = list(typing.get_args(f.type))
            if f.name in choice_dict and default_value not in choice_dict[f.name]:
                choice_dict[f.name].insert(0, default_value)
        return choice_dict

    @staticmethod
    def get_default_value_from_dataclass(dataclass):
        """Map every field name to its default value.

        List defaults are joined with spaces (``None`` when not joinable), falsy
        defaults become ``None``, and fields with neither a default nor a
        default factory map to ``None``.
        """
        default_dict = {}
        for f in fields(dataclass):
            if f.default is not dataclasses.MISSING:
                value = f.default
            elif f.default_factory is not dataclasses.MISSING:
                value = f.default_factory()
            else:
                # Required field: there is nothing to call or copy.
                value = None
            if isinstance(value, list):
                try:
                    value = ' '.join(value)
                except TypeError:
                    value = None
            if not value:
                value = None
            default_dict[f.name] = value
        return default_dict

    @staticmethod
    def get_argument_names(dataclass):
        """Map every field name to its command line flag (``--<name>``)"""
        arguments = {}
        for f in fields(dataclass):
            arguments[f.name] = f'--{f.name}'
        return arguments

    @classmethod
    def update_input_model(cls, model, allow_keys=None, has_record=True, arg_cls=BaseArguments, is_ref_model=False):
        """Compute gradio updates for the valid elements after the model input changed.

        Args:
            model: Model id or local path typed by the user.
            allow_keys: Optional allow-list restricting which element keys are updated.
            has_record: Whether the outputs start with an extra record-list component.
            arg_cls: Arguments class used to load ``args.json`` from a local directory.
            is_ref_model: Whether ``ref_model_type`` should be filled from the matched model.

        Returns:
            One update per output component (a single update instead of a one-item
            list where the original code unwrapped it).
        """
        keys = cls.valid_element_keys()
        if allow_keys:
            keys = [key for key in keys if key in allow_keys]

        def _no_change():
            # "Leave everything as is" for all outputs, unwrapped when there is only one.
            ret = [gr.update()] * (len(keys) + int(has_record))
            return ret[0] if len(ret) == 1 else ret

        if not model:
            return _no_change()

        model_meta = get_matched_model_meta(model)
        local_args_path = os.path.join(model, 'args.json')
        if model_meta is None and not os.path.exists(local_args_path):
            gr.Info(cls._locale['local_dir_alert']['value'][cls.lang])
            return _no_change()

        if os.path.exists(local_args_path):
            try:
                if hasattr(arg_cls, 'resume_from_checkpoint'):
                    try:
                        args = arg_cls(resume_from_checkpoint=model, load_data_args=True)
                    except Exception as e:
                        if 'using `--model`' in str(e):  # TODO a dirty fix
                            args = arg_cls(model=model, load_data_args=True)
                        else:
                            raise
                else:
                    args = arg_cls(ckpt_dir=model, load_data_args=True)
            except ValueError:
                return _no_change()
            values = []
            for key in keys:
                arg_value = getattr(args, key, None)
                if arg_value and key != 'model':
                    if key in ('torch_dtype', 'bnb_4bit_compute_dtype'):
                        # Keep the part after the dot ('torch.x' -> 'x'); also accepts a bare 'x'.
                        arg_value = str(arg_value).split('.')[-1]
                    if isinstance(arg_value, list) and key != 'dataset':
                        try:
                            arg_value = ' '.join(arg_value)
                        except Exception:
                            arg_value = None
                    values.append(gr.update(value=arg_value))
                else:
                    values.append(gr.update())
            ret = [gr.update(choices=[])] * int(has_record) + values
            if len(ret) == 1:
                return ret[0]
            else:
                return ret
        else:
            values = []
            for key in keys:
                if key not in ('template', 'model_type', 'ref_model_type', 'system'):
                    values.append(gr.update())
                elif key in ('template', 'model_type', 'ref_model_type'):
                    if key == 'ref_model_type':
                        if is_ref_model:
                            values.append(gr.update(value=getattr(model_meta, 'model_type')))
                        else:
                            values.append(gr.update())
                    else:
                        values.append(gr.update(value=getattr(model_meta, key)))
                else:
                    values.append(gr.update(value=TEMPLATE_MAPPING[model_meta.template].default_system))

            if has_record:
                return [gr.update(choices=cls.list_cache(model))] + values
            else:
                if len(values) == 1:
                    return values[0]
                return values

    @classmethod
    def update_all_settings(cls, model, train_record, base_tab):
        """Restore the values saved in the cache entry ``train_record`` of ``model``."""
        if not train_record:
            # NOTE(review): sized by cls.elements() while the path below yields one update
            # per base_tab.valid_elements() entry -- confirm against the wired outputs.
            return [gr.update()] * len(cls.elements())
        cache = cls.load_cache(model, train_record)
        updates = []
        for key, value in base_tab.valid_elements().items():
            if key in cache:
                updates.append(gr.update(value=cache[key]))
            else:
                updates.append(gr.update())
        return updates


# diff --git a/ms-swift/swift/ui/llm_eval/__init__.py b/ms-swift/swift/ui/llm_eval/__init__.py
# new file mode 100644
# index 0000000000000000000000000000000000000000..b937315b6e719ae8289fee2908aa486222eb76c5
# --- /dev/null
# +++ b/ms-swift/swift/ui/llm_eval/__init__.py
# @@ -0,0 +1 @@
# Copyright (c) Alibaba, Inc. and its affiliates.
# diff --git a/ms-swift/swift/ui/llm_eval/eval.py b/ms-swift/swift/ui/llm_eval/eval.py
# new file mode 100644
# index 0000000000000000000000000000000000000000..ded9038bbae8d7a25e1bc2085bf74459fde787b5
# --- /dev/null
# +++ b/ms-swift/swift/ui/llm_eval/eval.py
# @@ -0,0 +1,130 @@
# Copyright (c) Alibaba, Inc. and its affiliates.
from typing import Type

import gradio as gr

from swift.ui.base import BaseUI
from swift.utils import get_logger

logger = get_logger()


class Eval(BaseUI):
    """UI section holding the evaluation settings (backend, datasets, limits, endpoint)."""

    group = 'llm_eval'

    locale_dict = {
        'eval_backend': {
            'label': {
                'zh': '评测后端',
                'en': 'Eval backend'
            },
            'info': {
                'zh': '选择评测后端',
                'en': 'Select eval backend'
            }
        },
        'eval_dataset': {
            'label': {
                'zh': '评测数据集',
                'en': 'Evaluation dataset'
            },
            'info': {
                'zh': '选择评测数据集,支持多选 (先选择评测后端)',
                'en': 'Select eval dataset, multiple datasets supported (select eval backend first)'
            }
        },
        'eval_limit': {
            'label': {
                'zh': '评测数据个数',
                'en': 'Eval numbers for each dataset'
            },
            'info': {
                'zh': '每个评测集的取样数',
                'en': 'Number of rows sampled from each dataset'
            }
        },
        'eval_output_dir': {
            'label': {
                'zh': '评测输出目录',
                'en': 'Eval output dir'
            },
            'info': {
                'zh': '评测结果的输出目录',
                'en': 'The dir to save the eval results'
            }
        },
        'custom_eval_config': {
            'label': {
                'zh': '自定义数据集评测配置',
                'en': 'Custom eval config'
            },
            'info': {
                'zh': '可以使用该配置评测自己的数据集,详见github文档的评测部分',
                'en': 'Use this config to eval your own datasets, check the docs in github for details'
            }
        },
        'eval_url': {
            'label': {
                'zh': '评测链接',
                'en': 'The eval url'
            },
            'info': {
                'zh':
                'OpenAI样式的评测链接(如:http://localhost:8080/v1/chat/completions),用于评测接口(模型类型输入为实际模型类型)',
                'en':
                'The OpenAI style link(like: http://localhost:8080/v1/chat/completions) for '
                'evaluation(Input actual model type into model_type)'
            }
        },
        'api_key': {
            'label': {
                'zh': '接口token',
                'en': 'The url token'
            },
            'info': {
                'zh': 'eval_url的token',
                'en': 'The token used with eval_url'
            }
        },
        'infer_backend': {
            'label': {
                'zh': '推理框架',
                'en': 'Infer backend'
            },
        }
    }

    @classmethod
    def do_build_ui(cls, base_tab: Type['BaseUI']):
        """Create the evaluation widgets and refresh the dataset choices when the backend changes."""
        try:
            from swift.llm.argument.eval_args import EvalArguments
            eval_dataset_dict = EvalArguments.list_eval_dataset()
            default_backend = EvalArguments.eval_backend
        except Exception as e:
            # Best effort: the UI is still built, just without backend/dataset choices.
            logger.warning(e)
            eval_dataset_dict = {}
            default_backend = None

        with gr.Row():
            gr.Dropdown(elem_id='eval_backend', choices=list(eval_dataset_dict.keys()), value=default_backend, scale=20)
            gr.Dropdown(
                elem_id='eval_dataset',
                is_list=True,
                choices=eval_dataset_dict.get(default_backend, []),
                multiselect=True,
                allow_custom_value=True,
                scale=20)
            gr.Textbox(elem_id='eval_limit', scale=20)
            gr.Dropdown(elem_id='infer_backend', scale=20)
        with gr.Row():
            gr.Textbox(elem_id='custom_eval_config', scale=20)
            gr.Textbox(elem_id='eval_output_dir', scale=20)
            gr.Textbox(elem_id='eval_url', scale=20)
            gr.Textbox(elem_id='api_key', scale=20)

        def update_eval_dataset(backend):
            # An unknown backend yields no choices instead of a KeyError in the event handler.
            return gr.update(choices=eval_dataset_dict.get(backend, []))

        cls.element('eval_backend').change(update_eval_dataset, [cls.element('eval_backend')],
                                           [cls.element('eval_dataset')])


# diff --git a/ms-swift/swift/ui/llm_eval/model.py b/ms-swift/swift/ui/llm_eval/model.py
# new file mode 100644
# index 0000000000000000000000000000000000000000..570afabf8c63d37a3d1487a97d2591102b93eefd
# --- /dev/null
# +++ b/ms-swift/swift/ui/llm_eval/model.py
# @@ -0,0 +1,78 @@
# Copyright (c) Alibaba, Inc. and its affiliates.
from functools import partial
from typing import Type

import gradio as gr

from swift.llm import TEMPLATE_MAPPING, EvalArguments, ModelType
from swift.llm.model.register import get_all_models
from swift.ui.base import BaseUI


class Model(BaseUI):
    """Model selection row of the evaluation tab: model id/path, model type and template."""

    group = 'llm_eval'

    locale_dict = {
        'checkpoint': {
            'value': {
                'zh': '训练后的模型',
                'en': 'Trained model'
            }
        },
        'model_type': {
            'label': {
                'zh': '选择模型类型',
                'en': 'Select Model Type'
            },
            'info': {
                'zh': 'SWIFT已支持的模型类型',
                'en': 'Base model type supported by SWIFT'
            }
        },
        'model': {
            'label': {
                'zh': '模型id或路径',
                'en': 'Model id or path'
            },
            'info': {
                'zh': '实际的模型id,如果是训练后的模型请填入checkpoint-xxx的目录',
                'en': 'The actual model id or path, if is a trained model, please fill in the checkpoint-xxx dir'
            }
        },
        'reset': {
            'value': {
                'zh': '恢复初始值',
                'en': 'Reset to default'
            },
        },
        'template': {
            'label': {
                'zh': '模型Prompt模板类型',
                'en': 'Prompt template type'
            },
            'info': {
                'zh': '选择匹配模型的Prompt模板',
                'en': 'Choose the template type of the model'
            }
        },
    }

    @classmethod
    def do_build_ui(cls, base_tab: Type['BaseUI']):
        """Lay out the three dropdowns (model, model_type, template) in a single row."""
        row = gr.Row()
        with row:
            gr.Dropdown(
                elem_id='model',
                scale=20,
                choices=get_all_models(),
                value='Qwen/Qwen2.5-7B-Instruct',
                allow_custom_value=True)
            gr.Dropdown(elem_id='model_type', choices=ModelType.get_model_name_list(), scale=20)
            gr.Dropdown(elem_id='template', choices=list(TEMPLATE_MAPPING.keys()), scale=20)

    @classmethod
    def after_build_ui(cls, base_tab: Type['BaseUI']):
        """Refresh every valid element of this section whenever the model dropdown changes."""
        model_dropdown = cls.element('model')
        on_model_change = partial(cls.update_input_model, arg_cls=EvalArguments, has_record=False)
        targets = list(cls.valid_elements().values())
        model_dropdown.change(on_model_change, inputs=[model_dropdown], outputs=targets)


# diff --git a/ms-swift/swift/ui/llm_export/llm_export.py b/ms-swift/swift/ui/llm_export/llm_export.py
# new file mode 100644
# index 0000000000000000000000000000000000000000..b71ccf6d7f3d12cf5cd279bff716d2b9557a4373
# --- /dev/null
# +++ b/ms-swift/swift/ui/llm_export/llm_export.py
# @@
class LLMExport(BaseUI):
    """Web-UI tab that collects export options and starts ``swift export``.

    The tab is assembled from the ``Model``, ``Export`` and ``ExportRuntime``
    sub-UIs plus a free-form "more params" box, a start button and a device
    selector. Pressing the button turns the current widget values into a
    shell command and runs it in the background.
    """

    group = 'llm_export'

    sub_ui = [Model, Export, ExportRuntime]

    # Localized widget texts, keyed by elem_id.
    locale_dict = {
        'llm_export': {
            'label': {
                'zh': 'LLM导出',
                'en': 'LLM export',
            }
        },
        'more_params': {
            'label': {
                'zh': '更多参数',
                'en': 'More params'
            },
            'info': {
                'zh': '以json格式或--xxx xxx命令行格式填入',
                'en': 'Fill in with json format or --xxx xxx cmd format'
            }
        },
        'export': {
            'value': {
                'zh': '开始导出',
                'en': 'Begin Export'
            },
        },
        'gpu_id': {
            'label': {
                'zh': '选择可用GPU',
                'en': 'Choose GPU'
            },
            'info': {
                'zh': '选择使用的GPU号,如CUDA不可用只能选择CPU',
                'en': 'Select GPU to export'
            }
        },
    }

    choice_dict = BaseUI.get_choices_from_dataclass(ExportArguments)
    default_dict = BaseUI.get_default_value_from_dataclass(ExportArguments)
    arguments = BaseUI.get_argument_names(ExportArguments)

    @classmethod
    def do_build_ui(cls, base_tab: Type['BaseUI']):
        """Create the export tab's widgets and wire their events.

        Args:
            base_tab: The UI class whose registered elements are used as the
                inputs/outputs of the event handlers.
        """
        with gr.TabItem(elem_id='llm_export', label=''):
            # Preselect the first accelerator when one is reported, else CPU.
            device_count = get_device_count()
            default_device = '0' if device_count > 0 else 'cpu'
            with gr.Blocks():
                Model.build_ui(base_tab)
                Export.build_ui(base_tab)
                ExportRuntime.build_ui(base_tab)
                with gr.Row():
                    gr.Textbox(elem_id='more_params', lines=4, scale=20)
                    gr.Button(elem_id='export', scale=2, variant='primary')
                    gr.Dropdown(
                        elem_id='gpu_id',
                        multiselect=True,
                        choices=[str(i) for i in range(device_count)] + ['cpu'],
                        value=default_device,
                        scale=8)

                cls.element('export').click(
                    cls.export_model, list(base_tab.valid_elements().values()),
                    [cls.element('runtime_tab'), cls.element('running_tasks')])

                base_tab.element('running_tasks').change(
                    partial(ExportRuntime.task_changed, base_tab=base_tab), [base_tab.element('running_tasks')],
                    list(base_tab.valid_elements().values()) + [cls.element('log')])
                ExportRuntime.element('kill_task').click(
                    ExportRuntime.kill_task,
                    [ExportRuntime.element('running_tasks')],
                    [ExportRuntime.element('running_tasks')] + [ExportRuntime.element('log')],
                )

    @classmethod
    def export(cls, *args):
        """Translate the current widget values into a ``swift export`` command.

        Values that differ from the ``ExportArguments`` defaults become
        ``--key value`` options; the "more params" box contributes either
        extra keyword arguments (JSON object) or raw command-line text.

        Args:
            *args: Widget values, positionally aligned with
                ``cls.valid_element_keys()``.

        Returns:
            A ``(run_command, export_args, log_file)`` tuple: the shell command
            string, the constructed ``ExportArguments`` and the absolute path
            of the log file the command redirects its output to.

        Raises:
            ValueError: If ``cpu`` is selected together with other devices.
        """
        export_args = cls.get_default_value_from_dataclass(ExportArguments)
        kwargs = {}
        kwargs_is_list = {}
        other_kwargs = {}
        more_params = {}
        more_params_cmd = ''
        keys = cls.valid_element_keys()
        for key, value in zip(keys, args):
            compare_value = export_args.get(key)
            # Scalars are compared through their string form because text
            # widgets deliver strings; containers are compared as they are.
            compare_value_arg = compare_value if isinstance(compare_value, (list, dict)) else str(compare_value)
            compare_value_ui = value if isinstance(value, (list, dict)) else str(value)
            if key in export_args and compare_value_ui != compare_value_arg and value:
                if isinstance(value, str):
                    if re.fullmatch(cls.int_regex, value):
                        value = int(value)
                    elif re.fullmatch(cls.float_regex, value):
                        value = float(value)
                    elif re.fullmatch(cls.bool_regex, value):
                        value = value.lower() == 'true'
                kwargs[key] = ' '.join(value) if isinstance(value, list) else value
                kwargs_is_list[key] = isinstance(value, list) or getattr(cls.element(key), 'is_list', False)
            else:
                other_kwargs[key] = value
                if key == 'more_params' and value:
                    try:
                        parsed = json.loads(value)
                    except (JSONDecodeError, TypeError):
                        # Not JSON: treat the text as raw command-line options.
                        more_params_cmd = str(value)
                    else:
                        if isinstance(parsed, dict):
                            more_params = parsed
                        else:
                            # Valid JSON but not an object (e.g. ``123``); it
                            # cannot be merged as keyword arguments.
                            more_params_cmd = str(value)

        kwargs.update(more_params)
        model = kwargs.get('model')
        # A directory containing args.json is passed on as ``ckpt_dir``.
        # ``model`` may be absent when the field was left empty.
        if (isinstance(model, str) and os.path.exists(model)
                and os.path.exists(os.path.join(model, 'args.json'))):
            kwargs['ckpt_dir'] = kwargs.pop('model')
        export_args = ExportArguments(
            **{key: value.split(' ') if kwargs_is_list.get(key) else value
               for key, value in kwargs.items()})

        quote = cls.quote
        sep = f'{quote} {quote}'
        param_parts = []
        for name, value in kwargs.items():
            if isinstance(value, list):
                rendered = sep.join(str(item) for item in value)
            elif kwargs_is_list.get(name):
                rendered = sep.join(arg for arg in value.split(' ') if arg.strip())
            else:
                rendered = value
            param_parts.append(f'--{name} {quote}{rendered}{quote} ')
        params = ''.join(param_parts)
        params += more_params_cmd + ' '

        devices = other_kwargs['gpu_id'] or []
        if isinstance(devices, str):
            # A single, non-list selection; do not iterate it per character.
            devices = [devices]
        devices = [d for d in devices if d]
        if 'cpu' in devices and len(devices) != 1:
            raise ValueError(f'"cpu" cannot be combined with other devices, got: {devices}')
        gpus = ','.join(devices)
        cuda_param = ''
        if gpus != 'cpu':
            if is_torch_npu_available():
                cuda_param = f'ASCEND_RT_VISIBLE_DEVICES={gpus}'
            elif is_torch_cuda_available():
                cuda_param = f'CUDA_VISIBLE_DEVICES={gpus}'

        # Zero-padded so that distinct times cannot collapse into the same
        # directory name (unpadded, 1:23:04 and 12:3:4 both end in "1234").
        time_str = datetime.now().strftime('%Y%m%d%H%M%S')
        file_path = f'output/{export_args.model_type}-{time_str}'
        os.makedirs(file_path, exist_ok=True)
        log_file = os.path.join(os.getcwd(), f'{file_path}/run_export.log')
        export_args.log_file = log_file
        params += f'--log_file "{log_file}" '
        params += '--ignore_args_error true '
        additional_param = ''
        if export_args.quant_method == 'gptq':
            additional_param = 'OMP_NUM_THREADS=14'
        # NOTE(security): the command is assembled from text typed into the UI
        # and is later executed through the shell by ``export_model``.
        # The redirect target is quoted so paths containing spaces still work.
        if sys.platform == 'win32':
            if cuda_param:
                cuda_param = f'set {cuda_param} && '
            if additional_param:
                additional_param = f'set {additional_param} && '
            run_command = f'{cuda_param}{additional_param}start /b swift export {params} > "{log_file}" 2>&1'
        else:
            run_command = f'{cuda_param} {additional_param} nohup swift export {params} > "{log_file}" 2>&1 &'
        return run_command, export_args, log_file

    @classmethod
    def export_model(cls, *args):
        """Click handler: build the export command, run it and refresh the task list.

        Args:
            *args: Widget values, forwarded unchanged to ``export``.

        Returns:
            A pair of updates for the ``runtime_tab`` and ``running_tasks``
            elements: the tab is opened and the task list is refreshed for the
            new log file.
        """
        run_command, export_args, log_file = cls.export(*args)
        os.system(run_command)
        # Presumably gives the background process time to start before the
        # task list is queried -- TODO confirm.
        time.sleep(2)
        return gr.update(open=True), ExportRuntime.refresh_tasks(log_file)
@classmethod
def after_build_ui(cls, base_tab: Type['BaseUI']):
    """Register the change handler of the ``model`` element.

    When the model selection changes, ``update_input_model`` is invoked
    (bound to ``ExportArguments`` with ``has_record=False``) with the model
    element as input and every valid element of this UI as output.

    Args:
        base_tab: The enclosing UI class; not used by this hook.
    """
    on_model_change = partial(cls.update_input_model, arg_cls=ExportArguments, has_record=False)
    model_dropdown = cls.element('model')
    refreshed_elements = list(cls.valid_elements().values())
    model_dropdown.change(on_model_change, inputs=[model_dropdown], outputs=refreshed_elements)
class Generate(BaseUI):
    """Generation-parameter widgets (sampling controls and system prompt) of the ``llm_infer`` group."""

    group = 'llm_infer'

    # Widget texts keyed by elem_id. The four sampling knobs are labelled with
    # their own parameter name in both languages, so those entries are
    # generated instead of being spelled out one by one.
    locale_dict = {
        'max_new_tokens': {
            'label': {'zh': '生成序列最大长度', 'en': 'Max new tokens'},
        },
        **{
            knob: {'label': {'zh': knob, 'en': knob}}
            for knob in ('temperature', 'top_k', 'top_p', 'repetition_penalty')
        },
        'system': {
            'label': {'zh': 'system字段', 'en': 'system'},
            'info': {
                'zh': 'system字段支持在加载模型后修改',
                'en': 'system can be modified after the model weights loaded',
            },
        },
    }

    @classmethod
    def do_build_ui(cls, base_tab: Type['BaseUI']):
        """Lay out the generation controls in two rows.

        The first row holds the ``max_new_tokens`` textbox followed by the
        sampling sliders; the second row holds the ``system`` textbox.

        Args:
            base_tab: The enclosing UI class; not used directly here.
        """
        # (elem_id, minimum, maximum, step, initial value), in display order.
        slider_specs = (
            ('temperature', 0.0, 10, 0.1, 0.3),
            ('top_k', 1, 100, 5, 20),
            ('top_p', 0.0, 1.0, 0.05, 0.7),
            ('repetition_penalty', 0.0, 10, 0.05, 1.05),
        )
        with gr.Row():
            gr.Textbox(elem_id='max_new_tokens', lines=1, value='2048')
            for elem_id, lowest, highest, step, initial in slider_specs:
                gr.Slider(elem_id=elem_id, minimum=lowest, maximum=highest, step=step, value=initial)
        with gr.Row():
            gr.Textbox(elem_id='system', lines=4, scale=20)
a/ms-swift/swift/ui/llm_infer/llm_infer.py b/ms-swift/swift/ui/llm_infer/llm_infer.py new file mode 100644 index 0000000000000000000000000000000000000000..70480631879158441604e7d9034b8beb048f3181 --- /dev/null +++ b/ms-swift/swift/ui/llm_infer/llm_infer.py @@ -0,0 +1,396 @@ +# Copyright (c) Alibaba, Inc. and its affiliates. +import os +import re +import signal +import sys +import time +from copy import deepcopy +from datetime import datetime +from functools import partial +from typing import List, Type + +import gradio as gr +import json +import torch +from json import JSONDecodeError +from transformers.utils import is_torch_cuda_available, is_torch_npu_available + +from swift.llm import DeployArguments, InferArguments, InferClient, InferRequest, RequestConfig +from swift.ui.base import BaseUI +from swift.ui.llm_infer.model import Model +from swift.ui.llm_infer.runtime import Runtime +from swift.utils import get_device_count, get_logger + +logger = get_logger() + + +class LLMInfer(BaseUI): + + group = 'llm_infer' + + is_multimodal = True + + sub_ui = [Model, Runtime] + + locale_dict = { + 'generate_alert': { + 'value': { + 'zh': '请先部署模型', + 'en': 'Please deploy model first', + } + }, + 'port': { + 'label': { + 'zh': '端口', + 'en': 'port' + }, + }, + 'llm_infer': { + 'label': { + 'zh': 'LLM推理', + 'en': 'LLM Inference', + } + }, + 'load_alert': { + 'value': { + 'zh': '部署中,请点击"展示部署状态"查看', + 'en': 'Start to deploy model, ' + 'please Click "Show running ' + 'status" to view details', + } + }, + 'loaded_alert': { + 'value': { + 'zh': '模型加载完成', + 'en': 'Model loaded' + } + }, + 'port_alert': { + 'value': { + 'zh': '该端口已被占用', + 'en': 'The port has been occupied' + } + }, + 'chatbot': { + 'value': { + 'zh': '对话框', + 'en': 'Chat bot' + }, + }, + 'infer_model_type': { + 'label': { + 'zh': 'Lora模块', + 'en': 'Lora module' + }, + 'info': { + 'zh': '发送给server端哪个LoRA,默认为`default`', + 'en': 'Which LoRA to use on server, default value is `default`' + } + }, + 'prompt': { + 'label': { 
+ 'zh': '请输入:', + 'en': 'Input:' + }, + }, + 'clear_history': { + 'value': { + 'zh': '清除对话信息', + 'en': 'Clear history' + }, + }, + 'submit': { + 'value': { + 'zh': '🚀 发送', + 'en': '🚀 Send' + }, + }, + 'gpu_id': { + 'label': { + 'zh': '选择可用GPU', + 'en': 'Choose GPU' + }, + 'info': { + 'zh': '选择训练使用的GPU号,如CUDA不可用只能选择CPU', + 'en': 'Select GPU to train' + } + }, + } + + choice_dict = BaseUI.get_choices_from_dataclass(InferArguments) + default_dict = BaseUI.get_default_value_from_dataclass(InferArguments) + arguments = BaseUI.get_argument_names(InferArguments) + + @classmethod + def do_build_ui(cls, base_tab: Type['BaseUI']): + with gr.TabItem(elem_id='llm_infer', label=''): + default_device = 'cpu' + device_count = get_device_count() + if device_count > 0: + default_device = '0' + with gr.Blocks(): + infer_request = gr.State(None) + Model.build_ui(base_tab) + Runtime.build_ui(base_tab) + with gr.Row(): + gr.Dropdown( + elem_id='gpu_id', + multiselect=True, + choices=[str(i) for i in range(device_count)] + ['cpu'], + value=default_device, + scale=8) + infer_model_type = gr.Textbox(elem_id='infer_model_type', scale=4) + gr.Textbox(elem_id='port', lines=1, value='8000', scale=4) + chatbot = gr.Chatbot(elem_id='chatbot', elem_classes='control-height') + with gr.Row(): + prompt = gr.Textbox(elem_id='prompt', lines=1, interactive=True) + with gr.Tabs(visible=cls.is_multimodal): + with gr.TabItem(label='Image'): + image = gr.Image(type='filepath') + with gr.TabItem(label='Video'): + video = gr.Video() + with gr.TabItem(label='Audio'): + audio = gr.Audio(type='filepath') + + with gr.Row(): + clear_history = gr.Button(elem_id='clear_history') + submit = gr.Button(elem_id='submit') + + cls.element('load_checkpoint').click( + cls.deploy_model, list(base_tab.valid_elements().values()), + [cls.element('runtime_tab'), cls.element('running_tasks')]) + submit.click( + cls.send_message, + inputs=[ + cls.element('running_tasks'), + cls.element('template'), prompt, image, video, audio, 
@classmethod
def deploy(cls, *args):
    """Translate the current widget values into a ``swift deploy`` command.

    Values that differ from the ``DeployArguments`` defaults become
    ``--key value`` options; the "more params" box contributes either extra
    keyword arguments (JSON object) or raw command-line text.

    Args:
        *args: Widget values, positionally aligned with
            ``cls.valid_element_keys()``.

    Returns:
        A ``(run_command, deploy_args, log_file)`` tuple: the shell command
        string, the constructed ``DeployArguments`` and the absolute path of
        the log file the command redirects its output to.

    Raises:
        gr.Error: If the requested port is among ``Runtime.get_all_ports()``.
        ValueError: If ``cpu`` is selected together with other devices.
    """
    deploy_args = cls.get_default_value_from_dataclass(DeployArguments)
    kwargs = {}
    kwargs_is_list = {}
    other_kwargs = {}
    more_params = {}
    more_params_cmd = ''
    keys = cls.valid_element_keys()
    for key, value in zip(keys, args):
        compare_value = deploy_args.get(key)
        # Scalars are compared through their string form because text widgets
        # deliver strings; containers are compared as they are.
        compare_value_arg = compare_value if isinstance(compare_value, (list, dict)) else str(compare_value)
        compare_value_ui = value if isinstance(value, (list, dict)) else str(value)
        if key in deploy_args and compare_value_ui != compare_value_arg and value:
            if isinstance(value, str):
                if re.fullmatch(cls.int_regex, value):
                    value = int(value)
                elif re.fullmatch(cls.float_regex, value):
                    value = float(value)
                elif re.fullmatch(cls.bool_regex, value):
                    value = value.lower() == 'true'
            kwargs[key] = ' '.join(value) if isinstance(value, list) else value
            kwargs_is_list[key] = isinstance(value, list) or getattr(cls.element(key), 'is_list', False)
        else:
            other_kwargs[key] = value
            if key == 'more_params' and value:
                try:
                    parsed = json.loads(value)
                except (JSONDecodeError, TypeError):
                    # Not JSON: treat the text as raw command-line options.
                    more_params_cmd = str(value)
                else:
                    if isinstance(parsed, dict):
                        more_params = parsed
                    else:
                        # Valid JSON but not an object (e.g. ``123``); it
                        # cannot be merged as keyword arguments.
                        more_params_cmd = str(value)

    kwargs.update(more_params)
    model = kwargs.get('model')
    # A directory containing args.json is passed on as ``ckpt_dir`` and its
    # recorded model/train type is reused. ``model`` may be absent when the
    # field was left empty.
    if (isinstance(model, str) and os.path.exists(model)
            and os.path.exists(os.path.join(model, 'args.json'))):
        kwargs['ckpt_dir'] = kwargs.pop('model')
        with open(os.path.join(kwargs['ckpt_dir'], 'args.json'), 'r', encoding='utf-8') as f:
            _json = json.load(f)
        kwargs['model_type'] = _json['model_type']
        kwargs['train_type'] = _json['train_type']
    deploy_args = DeployArguments(
        **{key: value.split(' ') if kwargs_is_list.get(key) else value
           for key, value in kwargs.items()})
    if deploy_args.port in Runtime.get_all_ports():
        raise gr.Error(cls.locale('port_alert', cls.lang)['value'])

    quote = cls.quote
    sep = f'{quote} {quote}'
    param_parts = []
    for name, value in kwargs.items():
        if isinstance(value, list):
            rendered = sep.join(str(item) for item in value)
        elif kwargs_is_list.get(name):
            rendered = sep.join(arg for arg in value.split(' ') if arg.strip())
        else:
            rendered = value
        param_parts.append(f'--{name} {quote}{rendered}{quote} ')
    params = ''.join(param_parts)
    if 'port' not in kwargs:
        # Always pass the port explicitly, even when it equals the default.
        params += f'--port "{deploy_args.port}" '
    params += more_params_cmd + ' '

    devices = other_kwargs['gpu_id'] or []
    if isinstance(devices, str):
        # A single, non-list selection; do not iterate it per character.
        devices = [devices]
    devices = [d for d in devices if d]
    if 'cpu' in devices and len(devices) != 1:
        raise ValueError(f'"cpu" cannot be combined with other devices, got: {devices}')
    gpus = ','.join(devices)
    cuda_param = ''
    if gpus != 'cpu':
        if is_torch_npu_available():
            cuda_param = f'ASCEND_RT_VISIBLE_DEVICES={gpus}'
        elif is_torch_cuda_available():
            cuda_param = f'CUDA_VISIBLE_DEVICES={gpus}'

    # Zero-padded so that distinct times cannot collapse into the same
    # directory name (unpadded, 1:23:04 and 12:3:4 both end in "1234").
    time_str = datetime.now().strftime('%Y%m%d%H%M%S')
    file_path = f'output/{deploy_args.model_type}-{time_str}'
    os.makedirs(file_path, exist_ok=True)
    log_file = os.path.join(os.getcwd(), f'{file_path}/run_deploy.log')
    deploy_args.log_file = log_file
    params += f'--log_file "{log_file}" '
    params += '--ignore_args_error true '
    # NOTE(security): the command is assembled from text typed into the UI and
    # is later executed through the shell by the caller.
    # The redirect target is quoted so paths containing spaces still work.
    if sys.platform == 'win32':
        if cuda_param:
            cuda_param = f'set {cuda_param} && '
        run_command = f'{cuda_param}start /b swift deploy {params} > "{log_file}" 2>&1'
    else:
        run_command = f'{cuda_param} nohup swift deploy {params} > "{log_file}" 2>&1 &'
    return run_command, deploy_args, log_file