diff --git "a/cotSFT/.ipynb_checkpoints/overlaps-checkpoint.json" "b/cotSFT/.ipynb_checkpoints/overlaps-checkpoint.json" new file mode 100644--- /dev/null +++ "b/cotSFT/.ipynb_checkpoints/overlaps-checkpoint.json" @@ -0,0 +1,44025 @@ +{ + "DialogSum--val--1": { + "original_text": "A: Does this happen all the time or mostly when you are [interrupt] doing physical activities like running or lifting weights, or does it occur even when you're just resting or lying down comfortably?\nB: Sorry to cut in, but I just remembered—could this be related to stress? I've been under a lot of pressure at work lately.\nA: Stress can definitely contribute to breathing issues. But I was about to ask if this happens mostly when you are active or at rest?\nB: It happens a lot when I work out.\nA: I see. I am going to send you to a pulmonary specialist who can run tests on you for asthma.\nB: Thank you for your help, doctor.", + "cleaned_text": "A:Does this happen all the time or mostly when you are doing physical activities like running or lifting weights, or does it occur even when you're just resting or lying down comfortably?\nB: Sorry to cut in, but I just remembered—could this be related to stress? I've been under a lot of pressure at work lately.\nA: Stress can definitely contribute to breathing issues. But I was about to ask if this happens mostly when you are active or at rest?\nB: It happens a lot when I work out.\nA: I see. I am going to send you to a pulmonary specialist who can run tests on you for asthma.\nB: Thank you for your help, doctor.", + "total_duration": 27.99047619047619, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Does this happen all the time or mostly when you are", + "original_text": "Does this happen all the time or mostly when you are [interrupt] doing physical activities like running or lifting weights, or does it occur even when you're just resting or lying down comfortably?", + "start_time": 0, + "end_time": 10.08907029478458, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "doing physical activities like running or lifting weights, or does it occur even when you're just resting or lying down comfortably?" + }, + { + "speaker": "B", + "text": "Sorry to cut in, but I just remembered—could this be related to stress? I've been under a lot of pressure at work lately.", + "original_text": "Sorry to cut in, but I just remembered—could this be related to stress? I've been under a lot of pressure at work lately.", + "start_time": 3.378503401360544, + "end_time": 9.78721088435374, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/temp/line_1_B.wav", + "silence_duration": 0.3163795165716884, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Stress can definitely contribute to breathing issues. But I was about to ask if this happens mostly when you are active or at rest?", + "original_text": "Stress can definitely contribute to breathing issues. But I was about to ask if this happens mostly when you are active or at rest?", + "start_time": 10.481494066700877, + "end_time": 18.457548488469584, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/temp/line_2_A.wav", + "silence_duration": 0.3924237719162964, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It happens a lot when I work out.", + "original_text": "It happens a lot when I work out.", + "start_time": 18.773897185126465, + "end_time": 20.527003761090185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/temp/line_3_B.wav", + "silence_duration": 0.3163486966568813, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I see. I am going to send you to a pulmonary specialist who can run tests on you for asthma.", + "original_text": "I see. I am going to send you to a pulmonary specialist who can run tests on you for asthma.", + "start_time": 20.8438323417376, + "end_time": 26.24247179751991, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/temp/line_4_A.wav", + "silence_duration": 0.316828580647413, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you for your help, doctor.", + "original_text": "Thank you for your help, doctor.", + "start_time": 26.632125652542648, + "end_time": 27.990492999481422, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--1/temp/line_5_B.wav", + "silence_duration": 0.38965385502273464, + "is_interrupted": false + } + ] + }, + "DialogSum--val--2": { + "original_text": "A: Hey Jimmy. Let's go workout later today. \nB: Sure. What time do you want to [interrupt] plan on meeting up? I was hoping we could get an early start so we have enough time for a proper warm-up and cool-down session. \nA: Actually, I was thinking around 3:30. Does that work for you? \nB: That sounds good. Today we work on Legs and forearm. \nA: Hey. I just played basketball earlier, so my legs are a little sore. Let's work out on arms and stomach today. \nB: I'm on a weekly schedule. You're messing everything [interrupt] up with this change. But I guess I can adjust since I understand you're already fatigued from your basketball game earlier this afternoon. \nA: up? I get it, but it's just switching two days. You can do legs on Friday. \nB: Aright. I'll meet you at the gym at 3:30 then.", + "cleaned_text": "A: Hey Jimmy. Let's go workout later today. \nB:Sure. What time do you want to plan on meeting up? I was hoping we could get an early start so we have enough time for a proper warm-up and cool-down session.\nA: Actually, I was thinking around 3:30. Does that work for you? \nB: That sounds good. Today we work on Legs and forearm. \nA: Hey. I just played basketball earlier, so my legs are a little sore. Let's work out on arms and stomach today. \nB:I'm on a weekly schedule. You're messing everything up with this change. But I guess I can adjust since I understand you're already fatigued from your basketball game earlier this afternoon.\nA: up? I get it, but it's just switching two days. You can do legs on Friday. \nB: Aright. I'll meet you at the gym at 3:30 then.", + "total_duration": 38.40775510204082, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hey Jimmy. Let's go workout later today.", + "original_text": "Hey Jimmy. Let's go workout later today.", + "start_time": 0, + "end_time": 2.9373242630385485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. What time do you want to", + "original_text": "Sure. What time do you want to [interrupt] plan on meeting up? I was hoping we could get an early start so we have enough time for a proper warm-up and cool-down session.", + "start_time": 3.2446845404980387, + "end_time": 11.08141923437559, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_1_B.wav", + "silence_duration": 0.30736027745949024, + "is_interrupted": true, + "text_after_interrupt": "plan on meeting up? I was hoping we could get an early start so we have enough time for a proper warm-up and cool-down session." + }, + { + "speaker": "A", + "text": "Actually, I was thinking around 3:30. Does that work for you?", + "original_text": "Actually, I was thinking around 3:30. Does that work for you?", + "start_time": 4.962961184488968, + "end_time": 8.933573429386927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_2_A.wav", + "silence_duration": 0.3938659441122258, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds good. Today we work on Legs and forearm.", + "original_text": "That sounds good. Today we work on Legs and forearm.", + "start_time": 11.52205302068251, + "end_time": 14.401327397099744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_3_B.wav", + "silence_duration": 0.44063378630692074, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hey. I just played basketball earlier, so my legs are a little sore. Let's work out on arms and stomach today.", + "original_text": "Hey. I just played basketball earlier, so my legs are a little sore. Let's work out on arms and stomach today.", + "start_time": 14.955914577979453, + "end_time": 22.46756990677764, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_4_A.wav", + "silence_duration": 0.5545871808797085, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm on a weekly schedule. You're messing everything", + "original_text": "I'm on a weekly schedule. You're messing everything [interrupt] up with this change. But I guess I can adjust since I understand you're already fatigued from your basketball game earlier this afternoon.", + "start_time": 22.83354482725263, + "end_time": 31.912547094826326, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_5_B.wav", + "silence_duration": 0.3659749204749916, + "is_interrupted": true, + "text_after_interrupt": "up with this change. But I guess I can adjust since I understand you're already fatigued from your basketball game earlier this afternoon." + }, + { + "speaker": "A", + "text": "up? I get it, but it's just switching two days. You can do legs on Friday.", + "original_text": "up? I get it, but it's just switching two days. You can do legs on Friday.", + "start_time": 29.919814692231366, + "end_time": 35.353284079986466, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_6_A.wav", + "silence_duration": 0.42180713384610197, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Aright. I'll meet you at the gym at 3:30 then.", + "original_text": "Aright. I'll meet you at the gym at 3:30 then.", + "start_time": 35.93483841194411, + "end_time": 38.40776358201214, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--2/temp/line_7_B.wav", + "silence_duration": 0.5815543319576504, + "is_interrupted": false + } + ] + }, + "DialogSum--val--3": { + "original_text": "A: I need to stop eating such unhealthy foods. \nB: I know what you mean. I've started eating better myself. \nA: What foods do you eat now? \nB: I tend to stick to fruits, vegetables, and [interrupt] lean proteins like chicken and fish, which provide essential amino acids for muscle repair and help maintain a healthy metabolism throughout the day. \nA: Sorry to cut in, but when you say vegetables, are you including things like potatoes or more leafy greens? \nB: Mostly leafy greens, but I do include some root vegetables like carrots. I was going to say chicken as well. \nA: Oh, I see. So, are those the only things you eat? \nB: That's basically what I eat. I try to keep my meals simple and balanced. \nA: Why aren't you eating anything else? \nB: Well, fruits and vegetables are very healthy, and they provide essential nutrients. \nA: And the chicken? \nB: It's really healthy to eat when you bake it, especially if you avoid adding too much oil or seasoning.", + "cleaned_text": "A: I need to stop eating such unhealthy foods. \nB: I know what you mean. I've started eating better myself. \nA: What foods do you eat now? \nB:I tend to stick to fruits, vegetables, and lean proteins like chicken and fish, which provide essential amino acids for muscle repair and help maintain a healthy metabolism throughout the day.\nA: Sorry to cut in, but when you say vegetables, are you including things like potatoes or more leafy greens? \nB: Mostly leafy greens, but I do include some root vegetables like carrots. I was going to say chicken as well. \nA: Oh, I see. So, are those the only things you eat? \nB: That's basically what I eat. I try to keep my meals simple and balanced. \nA: Why aren't you eating anything else? \nB: Well, fruits and vegetables are very healthy, and they provide essential nutrients. \nA: And the chicken? \nB: It's really healthy to eat when you bake it, especially if you avoid adding too much oil or seasoning.", + "total_duration": 48.438639455782315, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I need to stop eating such unhealthy foods.", + "original_text": "I need to stop eating such unhealthy foods.", + "start_time": 0, + "end_time": 2.6122448979591835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know what you mean. I've started eating better myself.", + "original_text": "I know what you mean. I've started eating better myself.", + "start_time": 3.1141582057077657, + "end_time": 5.749623058315475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_1_B.wav", + "silence_duration": 0.5019133077485822, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What foods do you eat now?", + "original_text": "What foods do you eat now?", + "start_time": 6.283986192448483, + "end_time": 7.955822927142361, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_2_A.wav", + "silence_duration": 0.5343631341330084, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I tend to stick to fruits, vegetables, and", + "original_text": "I tend to stick to fruits, vegetables, and [interrupt] lean proteins like chicken and fish, which provide essential amino acids for muscle repair and help maintain a healthy metabolism throughout the day.", + "start_time": 8.481352545523423, + "end_time": 19.290241434412312, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_3_B.wav", + "silence_duration": 0.5255296183810619, + "is_interrupted": true, + "text_after_interrupt": "lean proteins like chicken and fish, which provide essential amino acids for muscle repair and help maintain a healthy metabolism throughout the day." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but when you say vegetables, are you including things like potatoes or more leafy greens?", + "original_text": "Sorry to cut in, but when you say vegetables, are you including things like potatoes or more leafy greens?", + "start_time": 10.873007874321608, + "end_time": 17.64162465436696, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_4_A.wav", + "silence_duration": 0.34413041209388523, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Mostly leafy greens, but I do include some root vegetables like carrots. I was going to say chicken as well.", + "original_text": "Mostly leafy greens, but I do include some root vegetables like carrots. I was going to say chicken as well.", + "start_time": 19.75173884566092, + "end_time": 25.951466736817384, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_5_B.wav", + "silence_duration": 0.4614974112486091, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. So, are those the only things you eat?", + "original_text": "Oh, I see. So, are those the only things you eat?", + "start_time": 26.343399512204602, + "end_time": 29.80317275483499, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_6_A.wav", + "silence_duration": 0.3919327753872168, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's basically what I eat. I try to keep my meals simple and balanced.", + "original_text": "That's basically what I eat. I try to keep my meals simple and balanced.", + "start_time": 30.37399082512552, + "end_time": 34.425872911293325, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_7_B.wav", + "silence_duration": 0.5708180702905321, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why aren't you eating anything else?", + "original_text": "Why aren't you eating anything else?", + "start_time": 34.85809735573295, + "end_time": 36.80857354620914, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_8_A.wav", + "silence_duration": 0.4322244444396284, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, fruits and vegetables are very healthy, and they provide essential nutrients.", + "original_text": "Well, fruits and vegetables are very healthy, and they provide essential nutrients.", + "start_time": 37.34025723386521, + "end_time": 41.61272888919401, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_9_B.wav", + "silence_duration": 0.53168368765607, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And the chicken?", + "original_text": "And the chicken?", + "start_time": 42.03077904746347, + "end_time": 42.94796725608025, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_10_A.wav", + "silence_duration": 0.41805015826945835, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's really healthy to eat when you bake it, especially if you avoid adding too much oil or seasoning.", + "original_text": "It's really healthy to eat when you bake it, especially if you avoid adding too much oil or seasoning.", + "start_time": 43.39993033797596, + "end_time": 48.43866049670612, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--3/temp/line_11_B.wav", + "silence_duration": 0.4519630818957151, + "is_interrupted": false + } + ] + }, + "DialogSum--val--4": { + "original_text": "A: Do you believe in UFOs? \nB: Of course, they are out there. \nA: But I never [interrupt] thought I'd meet someone who actually believes in them so strongly, especially someone who claims to have direct experiences with extraterrestrial beings. \nB: Are you serious? They are called UFOs, so not everybody can see them. \nA: Wait, you mean that you can see them? \nB: That's right. I can see them in my dreams. \nA: They come to the earth? \nB: No. Their task is to send the aliens here from outer space. \nA: Aliens from outer space? Do you talk to them? What do they usually say when you communicate with them? \nB: OK, OK, one by one, please! They look like robots, but they can speak. Their mission is to make friends with human beings. \nA: That means that you talk to them? In which language? \nB: Of course in English, they learn English on Mars too. \nA: Oh, and what do they look like again? You were about to say before I interrupted. \nB: They look like robots, but with a more organic touch, like they're part machine, part living being.", + "cleaned_text": "A: Do you believe in UFOs? \nB: Of course, they are out there. \nA:But I never thought I'd meet someone who actually believes in them so strongly, especially someone who claims to have direct experiences with extraterrestrial beings.\nB: Are you serious? They are called UFOs, so not everybody can see them. \nA: Wait, you mean that you can see them? \nB: That's right. I can see them in my dreams. \nA: They come to the earth? \nB: No. Their task is to send the aliens here from outer space. \nA: Aliens from outer space? Do you talk to them? What do they usually say when you communicate with them? \nB: OK, OK, one by one, please! They look like robots, but they can speak. Their mission is to make friends with human beings. \nA: That means that you talk to them? In which language? \nB: Of course in English, they learn English on Mars too. \nA: Oh, and what do they look like again? You were about to say before I interrupted. \nB: They look like robots, but with a more organic touch, like they're part machine, part living being.", + "total_duration": 57.73233560090703, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you believe in UFOs?", + "original_text": "Do you believe in UFOs?", + "start_time": 0, + "end_time": 1.7531065759637188, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course, they are out there.", + "original_text": "Of course, they are out there.", + "start_time": 2.203679136069602, + "end_time": 3.562046483008378, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_1_B.wav", + "silence_duration": 0.4505725601058834, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But I never", + "original_text": "But I never [interrupt] thought I'd meet someone who actually believes in them so strongly, especially someone who claims to have direct experiences with extraterrestrial beings.", + "start_time": 4.036549115550625, + "end_time": 13.672830294688946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_2_A.wav", + "silence_duration": 0.4745026325422472, + "is_interrupted": true, + "text_after_interrupt": "thought I'd meet someone who actually believes in them so strongly, especially someone who claims to have direct experiences with extraterrestrial beings." + }, + { + "speaker": "B", + "text": "Are you serious? They are called UFOs, so not everybody can see them.", + "original_text": "Are you serious? They are called UFOs, so not everybody can see them.", + "start_time": 5.209156825301192, + "end_time": 9.388748662035887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_3_B.wav", + "silence_duration": 0.596358903400142, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, you mean that you can see them?", + "original_text": "Wait, you mean that you can see them?", + "start_time": 14.209303645029873, + "end_time": 16.124949903533274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_4_A.wav", + "silence_duration": 0.5364733503409271, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's right. I can see them in my dreams.", + "original_text": "That's right. I can see them in my dreams.", + "start_time": 16.48764808431294, + "end_time": 18.879303413111128, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_5_B.wav", + "silence_duration": 0.3626981807796672, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They come to the earth?", + "original_text": "They come to the earth?", + "start_time": 19.449626314474948, + "end_time": 20.738333797468144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_6_A.wav", + "silence_duration": 0.5703229013638198, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. Their task is to send the aliens here from outer space.", + "original_text": "No. Their task is to send the aliens here from outer space.", + "start_time": 21.32510585439605, + "end_time": 24.436579777298544, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_7_B.wav", + "silence_duration": 0.5867720569279069, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Aliens from outer space? Do you talk to them? What do they usually say when you communicate with them?", + "original_text": "Aliens from outer space? Do you talk to them? What do they usually say when you communicate with them?", + "start_time": 24.86359375971502, + "end_time": 31.56255067581479, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_8_A.wav", + "silence_duration": 0.42701398241647626, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK, OK, one by one, please! They look like robots, but they can speak. Their mission is to make friends with human beings.", + "original_text": "OK, OK, one by one, please! They look like robots, but they can speak. Their mission is to make friends with human beings.", + "start_time": 32.13205439922178, + "end_time": 39.36507027223765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_9_B.wav", + "silence_duration": 0.5695037234069893, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That means that you talk to them? In which language?", + "original_text": "That means that you talk to them? In which language?", + "start_time": 39.88411001862221, + "end_time": 43.15812362406439, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_10_A.wav", + "silence_duration": 0.5190397463845566, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course in English, they learn English on Mars too.", + "original_text": "Of course in English, they learn English on Mars too.", + "start_time": 43.75005020806537, + "end_time": 46.49000485659145, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_11_B.wav", + "silence_duration": 0.5919265840009778, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, and what do they look like again? You were about to say before I interrupted.", + "original_text": "Oh, and what do they look like again? You were about to say before I interrupted.", + "start_time": 46.917565041254456, + "end_time": 51.96790517730888, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_12_A.wav", + "silence_duration": 0.42756018466300805, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "They look like robots, but with a more organic touch, like they're part machine, part living being.", + "original_text": "They look like robots, but with a more organic touch, like they're part machine, part living being.", + "start_time": 52.27568538860537, + "end_time": 57.732374731008996, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--4/temp/line_13_B.wav", + "silence_duration": 0.30778021129648747, + "is_interrupted": false + } + ] + }, + "DialogSum--val--5": { + "original_text": "A: Did you go to school today? \nB: Of course. Did you? \nA: I didn't want to, so I didn't. \nB: That's sad, but have you gone to the movies recently? \nA: That's a [interrupt] surprising change in topic that caught me off guard since we were just talking about school attendance and suddenly shifted to entertainment options, but no, I haven't gone to the movies lately. \nB: Sorry to jump in, but I was just thinking, is there a specific movie you're interested in? \nA: I was about to say, that's a switch in topic. But no, I haven't gone to the movies. Why? \nB: I really want to go to the movies this weekend. \nA: So go then. \nB: I really don't want to go by myself. \nA: Well anyway, do you plan on going to school tomorrow? \nB: No, I think I'm going to go to the movies. By the way, what were you going to say earlier about the switch in topic? \nA: Oh, I just meant it was a surprising change in conversation.", + "cleaned_text": "A: Did you go to school today? \nB: Of course. Did you? \nA: I didn't want to, so I didn't. \nB: That's sad, but have you gone to the movies recently? \nA:That's a surprising change in topic that caught me off guard since we were just talking about school attendance and suddenly shifted to entertainment options, but no, I haven't gone to the movies lately.\nB: Sorry to jump in, but I was just thinking, is there a specific movie you're interested in? \nA: I was about to say, that's a switch in topic. But no, I haven't gone to the movies. Why? \nB: I really want to go to the movies this weekend. \nA: So go then. \nB: I really don't want to go by myself. \nA: Well anyway, do you plan on going to school tomorrow? \nB: No, I think I'm going to go to the movies. By the way, what were you going to say earlier about the switch in topic? \nA: Oh, I just meant it was a surprising change in conversation.", + "total_duration": 47.545034013605445, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Did you go to school today?", + "original_text": "Did you go to school today?", + "start_time": 0, + "end_time": 1.6370068027210884, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course. Did you?", + "original_text": "Of course. Did you?", + "start_time": 2.2292836488119736, + "end_time": 3.227741698698595, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_1_B.wav", + "silence_duration": 0.5922768460908849, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I didn't want to, so I didn't.", + "original_text": "I didn't want to, so I didn't.", + "start_time": 3.6850739100783567, + "end_time": 5.844529692391282, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_2_A.wav", + "silence_duration": 0.457332211379762, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's sad, but have you gone to the movies recently?", + "original_text": "That's sad, but have you gone to the movies recently?", + "start_time": 6.256128988382989, + "end_time": 9.228283183394327, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_3_B.wav", + "silence_duration": 0.4115992959917072, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a", + "original_text": "That's a [interrupt] surprising change in topic that caught me off guard since we were just talking about school attendance and suddenly shifted to entertainment options, but no, I haven't gone to the movies lately.", + "start_time": 9.672625261077323, + "end_time": 21.00396312955805, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_4_A.wav", + "silence_duration": 0.44434207768299666, + "is_interrupted": true, + "text_after_interrupt": "surprising change in topic that caught me off guard since we were just talking about school attendance and suddenly shifted to entertainment options, but no, I haven't gone to the movies lately." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but I was just thinking, is there a specific movie you're interested in?", + "original_text": "Sorry to jump in, but I was just thinking, is there a specific movie you're interested in?", + "start_time": 10.46210371912721, + "end_time": 15.582103719127211, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_5_B.wav", + "silence_duration": 0.43768106090074793, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was about to say, that's a switch in topic. But no, I haven't gone to the movies. Why?", + "original_text": "I was about to say, that's a switch in topic. But no, I haven't gone to the movies. Why?", + "start_time": 21.558459545448947, + "end_time": 27.595647754065727, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_6_A.wav", + "silence_duration": 0.5544964158908978, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I really want to go to the movies this weekend.", + "original_text": "I really want to go to the movies this weekend.", + "start_time": 28.07220820524347, + "end_time": 30.3245438061505, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_7_B.wav", + "silence_duration": 0.4765604511777425, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So go then.", + "original_text": "So go then.", + "start_time": 30.70833294480079, + "end_time": 31.683571040038885, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_8_A.wav", + "silence_duration": 0.38378913865028813, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I really don't want to go by myself.", + "original_text": "I really don't want to go by myself.", + "start_time": 32.175561731547965, + "end_time": 33.928668307511685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_9_B.wav", + "silence_duration": 0.49199069150908203, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well anyway, do you plan on going to school tomorrow?", + "original_text": "Well anyway, do you plan on going to school tomorrow?", + "start_time": 34.46731091693954, + "end_time": 37.57878483984203, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_10_A.wav", + "silence_duration": 0.5386426094278569, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, I think I'm going to go to the movies. By the way, what were you going to say earlier about the switch in topic?", + "original_text": "No, I think I'm going to go to the movies. By the way, what were you going to say earlier about the switch in topic?", + "start_time": 38.06266943790832, + "end_time": 43.46130889369063, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_11_B.wav", + "silence_duration": 0.48388459806628886, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I just meant it was a surprising change in conversation.", + "original_text": "Oh, I just meant it was a surprising change in conversation.", + "start_time": 43.8531055557569, + "end_time": 47.54507834487254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--5/temp/line_12_A.wav", + "silence_duration": 0.3917966620662702, + "is_interrupted": false + } + ] + }, + "DialogSum--val--6": { + "original_text": "A: Honey, I think you should quit smoking. \nB: Why? You said I was hot when [interrupt] you saw me with a cigarette back then during our college days, but now I realize that was just youthful ignorance talking. \nA: I know I did, but I want you to be fit. Smoking is killing. \nB: I know. \nA: Check out this article. It says smoking can lead to lung cancer. \nB: I don't believe [interrupt] everything I read online, but I know it's not good for me and I should probably take this more seriously than I have been. \nA: Wait, you don't believe it? But you know that smoking does harm to health, right? \nB: Of course I know it, but you know it's hard to quit [interrupt] when it's been a habit for so long and all my friends at work still smoke during breaks. \nA: I get that it's difficult, but stop beating around the bush. Will you quit or not? \nB: Yes, ma'am. Whatever you say.", + "cleaned_text": "A: Honey, I think you should quit smoking. \nB:Why? You said I was hot when you saw me with a cigarette back then during our college days, but now I realize that was just youthful ignorance talking.\nA: I know I did, but I want you to be fit. Smoking is killing. \nB: I know. \nA: Check out this article. It says smoking can lead to lung cancer. \nB:I don't believe everything I read online, but I know it's not good for me and I should probably take this more seriously than I have been.\nA: Wait, you don't believe it? But you know that smoking does harm to health, right? \nB:Of course I know it, but you know it's hard to quit when it's been a habit for so long and all my friends at work still smoke during breaks.\nA: I get that it's difficult, but stop beating around the bush. Will you quit or not? \nB: Yes, ma'am. Whatever you say.", + "total_duration": 42.962857142857146, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Honey, I think you should quit smoking.", + "original_text": "Honey, I think you should quit smoking.", + "start_time": 0, + "end_time": 2.089795918367347, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why? You said I was hot when", + "original_text": "Why? You said I was hot when [interrupt] you saw me with a cigarette back then during our college days, but now I realize that was just youthful ignorance talking.", + "start_time": 2.632424850846233, + "end_time": 10.283399907535575, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_1_B.wav", + "silence_duration": 0.5426289324788856, + "is_interrupted": true, + "text_after_interrupt": "you saw me with a cigarette back then during our college days, but now I realize that was just youthful ignorance talking." + }, + { + "speaker": "A", + "text": "I know I did, but I want you to be fit. Smoking is killing.", + "original_text": "I know I did, but I want you to be fit. Smoking is killing.", + "start_time": 4.907980406401789, + "end_time": 9.505531426809952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_2_A.wav", + "silence_duration": 0.3486775310493293, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know.", + "original_text": "I know.", + "start_time": 10.74320536120863, + "end_time": 11.358534159394571, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_3_B.wav", + "silence_duration": 0.4598054536730558, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Check out this article. It says smoking can lead to lung cancer.", + "original_text": "Check out this article. It says smoking can lead to lung cancer.", + "start_time": 11.895942669250672, + "end_time": 15.947824755418473, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_4_A.wav", + "silence_duration": 0.5374085098561008, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't believe", + "original_text": "I don't believe [interrupt] everything I read online, but I know it's not good for me and I should probably take this more seriously than I have been.", + "start_time": 16.3134186502229, + "end_time": 22.65246626927052, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_5_B.wav", + "silence_duration": 0.36559389480442744, + "is_interrupted": true, + "text_after_interrupt": "everything I read online, but I know it's not good for me and I should probably take this more seriously than I have been." + }, + { + "speaker": "A", + "text": "Wait, you don't believe it? But you know that smoking does harm to health, right?", + "original_text": "Wait, you don't believe it? But you know that smoking does harm to health, right?", + "start_time": 22.31348185054609, + "end_time": 26.922642848278517, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_6_A.wav", + "silence_duration": 0.4060393894329752, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course I know it, but you know it's hard to quit", + "original_text": "Of course I know it, but you know it's hard to quit [interrupt] when it's been a habit for so long and all my friends at work still smoke during breaks.", + "start_time": 27.35893461463124, + "end_time": 33.756032120300176, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_7_B.wav", + "silence_duration": 0.4362917663527226, + "is_interrupted": true, + "text_after_interrupt": "when it's been a habit for so long and all my friends at work still smoke during breaks." + }, + { + "speaker": "A", + "text": "I get that it's difficult, but stop beating around the bush. Will you quit or not?", + "original_text": "I get that it's difficult, but stop beating around the bush. Will you quit or not?", + "start_time": 35.85408433542971, + "end_time": 40.950864380781184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_8_A.wav", + "silence_duration": 0.5339945118669193, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, ma'am. Whatever you say.", + "original_text": "Yes, ma'am. Whatever you say.", + "start_time": 41.43037476333019, + "end_time": 42.96289177013291, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--6/temp/line_9_B.wav", + "silence_duration": 0.4795103825490111, + "is_interrupted": false + } + ] + }, + "DialogSum--val--7": { + "original_text": "A: Excuse me, Mr. White? I just need you to sign these before I [interrupt] head out for the day because I have an important appointment scheduled right after work and I wouldn't want to be late for it.\nB: Oh, Sherry, before I sign, could you remind me what these documents are for? I want to make sure I haven't missed anything important.\nA: Sure, these are the quarterly budget reports and the new contract for the supplier. I just need you to sign them before I leave.\nB: Ah, right. Sorry to have kept you waiting. If you hadn't told me, I probably would have just forgotten all about [interrupt] the budget reports which contain crucial financial projections for the next quarter that we need to review during tomorrow's management meeting.\nA: No worries, sir. Just one more signature here, please.\nB: Oh, and I was going to ask—what was the other document you mentioned earlier?\nA: That was the new contract for the supplier. Here you are.\nB: There you are.", + "cleaned_text": "A:Excuse me, Mr. White? I just need you to sign these before I head out for the day because I have an important appointment scheduled right after work and I wouldn't want to be late for it.\nB: Oh, Sherry, before I sign, could you remind me what these documents are for? I want to make sure I haven't missed anything important.\nA: Sure, these are the quarterly budget reports and the new contract for the supplier. I just need you to sign them before I leave.\nB:Ah, right. Sorry to have kept you waiting. If you hadn't told me, I probably would have just forgotten all about the budget reports which contain crucial financial projections for the next quarter that we need to review during tomorrow's management meeting.\nA: No worries, sir. Just one more signature here, please.\nB: Oh, and I was going to ask—what was the other document you mentioned earlier?\nA: That was the new contract for the supplier. Here you are.\nB: There you are.", + "total_duration": 46.94943310657597, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, Mr. White? I just need you to sign these before I", + "original_text": "Excuse me, Mr. White? I just need you to sign these before I [interrupt] head out for the day because I have an important appointment scheduled right after work and I wouldn't want to be late for it.", + "start_time": 0, + "end_time": 11.517097505668934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "head out for the day because I have an important appointment scheduled right after work and I wouldn't want to be late for it." + }, + { + "speaker": "B", + "text": "Oh, Sherry, before I sign, could you remind me what these documents are for? I want to make sure I haven't missed anything important.", + "original_text": "Oh, Sherry, before I sign, could you remind me what these documents are for? I want to make sure I haven't missed anything important.", + "start_time": 4.3769614512471655, + "end_time": 12.016326530612245, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_1_B.wav", + "silence_duration": 0.42461497903952056, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, these are the quarterly budget reports and the new contract for the supplier. I just need you to sign them before I leave.", + "original_text": "Sure, these are the quarterly budget reports and the new contract for the supplier. I just need you to sign them before I leave.", + "start_time": 12.449433430395997, + "end_time": 19.93786880454566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_2_A.wav", + "silence_duration": 0.4331068997837513, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ah, right. Sorry to have kept you waiting. If you hadn't told me, I probably would have just forgotten all about", + "original_text": "Ah, right. Sorry to have kept you waiting. If you hadn't told me, I probably would have just forgotten all about [interrupt] the budget reports which contain crucial financial projections for the next quarter that we need to review during tomorrow's management meeting.", + "start_time": 20.515013023001263, + "end_time": 32.76353910009877, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_3_B.wav", + "silence_duration": 0.5771442184556035, + "is_interrupted": true, + "text_after_interrupt": "the budget reports which contain crucial financial projections for the next quarter that we need to review during tomorrow's management meeting." + }, + { + "speaker": "A", + "text": "No worries, sir. Just one more signature here, please.", + "original_text": "No worries, sir. Just one more signature here, please.", + "start_time": 33.50992265306281, + "end_time": 37.08579566893582, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_4_A.wav", + "silence_duration": 0.4109191636243259, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, and I was going to ask—what was the other document you mentioned earlier?", + "original_text": "Oh, and I was going to ask—what was the other document you mentioned earlier?", + "start_time": 37.47716511603185, + "end_time": 41.354897542335706, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_5_B.wav", + "silence_duration": 0.3913694470960254, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That was the new contract for the supplier. Here you are.", + "original_text": "That was the new contract for the supplier. Here you are.", + "start_time": 41.66576942642134, + "end_time": 45.62477169399504, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_6_A.wav", + "silence_duration": 0.31087188408563404, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There you are.", + "original_text": "There you are.", + "start_time": 46.15997118886736, + "end_time": 46.949449646917245, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--7/temp/line_7_B.wav", + "silence_duration": 0.53519949487232, + "is_interrupted": false + } + ] + }, + "DialogSum--val--8": { + "original_text": "A: Hey, Karen. Looks like you got some sun this weekend.\nB: Yeah? I guess so. I spent the weekend at the beach.\nA: That's great. Where did you stay?\nB: Some friends of my parents live out there, and they invited [interrupt] me to stay with them for the weekend. It was really nice to catch up with them and enjoy the beautiful ocean views from their beachfront property.\nA: Oh, that sounds nice! By the way, what part of the beach were you at? I've been thinking of visiting a quieter spot.\nB: It was a small, private stretch near the south end. But I was saying, they invited me over, and it was really relaxing. So, what did you do this weekend?\nA: I wish I could say I did something as fun as you did. I spent most of it in the library, working on that research project. It's been taking up all my free time lately.\nB: Oh, I figured. You must be exhausted. But before we get into that, you mentioned you jogged on the beach. How was that? I've heard running on sand can be tough.\nA: It was harder than I expected! I couldn't get through a whole game of volleyball before I had to sit down. The sand just drains your energy.\nB: I can imagine. Did you get to swim at all, or was it just too cold?\nA: I wanted to, but the water was freezing. I only managed to get in up to my knees. But anyway, how's that research project going?", + "cleaned_text": "A: Hey, Karen. Looks like you got some sun this weekend.\nB: Yeah? I guess so. I spent the weekend at the beach.\nA: That's great. Where did you stay?\nB:Some friends of my parents live out there, and they invited me to stay with them for the weekend. It was really nice to catch up with them and enjoy the beautiful ocean views from their beachfront property.\nA: Oh, that sounds nice! By the way, what part of the beach were you at? I've been thinking of visiting a quieter spot.\nB: It was a small, private stretch near the south end. But I was saying, they invited me over, and it was really relaxing. So, what did you do this weekend?\nA: I wish I could say I did something as fun as you did. I spent most of it in the library, working on that research project. It's been taking up all my free time lately.\nB: Oh, I figured. You must be exhausted. But before we get into that, you mentioned you jogged on the beach. How was that? I've heard running on sand can be tough.\nA: It was harder than I expected! I couldn't get through a whole game of volleyball before I had to sit down. The sand just drains your energy.\nB: I can imagine. Did you get to swim at all, or was it just too cold?\nA: I wanted to, but the water was freezing. I only managed to get in up to my knees. But anyway, how's that research project going?", + "total_duration": 69.95877551020408, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hey, Karen. Looks like you got some sun this weekend.", + "original_text": "Hey, Karen. Looks like you got some sun this weekend.", + "start_time": 0, + "end_time": 3.889342403628118, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah? I guess so. I spent the weekend at the beach.", + "original_text": "Yeah? I guess so. I spent the weekend at the beach.", + "start_time": 4.31909158868209, + "end_time": 7.6743750353941085, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_1_B.wav", + "silence_duration": 0.429749185053972, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's great. Where did you stay?", + "original_text": "That's great. Where did you stay?", + "start_time": 7.982222025873834, + "end_time": 10.339047422699231, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_2_A.wav", + "silence_duration": 0.3078469904797252, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Some friends of my parents live out there, and they invited", + "original_text": "Some friends of my parents live out there, and they invited [interrupt] me to stay with them for the weekend. It was really nice to catch up with them and enjoy the beautiful ocean views from their beachfront property.", + "start_time": 10.938909522094843, + "end_time": 20.44748095066627, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_3_B.wav", + "silence_duration": 0.5998620993956125, + "is_interrupted": true, + "text_after_interrupt": "me to stay with them for the weekend. It was really nice to catch up with them and enjoy the beautiful ocean views from their beachfront property." + }, + { + "speaker": "A", + "text": "Oh, that sounds nice! By the way, what part of the beach were you at? I've been thinking of visiting a quieter spot.", + "original_text": "Oh, that sounds nice! By the way, what part of the beach were you at? I've been thinking of visiting a quieter spot.", + "start_time": 13.388614737514343, + "end_time": 20.48231088263906, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_4_A.wav", + "silence_duration": 0.4805509510300182, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It was a small, private stretch near the south end. But I was saying, they invited me over, and it was really relaxing. So, what did you do this weekend?", + "original_text": "It was a small, private stretch near the south end. But I was saying, they invited me over, and it was really relaxing. So, what did you do this weekend?", + "start_time": 21.04041967601453, + "end_time": 29.95688226104854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_5_B.wav", + "silence_duration": 0.558108793375472, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I wish I could say I did something as fun as you did. I spent most of it in the library, working on that research project. It's been taking up all my free time lately.", + "original_text": "I wish I could say I did something as fun as you did. I spent most of it in the library, working on that research project. It's been taking up all my free time lately.", + "start_time": 30.46751821900009, + "end_time": 40.661078309703036, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_6_A.wav", + "silence_duration": 0.5106359579515491, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I figured. You must be exhausted. But before we get into that, you mentioned you jogged on the beach. How was that? I've heard running on sand can be tough.", + "original_text": "Oh, I figured. You must be exhausted. But before we get into that, you mentioned you jogged on the beach. How was that? I've heard running on sand can be tough.", + "start_time": 41.032324942747216, + "end_time": 49.44955850283792, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_7_B.wav", + "silence_duration": 0.37124663304418254, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It was harder than I expected! I couldn't get through a whole game of volleyball before I had to sit down. The sand just drains your energy.", + "original_text": "It was harder than I expected! I couldn't get through a whole game of volleyball before I had to sit down. The sand just drains your energy.", + "start_time": 49.79276206739257, + "end_time": 57.44373712408191, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_8_A.wav", + "silence_duration": 0.343203564554654, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I can imagine. Did you get to swim at all, or was it just too cold?", + "original_text": "I can imagine. Did you get to swim at all, or was it just too cold?", + "start_time": 57.801609318961425, + "end_time": 61.2962124935646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_9_B.wav", + "silence_duration": 0.35787219487951205, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I wanted to, but the water was freezing. I only managed to get in up to my knees. But anyway, how's that research project going?", + "original_text": "I wanted to, but the water was freezing. I only managed to get in up to my knees. But anyway, how's that research project going?", + "start_time": 61.72732217659133, + "end_time": 69.95879609949382, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--8/temp/line_10_A.wav", + "silence_duration": 0.4311096830267227, + "is_interrupted": false + } + ] + }, + "DialogSum--val--9": { + "original_text": "A: How do you usually spend your leisure time? I mean, do you have any special interests out of your job? \nB: Of course. You see, almost everyone has some kind of hobby—[interrupt] I was just about to mention that I find it really important to have something to unwind with after a long day, especially activities that engage both creativity and technical skills like photography or painting. \nA: Yeah, you're quite right. What's your hobby? \nB: I like taking photos outdoors. \nA: Oh, photography, it's really a good hobby. \nB: Yes, I usually develop and print all my own photos. \nA: Wait, you yourself have a photo studio? \nB: Yes, simple as it is. It does work. By the way, I didn't finish earlier—I was going to say that photography helps me relax after work.", + "cleaned_text": "A: How do you usually spend your leisure time? I mean, do you have any special interests out of your job? \nB:Of course. You see, almost everyone has some kind of hobby— I was just about to mention that I find it really important to have something to unwind with after a long day, especially activities that engage both creativity and technical skills like photography or painting.\nA: Yeah, you're quite right. What's your hobby? \nB: I like taking photos outdoors. \nA: Oh, photography, it's really a good hobby. \nB: Yes, I usually develop and print all my own photos. \nA: Wait, you yourself have a photo studio? \nB: Yes, simple as it is. It does work. By the way, I didn't finish earlier—I was going to say that photography helps me relax after work.", + "total_duration": 40.46843537414966, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How do you usually spend your leisure time? I mean, do you have any special interests out of your job?", + "original_text": "How do you usually spend your leisure time? I mean, do you have any special interests out of your job?", + "start_time": 0, + "end_time": 6.095238095238095, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course. You see, almost everyone has some kind of hobby—", + "original_text": "Of course. You see, almost everyone has some kind of hobby—[interrupt] I was just about to mention that I find it really important to have something to unwind with after a long day, especially activities that engage both creativity and technical skills like photography or painting.", + "start_time": 6.639186292898684, + "end_time": 20.408619399474645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_1_B.wav", + "silence_duration": 0.5439481976605884, + "is_interrupted": true, + "text_after_interrupt": "I was just about to mention that I find it really important to have something to unwind with after a long day, especially activities that engage both creativity and technical skills like photography or painting." + }, + { + "speaker": "A", + "text": "Yeah, you're quite right. What's your hobby?", + "original_text": "Yeah, you're quite right. What's your hobby?", + "start_time": 9.669390374531336, + "end_time": 13.198823481107299, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_2_A.wav", + "silence_duration": 0.3411023650911967, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like taking photos outdoors.", + "original_text": "I like taking photos outdoors.", + "start_time": 20.742765306211616, + "end_time": 22.51909183682386, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_3_B.wav", + "silence_duration": 0.3341459067369706, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, photography, it's really a good hobby.", + "original_text": "Oh, photography, it's really a good hobby.", + "start_time": 23.00591633828858, + "end_time": 26.175440147812388, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_4_A.wav", + "silence_duration": 0.4868245014647187, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I usually develop and print all my own photos.", + "original_text": "Yes, I usually develop and print all my own photos.", + "start_time": 26.718279929703186, + "end_time": 29.376964736959422, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_5_B.wav", + "silence_duration": 0.5428397818907986, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, you yourself have a photo studio?", + "original_text": "Wait, you yourself have a photo studio?", + "start_time": 29.741547601183722, + "end_time": 32.853021524086216, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_6_A.wav", + "silence_duration": 0.36458286422430064, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, simple as it is. It does work. By the way, I didn't finish earlier—I was going to say that photography helps me relax after work.", + "original_text": "Yes, simple as it is. It does work. By the way, I didn't finish earlier—I was going to say that photography helps me relax after work.", + "start_time": 33.25866400946957, + "end_time": 40.46845992783692, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--9/temp/line_7_B.wav", + "silence_duration": 0.40564248538335496, + "is_interrupted": false + } + ] + }, + "DialogSum--val--10": { + "original_text": "A: Have you ever seen Bill Gate's home on the internet? \nB: No. What's it like? \nA: It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through [interrupt] voice commands or even with just a touch on a tablet, making the entire living experience incredibly seamless and futuristic while still maintaining comfort and luxury. \nB: Wow, that sounds incredible! But do you think you'd want to live in a place like that? \nA: I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens. \nB: What's your dream home like then? \nA: My dream home is actually just a small cottage in a quiet village in England. \nB: Would you want to buy an old cottage or build a new one yourself? \nA: Old homes are great because they've got character. I think that's [interrupt] what makes them so unique and charming, something you can't easily replicate with new constructions, especially when you consider the craftsmanship and history embedded in every wooden beam and stone wall. \nB: Is that why you wear second-hand clothes as well? Because they've got character? \nA: No, that's just because I don't have enough money to buy new clothes all the time! But coming back to the cottage, I think having that character in a home is really important. \nB: I see. If you lived in an old house, would it be decorated in a modern way?", + "cleaned_text": "A: Have you ever seen Bill Gate's home on the internet? \nB: No. What's it like? \nA:It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through voice commands or even with just a touch on a tablet, making the entire living experience incredibly seamless and futuristic while still maintaining comfort and luxury.\nB: Wow, that sounds incredible! But do you think you'd want to live in a place like that? \nA: I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens. \nB: What's your dream home like then? \nA: My dream home is actually just a small cottage in a quiet village in England. \nB: Would you want to buy an old cottage or build a new one yourself? \nA:Old homes are great because they've got character. I think that's what makes them so unique and charming, something you can't easily replicate with new constructions, especially when you consider the craftsmanship and history embedded in every wooden beam and stone wall.\nB: Is that why you wear second-hand clothes as well? Because they've got character? \nA: No, that's just because I don't have enough money to buy new clothes all the time! But coming back to the cottage, I think having that character in a home is really important. \nB: I see. If you lived in an old house, would it be decorated in a modern way?", + "total_duration": 79.43936507936507, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you ever seen Bill Gate's home on the internet?", + "original_text": "Have you ever seen Bill Gate's home on the internet?", + "start_time": 0, + "end_time": 2.809614512471655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. What's it like?", + "original_text": "No. What's it like?", + "start_time": 3.2146791024701926, + "end_time": 4.491776608139126, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_1_B.wav", + "silence_duration": 0.40506458999853767, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through", + "original_text": "It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through [interrupt] voice commands or even with just a touch on a tablet, making the entire living experience incredibly seamless and futuristic while still maintaining comfort and luxury.", + "start_time": 5.041184950539758, + "end_time": 26.60091284169622, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_2_A.wav", + "silence_duration": 0.5494083424006321, + "is_interrupted": true, + "text_after_interrupt": "voice commands or even with just a touch on a tablet, making the entire living experience incredibly seamless and futuristic while still maintaining comfort and luxury." + }, + { + "speaker": "B", + "text": "Wow, that sounds incredible! But do you think you'd want to live in a place like that?", + "original_text": "Wow, that sounds incredible! But do you think you'd want to live in a place like that?", + "start_time": 16.256423045777854, + "end_time": 20.389574973215495, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_3_B.wav", + "silence_duration": 0.3744753063358698, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens.", + "original_text": "I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens.", + "start_time": 26.90628577307292, + "end_time": 37.65712477534049, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_4_A.wav", + "silence_duration": 0.3053729313766975, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What's your dream home like then?", + "original_text": "What's your dream home like then?", + "start_time": 38.03056407144901, + "end_time": 39.56308107825173, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_5_B.wav", + "silence_duration": 0.3734392961085127, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "My dream home is actually just a small cottage in a quiet village in England.", + "original_text": "My dream home is actually just a small cottage in a quiet village in England.", + "start_time": 40.067894844092905, + "end_time": 44.665445864501066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_6_A.wav", + "silence_duration": 0.5048137658411795, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Would you want to buy an old cottage or build a new one yourself?", + "original_text": "Would you want to buy an old cottage or build a new one yourself?", + "start_time": 45.08825444937098, + "end_time": 48.06040864438231, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_7_B.wav", + "silence_duration": 0.4228085848699137, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Old homes are great because they've got character. I think that's", + "original_text": "Old homes are great because they've got character. I think that's [interrupt] what makes them so unique and charming, something you can't easily replicate with new constructions, especially when you consider the craftsmanship and history embedded in every wooden beam and stone wall.", + "start_time": 48.51556320328967, + "end_time": 63.49243395158899, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_8_A.wav", + "silence_duration": 0.4551545589073632, + "is_interrupted": true, + "text_after_interrupt": "what makes them so unique and charming, something you can't easily replicate with new constructions, especially when you consider the craftsmanship and history embedded in every wooden beam and stone wall." + }, + { + "speaker": "B", + "text": "Is that why you wear second-hand clothes as well? Because they've got character?", + "original_text": "Is that why you wear second-hand clothes as well? Because they've got character?", + "start_time": 57.567164672752575, + "end_time": 61.09659777932854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_9_B.wav", + "silence_duration": 0.41920039163703743, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, that's just because I don't have enough money to buy new clothes all the time! But coming back to the cottage, I think having that character in a home is really important.", + "original_text": "No, that's just because I don't have enough money to buy new clothes all the time! But coming back to the cottage, I think having that character in a home is really important.", + "start_time": 63.83613852994532, + "end_time": 74.2735081444578, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_10_A.wav", + "silence_duration": 0.3437045783563309, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see. If you lived in an old house, would it be decorated in a modern way?", + "original_text": "I see. If you lived in an old house, would it be decorated in a modern way?", + "start_time": 74.8418252895612, + "end_time": 79.43937630996936, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--10/temp/line_11_B.wav", + "silence_duration": 0.5683171451034054, + "is_interrupted": false + } + ] + }, + "DialogSum--val--11": { + "original_text": "A: I am tired of everything in my life.\nB: What? How happy your life is! I do envy you.\nA: You don't know that I have been over-protected by my mother these years. I am really about to [interrupt] break free and start living on my own terms, exploring new opportunities and discovering who I truly am without constant supervision and restrictions.\nB: Over-protected? That must be suffocating. Have you tried talking to her about how you feel?\nA: I have, but it's complicated. I was saying I'm really about to leave the family and spread my wings.\nB: That sounds like a big step. Do you have a plan in place for when you do?", + "cleaned_text": "A: I am tired of everything in my life.\nB: What? How happy your life is! I do envy you.\nA:You don't know that I have been over-protected by my mother these years. I am really about to break free and start living on my own terms, exploring new opportunities and discovering who I truly am without constant supervision and restrictions.\nB: Over-protected? That must be suffocating. Have you tried talking to her about how you feel?\nA: I have, but it's complicated. I was saying I'm really about to leave the family and spread my wings.\nB: That sounds like a big step. Do you have a plan in place for when you do?", + "total_duration": 31.935374149659864, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I am tired of everything in my life.", + "original_text": "I am tired of everything in my life.", + "start_time": 0, + "end_time": 2.1942857142857144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What? How happy your life is! I do envy you.", + "original_text": "What? How happy your life is! I do envy you.", + "start_time": 2.648139978218495, + "end_time": 5.887323651687883, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/temp/line_1_B.wav", + "silence_duration": 0.4538542639327806, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You don't know that I have been over-protected by my mother these years. I am really about to", + "original_text": "You don't know that I have been over-protected by my mother these years. I am really about to [interrupt] break free and start living on my own terms, exploring new opportunities and discovering who I truly am without constant supervision and restrictions.", + "start_time": 6.391880837570216, + "end_time": 21.34553163122101, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/temp/line_2_A.wav", + "silence_duration": 0.5045571858823332, + "is_interrupted": true, + "text_after_interrupt": "break free and start living on my own terms, exploring new opportunities and discovering who I truly am without constant supervision and restrictions." + }, + { + "speaker": "B", + "text": "Over-protected? That must be suffocating. Have you tried talking to her about how you feel?", + "original_text": "Over-protected? That must be suffocating. Have you tried talking to her about how you feel?", + "start_time": 11.767300338704004, + "end_time": 16.155871767275432, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/temp/line_3_B.wav", + "silence_duration": 0.4422234577527386, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I have, but it's complicated. I was saying I'm really about to leave the family and spread my wings.", + "original_text": "I have, but it's complicated. I was saying I'm really about to leave the family and spread my wings.", + "start_time": 21.753055603542528, + "end_time": 28.184983041184253, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/temp/line_4_A.wav", + "silence_duration": 0.4075239723215157, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds like a big step. Do you have a plan in place for when you do?", + "original_text": "That sounds like a big step. Do you have a plan in place for when you do?", + "start_time": 28.49883031218662, + "end_time": 31.93538360016848, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--11/temp/line_5_B.wav", + "silence_duration": 0.31384727100236465, + "is_interrupted": false + } + ] + }, + "DialogSum--val--13": { + "original_text": "A: Hi, Mr. Zhang. What's wrong? You don't look so happy. How was your [interrupt] weekend? I noticed you seemed quite preoccupied during our last meeting as well, so I'm wondering if there's something specific that's been bothering you lately.\nB: I was turned down again. It's frustrating. I guess you've got to teach me some skills. \nA: Me? I'm even less experienced than you are. \nB: At least you know what American women generally like in a man. \nA: Believe it or not, I guess American women like a man in good shape, which Chinese women may not care about so much. That's my honest opinion. I know you have been trying very [interrupt] hard to adapt to the culture here, and I genuinely admire your persistence despite all the challenges you've faced so far in your dating life.\nB: But American men are naturally taller than Chinese men. So even if I exercise, there aren't many chances. \nA: No, that's not true. I've met two American women who were married to Chinese. But those Chinese look very strong and healthy. So if you exercise more often, I bet it will surely be easier for you to date American girls. How old is Jacky Chan? He's small and short. But I bet he can have any American woman he wants. \nB: You know, that's going to be a tremendous change for me. Because I never exercise. By the way, what were you saying about what American women like? You mentioned something about being in good shape? \nA: Oh right, I was saying that American women generally appreciate a man who's in good shape. It's something that tends to stand out more here.", + "cleaned_text": "A:Hi, Mr. Zhang. What's wrong? You don't look so happy. How was your weekend? I noticed you seemed quite preoccupied during our last meeting as well, so I'm wondering if there's something specific that's been bothering you lately.\nB: I was turned down again. It's frustrating. I guess you've got to teach me some skills. \nA: Me? I'm even less experienced than you are. \nB: At least you know what American women generally like in a man. \nA:Believe it or not, I guess American women like a man in good shape, which Chinese women may not care about so much. That's my honest opinion. I know you have been trying very hard to adapt to the culture here, and I genuinely admire your persistence despite all the challenges you've faced so far in your dating life.\nB: But American men are naturally taller than Chinese men. So even if I exercise, there aren't many chances. \nA: No, that's not true. I've met two American women who were married to Chinese. But those Chinese look very strong and healthy. So if you exercise more often, I bet it will surely be easier for you to date American girls. How old is Jacky Chan? He's small and short. But I bet he can have any American woman he wants. \nB: You know, that's going to be a tremendous change for me. Because I never exercise. By the way, what were you saying about what American women like? You mentioned something about being in good shape? \nA: Oh right, I was saying that American women generally appreciate a man who's in good shape. It's something that tends to stand out more here.", + "total_duration": 81.75904761904762, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, Mr. Zhang. What's wrong? You don't look so happy. How was your", + "original_text": "Hi, Mr. Zhang. What's wrong? You don't look so happy. How was your [interrupt] weekend? I noticed you seemed quite preoccupied during our last meeting as well, so I'm wondering if there's something specific that's been bothering you lately.", + "start_time": 0, + "end_time": 14.512471655328799, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "weekend? I noticed you seemed quite preoccupied during our last meeting as well, so I'm wondering if there's something specific that's been bothering you lately." + }, + { + "speaker": "B", + "text": "I was turned down again. It's frustrating. I guess you've got to teach me some skills.", + "original_text": "I was turned down again. It's frustrating. I guess you've got to teach me some skills.", + "start_time": 4.133151927437642, + "end_time": 8.185034013605442, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_1_B.wav", + "silence_duration": 0.5416877667323909, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Me? I'm even less experienced than you are.", + "original_text": "Me? I'm even less experienced than you are.", + "start_time": 14.983847147934853, + "end_time": 18.362350549295396, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_2_A.wav", + "silence_duration": 0.47137549260605394, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "At least you know what American women generally like in a man.", + "original_text": "At least you know what American women generally like in a man.", + "start_time": 18.882435234175723, + "end_time": 21.692049746647378, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_3_B.wav", + "silence_duration": 0.5200846848803284, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Believe it or not, I guess American women like a man in good shape, which Chinese women may not care about so much. That's my honest opinion. I know you have been trying very", + "original_text": "Believe it or not, I guess American women like a man in good shape, which Chinese women may not care about so much. That's my honest opinion. I know you have been trying very [interrupt] hard to adapt to the culture here, and I genuinely admire your persistence despite all the challenges you've faced so far in your dating life.", + "start_time": 22.11877355786984, + "end_time": 40.71795723133923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_4_A.wav", + "silence_duration": 0.4267238112224636, + "is_interrupted": true, + "text_after_interrupt": "hard to adapt to the culture here, and I genuinely admire your persistence despite all the challenges you've faced so far in your dating life." + }, + { + "speaker": "B", + "text": "But American men are naturally taller than Chinese men. So even if I exercise, there aren't many chances.", + "original_text": "But American men are naturally taller than Chinese men. So even if I exercise, there aren't many chances.", + "start_time": 37.32442186139299, + "end_time": 43.05975065957893, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_5_B.wav", + "silence_duration": 0.4278608986117689, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, that's not true. I've met two American women who were married to Chinese. But those Chinese look very strong and healthy. So if you exercise more often, I bet it will surely be easier for you to date American girls. How old is Jacky Chan? He's small and short. But I bet he can have any American woman he wants.", + "original_text": "No, that's not true. I've met two American women who were married to Chinese. But those Chinese look very strong and healthy. So if you exercise more often, I bet it will surely be easier for you to date American girls. How old is Jacky Chan? He's small and short. But I bet he can have any American woman he wants.", + "start_time": 43.587618329921966, + "end_time": 63.82380880611244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_6_A.wav", + "silence_duration": 0.5278676703430365, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You know, that's going to be a tremendous change for me. Because I never exercise. By the way, what were you saying about what American women like? You mentioned something about being in good shape?", + "original_text": "You know, that's going to be a tremendous change for me. Because I never exercise. By the way, what were you saying about what American women like? You mentioned something about being in good shape?", + "start_time": 64.26756339092121, + "end_time": 73.54393527300738, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_7_B.wav", + "silence_duration": 0.44375458480877, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh right, I was saying that American women generally appreciate a man who's in good shape. It's something that tends to stand out more here.", + "original_text": "Oh right, I was saying that American women generally appreciate a man who's in good shape. It's something that tends to stand out more here.", + "start_time": 74.10809683772213, + "end_time": 81.75907189441148, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--13/temp/line_8_A.wav", + "silence_duration": 0.564161564714745, + "is_interrupted": false + } + ] + }, + "DialogSum--val--14": { + "original_text": "A: What sports do you think women excel at most? \nB: I think women excel in every sport except the ones that are taboo for us to join in, like football. \nA: I mean which ones are they better at than [interrupt] men, like gymnastics or figure skating, where they often outperform due to different strengths and techniques that emphasize flexibility, grace, and artistic expression? \nB: Why do you care? Women and men are different all around. I don't think they can be compared. \nA: That's a good point. Let me change my question. What sports do women like best? \nB: Well, I know some women who love golf and I know others who love contact sports. \nA: Wait, earlier you mentioned that some sports are taboo for women, like football. Do you think that's changing? \nB: It is changing, but slowly. Still, there are societal norms that make it hard for women to fully participate in some sports. But back to your earlier question [interrupt] about which sports women like best, I think it really depends on the individual's personality, upbringing, and cultural background, which all play significant roles in shaping their preferences. \nA: Oh right, you were saying something about women and contact sports. Are those becoming more popular among women now? \nB: Yes, definitely. More women are getting into sports like rugby and boxing, breaking those old taboos.", + "cleaned_text": "A: What sports do you think women excel at most? \nB: I think women excel in every sport except the ones that are taboo for us to join in, like football. \nA:I mean which ones are they better at than men, like gymnastics or figure skating, where they often outperform due to different strengths and techniques that emphasize flexibility, grace, and artistic expression?\nB: Why do you care? Women and men are different all around. I don't think they can be compared. \nA: That's a good point. Let me change my question. What sports do women like best? \nB: Well, I know some women who love golf and I know others who love contact sports. \nA: Wait, earlier you mentioned that some sports are taboo for women, like football. Do you think that's changing? \nB:It is changing, but slowly. Still, there are societal norms that make it hard for women to fully participate in some sports. But back to your earlier question about which sports women like best, I think it really depends on the individual's personality, upbringing, and cultural background, which all play significant roles in shaping their preferences.\nA: Oh right, you were saying something about women and contact sports. Are those becoming more popular among women now? \nB: Yes, definitely. More women are getting into sports like rugby and boxing, breaking those old taboos.", + "total_duration": 65.83832199546485, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What sports do you think women excel at most?", + "original_text": "What sports do you think women excel at most?", + "start_time": 0, + "end_time": 2.716734693877551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think women excel in every sport except the ones that are taboo for us to join in, like football.", + "original_text": "I think women excel in every sport except the ones that are taboo for us to join in, like football.", + "start_time": 3.2823644355278003, + "end_time": 8.739053777931428, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_1_B.wav", + "silence_duration": 0.565629741650249, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I mean which ones are they better at than", + "original_text": "I mean which ones are they better at than [interrupt] men, like gymnastics or figure skating, where they often outperform due to different strengths and techniques that emphasize flexibility, grace, and artistic expression?", + "start_time": 9.157304309752531, + "end_time": 21.56837006938972, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_2_A.wav", + "silence_duration": 0.4182505318211037, + "is_interrupted": true, + "text_after_interrupt": "men, like gymnastics or figure skating, where they often outperform due to different strengths and techniques that emphasize flexibility, grace, and artistic expression?" + }, + { + "speaker": "B", + "text": "Why do you care? Women and men are different all around. I don't think they can be compared.", + "original_text": "Why do you care? Women and men are different all around. I don't think they can be compared.", + "start_time": 11.525739683902192, + "end_time": 15.995580953743461, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_3_B.wav", + "silence_duration": 0.5986730768728534, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a good point. Let me change my question. What sports do women like best?", + "original_text": "That's a good point. Let me change my question. What sports do women like best?", + "start_time": 22.139404272274557, + "end_time": 26.713735338034194, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_4_A.wav", + "silence_duration": 0.571034202884839, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I know some women who love golf and I know others who love contact sports.", + "original_text": "Well, I know some women who love golf and I know others who love contact sports.", + "start_time": 27.117020520764488, + "end_time": 31.226952493553604, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_5_B.wav", + "silence_duration": 0.40328518273029434, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, earlier you mentioned that some sports are taboo for women, like football. Do you think that's changing?", + "original_text": "Wait, earlier you mentioned that some sports are taboo for women, like football. Do you think that's changing?", + "start_time": 31.626115014996873, + "end_time": 37.7445730648835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_6_A.wav", + "silence_duration": 0.3991625214432697, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It is changing, but slowly. Still, there are societal norms that make it hard for women to fully participate in some sports. But back to your earlier question", + "original_text": "It is changing, but slowly. Still, there are societal norms that make it hard for women to fully participate in some sports. But back to your earlier question [interrupt] about which sports women like best, I think it really depends on the individual's personality, upbringing, and cultural background, which all play significant roles in shaping their preferences.", + "start_time": 38.295461360345584, + "end_time": 57.42870399073107, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_7_B.wav", + "silence_duration": 0.5508882954620888, + "is_interrupted": true, + "text_after_interrupt": "about which sports women like best, I think it really depends on the individual's personality, upbringing, and cultural background, which all play significant roles in shaping their preferences." + }, + { + "speaker": "A", + "text": "Oh right, you were saying something about women and contact sports. Are those becoming more popular among women now?", + "original_text": "Oh right, you were saying something about women and contact sports. Are those becoming more popular among women now?", + "start_time": 52.918902059561205, + "end_time": 59.39726940649998, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_8_A.wav", + "silence_duration": 0.31582281210643004, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, definitely. More women are getting into sports like rugby and boxing, breaking those old taboos.", + "original_text": "Yes, definitely. More women are getting into sports like rugby and boxing, breaking those old taboos.", + "start_time": 59.98691974057973, + "end_time": 65.8383483120083, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--14/temp/line_9_B.wav", + "silence_duration": 0.5896503340797503, + "is_interrupted": false + } + ] + }, + "DialogSum--val--15": { + "original_text": "A: Is there a city where it's always warm?\nB: Yes, there are many cities where it's almost always warm. San Diego, for [interrupt] example, has a very mild climate year-round with temperatures rarely dropping below 60 degrees Fahrenheit even in winter months.\nA: Oh, San Diego sounds nice! But are there any other cities where it's always hot?\nB: Many. Most of the cities in the southern part of the United States are hot all year.\nA: But why do so many people live there?\nB: Most people grow accustomed to the climate, but there are many others who complain about [interrupt] the high humidity and extreme temperatures during the summer months when heat indexes can reach dangerous levels above 100 degrees Fahrenheit.\nA: Complain? That's interesting. So, are there any cities where it rains a lot?\nB: Several. Two good examples are Seattle, in the state of Washington, and Portland, Oregon.\nA: Tell us about some cold cities.\nB: In the north there are many cities which are very cold in the winter. Boston and Chicago are two of them.\nA: Is it always cold in Chicago and Boston?\nB: Oh, no. On the contrary, there are many beautiful days, especially in the spring and fall. Also, about what I was saying earlier, people often complain about the heat, but they stay because of job opportunities or family ties.", + "cleaned_text": "A: Is there a city where it's always warm?\nB:Yes, there are many cities where it's almost always warm. San Diego, for example, has a very mild climate year-round with temperatures rarely dropping below 60 degrees Fahrenheit even in winter months.\nA: Oh, San Diego sounds nice! But are there any other cities where it's always hot?\nB: Many. Most of the cities in the southern part of the United States are hot all year.\nA: But why do so many people live there?\nB:Most people grow accustomed to the climate, but there are many others who complain about the high humidity and extreme temperatures during the summer months when heat indexes can reach dangerous levels above 100 degrees Fahrenheit.\nA: Complain? That's interesting. So, are there any cities where it rains a lot?\nB: Several. Two good examples are Seattle, in the state of Washington, and Portland, Oregon.\nA: Tell us about some cold cities.\nB: In the north there are many cities which are very cold in the winter. Boston and Chicago are two of them.\nA: Is it always cold in Chicago and Boston?\nB: Oh, no. On the contrary, there are many beautiful days, especially in the spring and fall. Also, about what I was saying earlier, people often complain about the heat, but they stay because of job opportunities or family ties.", + "total_duration": 62.42371882086168, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is there a city where it's always warm?", + "original_text": "Is there a city where it's always warm?", + "start_time": 0, + "end_time": 2.078185941043084, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, there are many cities where it's almost always warm. San Diego, for", + "original_text": "Yes, there are many cities where it's almost always warm. San Diego, for [interrupt] example, has a very mild climate year-round with temperatures rarely dropping below 60 degrees Fahrenheit even in winter months.", + "start_time": 2.4666033916868684, + "end_time": 12.218984344067822, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_1_B.wav", + "silence_duration": 0.38841745064378463, + "is_interrupted": true, + "text_after_interrupt": "example, has a very mild climate year-round with temperatures rarely dropping below 60 degrees Fahrenheit even in winter months." + }, + { + "speaker": "A", + "text": "Oh, San Diego sounds nice! But are there any other cities where it's always hot?", + "original_text": "Oh, San Diego sounds nice! But are there any other cities where it's always hot?", + "start_time": 5.98442652093857, + "end_time": 10.756127201210678, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_2_A.wav", + "silence_duration": 0.4387051703712739, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Many. Most of the cities in the southern part of the United States are hot all year.", + "original_text": "Many. Most of the cities in the southern part of the United States are hot all year.", + "start_time": 12.758504651374302, + "end_time": 17.495375399673623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_3_B.wav", + "silence_duration": 0.5395203073064809, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But why do so many people live there?", + "original_text": "But why do so many people live there?", + "start_time": 17.95962285362038, + "end_time": 19.991368885366413, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_4_A.wav", + "silence_duration": 0.4642474539467583, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Most people grow accustomed to the climate, but there are many others who complain about", + "original_text": "Most people grow accustomed to the climate, but there are many others who complain about [interrupt] the high humidity and extreme temperatures during the summer months when heat indexes can reach dangerous levels above 100 degrees Fahrenheit.", + "start_time": 20.340651423656983, + "end_time": 32.15960833975676, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_5_B.wav", + "silence_duration": 0.3492825382905701, + "is_interrupted": true, + "text_after_interrupt": "the high humidity and extreme temperatures during the summer months when heat indexes can reach dangerous levels above 100 degrees Fahrenheit." + }, + { + "speaker": "A", + "text": "Complain? That's interesting. So, are there any cities where it rains a lot?", + "original_text": "Complain? That's interesting. So, are there any cities where it rains a lot?", + "start_time": 29.543241009529297, + "end_time": 33.93181243810073, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_6_A.wav", + "silence_duration": 0.3858654570300314, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Several. Two good examples are Seattle, in the state of Washington, and Portland, Oregon.", + "original_text": "Several. Two good examples are Seattle, in the state of Washington, and Portland, Oregon.", + "start_time": 34.393516982018724, + "end_time": 39.40902718610036, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_7_B.wav", + "silence_duration": 0.46170454391799737, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Tell us about some cold cities.", + "original_text": "Tell us about some cold cities.", + "start_time": 39.88026721045748, + "end_time": 41.79591346896088, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_8_A.wav", + "silence_duration": 0.4712400243571194, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "In the north there are many cities which are very cold in the winter. Boston and Chicago are two of them.", + "original_text": "In the north there are many cities which are very cold in the winter. Boston and Chicago are two of them.", + "start_time": 42.31119776282387, + "end_time": 47.3615378988783, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_9_B.wav", + "silence_duration": 0.5152842938629931, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is it always cold in Chicago and Boston?", + "original_text": "Is it always cold in Chicago and Boston?", + "start_time": 47.83861957412537, + "end_time": 50.33476469884192, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_10_A.wav", + "silence_duration": 0.4770816752470723, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, no. On the contrary, there are many beautiful days, especially in the spring and fall. Also, about what I was saying earlier, people often complain about the heat, but they stay because of job opportunities or family ties.", + "original_text": "Oh, no. On the contrary, there are many beautiful days, especially in the spring and fall. Also, about what I was saying earlier, people often complain about the heat, but they stay because of job opportunities or family ties.", + "start_time": 50.7673036597102, + "end_time": 62.42372089327029, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--15/temp/line_11_B.wav", + "silence_duration": 0.4325389608682766, + "is_interrupted": false + } + ] + }, + "DialogSum--val--16": { + "original_text": "A: Julia, I would like to have a word with you. Have a seat. \nB: Thank you. \nA: According to your performance, I decided to give you a salary increase. From next month, there will be a 2,000 yuan raise to your salary. Although your first raise might not sound considerable, the company believes that with your ability, sooner or later you'll [interrupt] be in line for more significant raises as you continue to grow and contribute to the company's success through innovative solutions and leadership potential we've observed in your work. \nB: Sorry to interrupt, Mr. George, but I wanted to ask—does this raise reflect my recent project contributions, or is it more based on my overall performance since joining? \nA: It's based on both, actually. Your recent projects have been impressive, and that's why we believe you'll get a better raise in the future as well. I think you deserved this. \nB: Thank you again. I'll keep doing my best.", + "cleaned_text": "A: Julia, I would like to have a word with you. Have a seat. \nB: Thank you. \nA:According to your performance, I decided to give you a salary increase. From next month, there will be a 2,000 yuan raise to your salary. Although your first raise might not sound considerable, the company believes that with your ability, sooner or later you'll be in line for more significant raises as you continue to grow and contribute to the company's success through innovative solutions and leadership potential we've observed in your work.\nB: Sorry to interrupt, Mr. George, but I wanted to ask—does this raise reflect my recent project contributions, or is it more based on my overall performance since joining? \nA: It's based on both, actually. Your recent projects have been impressive, and that's why we believe you'll get a better raise in the future as well. I think you deserved this. \nB: Thank you again. I'll keep doing my best.", + "total_duration": 44.39551020408163, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Julia, I would like to have a word with you. Have a seat.", + "original_text": "Julia, I would like to have a word with you. Have a seat.", + "start_time": 0, + "end_time": 3.912562358276644, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you.", + "original_text": "Thank you.", + "start_time": 4.3841975513957125, + "end_time": 4.918256508311813, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/temp/line_1_B.wav", + "silence_duration": 0.47163519311906843, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "According to your performance, I decided to give you a salary increase. From next month, there will be a 2,000 yuan raise to your salary. Although your first raise might not sound considerable, the company believes that with your ability, sooner or later you'll", + "original_text": "According to your performance, I decided to give you a salary increase. From next month, there will be a 2,000 yuan raise to your salary. Although your first raise might not sound considerable, the company believes that with your ability, sooner or later you'll [interrupt] be in line for more significant raises as you continue to grow and contribute to the company's success through innovative solutions and leadership potential we've observed in your work.", + "start_time": 5.357055953920647, + "end_time": 30.2488473371406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/temp/line_2_A.wav", + "silence_duration": 0.4387994456088349, + "is_interrupted": true, + "text_after_interrupt": "be in line for more significant raises as you continue to grow and contribute to the company's success through innovative solutions and leadership potential we've observed in your work." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, Mr. George, but I wanted to ask—does this raise reflect my recent project contributions, or is it more based on my overall performance since joining?", + "original_text": "Sorry to interrupt, Mr. George, but I wanted to ask—does this raise reflect my recent project contributions, or is it more based on my overall performance since joining?", + "start_time": 20.926035545757383, + "end_time": 30.22562738249208, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/temp/line_3_B.wav", + "silence_duration": 0.40756813379394313, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's based on both, actually. Your recent projects have been impressive, and that's why we believe you'll get a better raise in the future as well. I think you deserved this.", + "original_text": "It's based on both, actually. Your recent projects have been impressive, and that's why we believe you'll get a better raise in the future as well. I think you deserved this.", + "start_time": 30.847094713133956, + "end_time": 41.89979312583237, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/temp/line_4_A.wav", + "silence_duration": 0.5982473759933569, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you again. I'll keep doing my best.", + "original_text": "Thank you again. I'll keep doing my best.", + "start_time": 42.456655462574254, + "end_time": 44.39552167572618, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--16/temp/line_5_B.wav", + "silence_duration": 0.5568623367418869, + "is_interrupted": false + } + ] + }, + "DialogSum--val--17": { + "original_text": "A: I'm afraid it's bad news for you. You haven't got the position. \nB: Oh, no! I can't have failed. Are you sure? \nA: I'm afraid so. I'm terribly sorry. \nB: It sucks. But Arden told me he's satisfied with my qualifications and [interrupt] thought I was a strong candidate for the role, especially considering my extensive experience and the successful projects I've led in the past year. \nA: Sorry to cut in, but I just want to clarify—Arden might have been satisfied, but he's not the only one who makes the final decision. There were others involved in the process. \nB: Right, I understand. But how am I going to face the fellows in our office? They thought I would be promoted. They must be waiting for my good news. \nA: I don't think the thing can be that serious. You should face the result. Besides, I don't think the position is the best for you. \nB: But I lost the chance. And you mentioned Arden wasn't the only one deciding—who else was involved?", + "cleaned_text": "A: I'm afraid it's bad news for you. You haven't got the position. \nB: Oh, no! I can't have failed. Are you sure? \nA: I'm afraid so. I'm terribly sorry. \nB:It sucks. But Arden told me he's satisfied with my qualifications and thought I was a strong candidate for the role, especially considering my extensive experience and the successful projects I've led in the past year.\nA: Sorry to cut in, but I just want to clarify—Arden might have been satisfied, but he's not the only one who makes the final decision. There were others involved in the process. \nB: Right, I understand. But how am I going to face the fellows in our office? They thought I would be promoted. They must be waiting for my good news. \nA: I don't think the thing can be that serious. You should face the result. Besides, I don't think the position is the best for you. \nB: But I lost the chance. And you mentioned Arden wasn't the only one deciding—who else was involved?", + "total_duration": 47.47424036281179, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm afraid it's bad news for you. You haven't got the position.", + "original_text": "I'm afraid it's bad news for you. You haven't got the position.", + "start_time": 0, + "end_time": 3.889342403628118, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, no! I can't have failed. Are you sure?", + "original_text": "Oh, no! I can't have failed. Are you sure?", + "start_time": 4.285128801179243, + "end_time": 6.7232240392744815, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_1_B.wav", + "silence_duration": 0.39578639755112544, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm afraid so. I'm terribly sorry.", + "original_text": "I'm afraid so. I'm terribly sorry.", + "start_time": 7.08933474136307, + "end_time": 10.165978732292775, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_2_A.wav", + "silence_duration": 0.3661107020885884, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It sucks. But Arden told me he's satisfied with my qualifications and", + "original_text": "It sucks. But Arden told me he's satisfied with my qualifications and [interrupt] thought I was a strong candidate for the role, especially considering my extensive experience and the successful projects I've led in the past year.", + "start_time": 10.480068817459657, + "end_time": 22.11326609637122, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_3_B.wav", + "silence_duration": 0.31409008516688236, + "is_interrupted": true, + "text_after_interrupt": "thought I was a strong candidate for the role, especially considering my extensive experience and the successful projects I've led in the past year." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but I just want to clarify—Arden might have been satisfied, but he's not the only one who makes the final decision. There were others involved in the process.", + "original_text": "Sorry to cut in, but I just want to clarify—Arden might have been satisfied, but he's not the only one who makes the final decision. There were others involved in the process.", + "start_time": 15.809048409296391, + "end_time": 26.66437720748233, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_4_A.wav", + "silence_duration": 0.5500353153153363, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right, I understand. But how am I going to face the fellows in our office? They thought I would be promoted. They must be waiting for my good news.", + "original_text": "Right, I understand. But how am I going to face the fellows in our office? They thought I would be promoted. They must be waiting for my good news.", + "start_time": 27.182328521339056, + "end_time": 34.46178430365198, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_5_B.wav", + "silence_duration": 0.5179513138567234, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't think the thing can be that serious. You should face the result. Besides, I don't think the position is the best for you.", + "original_text": "I don't think the thing can be that serious. You should face the result. Besides, I don't think the position is the best for you.", + "start_time": 34.9657439625336, + "end_time": 42.33807956344063, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_6_A.wav", + "silence_duration": 0.5039596588816174, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But I lost the chance. And you mentioned Arden wasn't the only one deciding—who else was involved?", + "original_text": "But I lost the chance. And you mentioned Arden wasn't the only one deciding—who else was involved?", + "start_time": 42.92313509500093, + "end_time": 47.47424620611204, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--17/temp/line_7_B.wav", + "silence_duration": 0.5850555315602983, + "is_interrupted": false + } + ] + }, + "DialogSum--val--19": { + "original_text": "A: Can I help you, ma'am? \nB: Yes, will you keep our bags until 6 p.m.? \nA: Are you all our guests? \nB: Yes, we checked out just now. \nA: Please fill in this [interrupt] form with your details so we can store your bags securely and ensure they are properly labeled for easy retrieval when you return later this evening. \nB: Oh, before I forget, do you need any ID or proof of our stay while filling this out? \nA: No, just your name and room number will be fine. But as I was saying, please fill in this form. \nB: Is this all right? \nA: So you are leaving this evening. We keep your bags until 6 p.m. Here's your tag. \nB: Thanks a lot.", + "cleaned_text": "A: Can I help you, ma'am? \nB: Yes, will you keep our bags until 6 p.m.? \nA: Are you all our guests? \nB: Yes, we checked out just now. \nA:Please fill in this form with your details so we can store your bags securely and ensure they are properly labeled for easy retrieval when you return later this evening.\nB: Oh, before I forget, do you need any ID or proof of our stay while filling this out? \nA: No, just your name and room number will be fine. But as I was saying, please fill in this form. \nB: Is this all right? \nA: So you are leaving this evening. We keep your bags until 6 p.m. Here's your tag. \nB: Thanks a lot.", + "total_duration": 32.75170068027211, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can I help you, ma'am?", + "original_text": "Can I help you, ma'am?", + "start_time": 0, + "end_time": 1.0797278911564625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, will you keep our bags until 6 p.m.?", + "original_text": "Yes, will you keep our bags until 6 p.m.?", + "start_time": 1.5859058047306571, + "end_time": 3.954341178880317, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_1_B.wav", + "silence_duration": 0.5061779135741945, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you all our guests?", + "original_text": "Are you all our guests?", + "start_time": 4.446651759954051, + "end_time": 5.805019106892827, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_2_A.wav", + "silence_duration": 0.4923105810737335, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, we checked out just now.", + "original_text": "Yes, we checked out just now.", + "start_time": 6.321212202171794, + "end_time": 8.039488846162724, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_3_B.wav", + "silence_duration": 0.5161930952789676, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Please fill in this", + "original_text": "Please fill in this [interrupt] form with your details so we can store your bags securely and ensure they are properly labeled for easy retrieval when you return later this evening.", + "start_time": 8.567017788139893, + "end_time": 18.156859057981162, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_4_A.wav", + "silence_duration": 0.5275289419771687, + "is_interrupted": true, + "text_after_interrupt": "form with your details so we can store your bags securely and ensure they are properly labeled for easy retrieval when you return later this evening." + }, + { + "speaker": "B", + "text": "Oh, before I forget, do you need any ID or proof of our stay while filling this out?", + "original_text": "Oh, before I forget, do you need any ID or proof of our stay while filling this out?", + "start_time": 9.844115293808827, + "end_time": 14.232686722380254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_5_B.wav", + "silence_duration": 0.4154015923108265, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, just your name and room number will be fine. But as I was saying, please fill in this form.", + "original_text": "No, just your name and room number will be fine. But as I was saying, please fill in this form.", + "start_time": 18.621475096332095, + "end_time": 24.53095355438198, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_6_A.wav", + "silence_duration": 0.46461603835093324, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is this all right?", + "original_text": "Is this all right?", + "start_time": 25.083063185797858, + "end_time": 25.953811485117587, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_7_B.wav", + "silence_duration": 0.5521096314158777, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So you are leaving this evening. We keep your bags until 6 p.m. Here's your tag.", + "original_text": "So you are leaving this evening. We keep your bags until 6 p.m. Here's your tag.", + "start_time": 26.4224043322471, + "end_time": 31.49596442295005, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_8_A.wav", + "silence_duration": 0.468592847129514, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks a lot.", + "original_text": "Thanks a lot.", + "start_time": 31.97384980408009, + "end_time": 32.75171828480571, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--19/temp/line_9_B.wav", + "silence_duration": 0.4778853811300397, + "is_interrupted": false + } + ] + }, + "DialogSum--val--20": { + "original_text": "A: Sorry, Brad. But you are going to have to re-do this.\nB: What's the problem, Ms. Murphy?\nA: It's badly organized. I can't present this to [interrupt] the board in its current state because the flow of information is confusing and the visual presentation doesn't meet our corporate standards for professional reports.\nB: The board? I understand. I'll make sure it's more structured. Is there anything specific you'd like me to focus on?\nA: Yes, the key points aren't clear enough. And I was also going to mention that the data analysis section needs more [interrupt] depth, especially in terms of comparing our current performance with industry benchmarks and providing actionable insights that could help us improve our market position.\nB: Oh, more detailed breakdowns? I can definitely add that. I'll re-work it and give it back to you this afternoon.", + "cleaned_text": "A: Sorry, Brad. But you are going to have to re-do this.\nB: What's the problem, Ms. Murphy?\nA:It's badly organized. I can't present this to the board in its current state because the flow of information is confusing and the visual presentation doesn't meet our corporate standards for professional reports.\nB: The board? I understand. I'll make sure it's more structured. Is there anything specific you'd like me to focus on?\nA:Yes, the key points aren't clear enough. And I was also going to mention that the data analysis section needs more depth, especially in terms of comparing our current performance with industry benchmarks and providing actionable insights that could help us improve our market position.\nB: Oh, more detailed breakdowns? I can definitely add that. I'll re-work it and give it back to you this afternoon.", + "total_duration": 37.88453514739229, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Sorry, Brad. But you are going to have to re-do this.", + "original_text": "Sorry, Brad. But you are going to have to re-do this.", + "start_time": 0, + "end_time": 3.633922902494331, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What's the problem, Ms. Murphy?", + "original_text": "What's the problem, Ms. Murphy?", + "start_time": 4.134210208425758, + "end_time": 5.6318972832556895, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/temp/line_1_B.wav", + "silence_duration": 0.5002873059314275, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's badly organized. I can't present this to", + "original_text": "It's badly organized. I can't present this to [interrupt] the board in its current state because the flow of information is confusing and the visual presentation doesn't meet our corporate standards for professional reports.", + "start_time": 6.089149047671474, + "end_time": 18.802074217739502, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/temp/line_2_A.wav", + "silence_duration": 0.4572517644157844, + "is_interrupted": true, + "text_after_interrupt": "the board in its current state because the flow of information is confusing and the visual presentation doesn't meet our corporate standards for professional reports." + }, + { + "speaker": "B", + "text": "The board? I understand. I'll make sure it's more structured. Is there anything specific you'd like me to focus on?", + "original_text": "The board? I understand. I'll make sure it's more structured. Is there anything specific you'd like me to focus on?", + "start_time": 9.142573083952653, + "end_time": 15.55128056694585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/temp/line_3_B.wav", + "silence_duration": 0.482796334699901, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, the key points aren't clear enough. And I was also going to mention that the data analysis section needs more", + "original_text": "Yes, the key points aren't clear enough. And I was also going to mention that the data analysis section needs more [interrupt] depth, especially in terms of comparing our current performance with industry benchmarks and providing actionable insights that could help us improve our market position.", + "start_time": 19.302781447482, + "end_time": 36.41588802344572, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/temp/line_4_A.wav", + "silence_duration": 0.5007072297424985, + "is_interrupted": true, + "text_after_interrupt": "depth, especially in terms of comparing our current performance with industry benchmarks and providing actionable insights that could help us improve our market position." + }, + { + "speaker": "B", + "text": "Oh, more detailed breakdowns? I can definitely add that. I'll re-work it and give it back to you this afternoon.", + "original_text": "Oh, more detailed breakdowns? I can definitely add that. I'll re-work it and give it back to you this afternoon.", + "start_time": 32.613646724396645, + "end_time": 37.88457642961207, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--20/temp/line_5_B.wav", + "silence_duration": 0.3513353313568865, + "is_interrupted": false + } + ] + }, + "DialogSum--val--21": { + "original_text": "A: Did you know that drinking beer helps you sing better? \nB: Are you sure? How do you [interrupt] know that? Have you tried it yourself or is this something you've researched extensively through scientific studies or personal experimentation? \nA: Sorry, I just remembered—how do you know that? Is it based on personal experience or something you read? \nB: Well, usually people think I'm a terrible singer, but after we all have a few beers, they say I sound a lot better! \nA: Well, I heard that if you drink enough beer, you can speak foreign languages better. . . \nB: Then after a few beers, you'll be singing in Taiwanese? \nA: Maybe. . . But wait, I didn't catch how you knew people think you sing better after drinking. Was that just from your friends? \nB: Yeah, it's mostly just my friends who've noticed.", + "cleaned_text": "A: Did you know that drinking beer helps you sing better? \nB:Are you sure? How do you know that? Have you tried it yourself or is this something you've researched extensively through scientific studies or personal experimentation?\nA: Sorry, I just remembered—how do you know that? Is it based on personal experience or something you read? \nB: Well, usually people think I'm a terrible singer, but after we all have a few beers, they say I sound a lot better! \nA: Well, I heard that if you drink enough beer, you can speak foreign languages better. . . \nB: Then after a few beers, you'll be singing in Taiwanese? \nA: Maybe. . . But wait, I didn't catch how you knew people think you sing better after drinking. Was that just from your friends? \nB: Yeah, it's mostly just my friends who've noticed.", + "total_duration": 36.72562358276644, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Did you know that drinking beer helps you sing better?", + "original_text": "Did you know that drinking beer helps you sing better?", + "start_time": 0, + "end_time": 2.6122448979591835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Are you sure? How do you", + "original_text": "Are you sure? How do you [interrupt] know that? Have you tried it yourself or is this something you've researched extensively through scientific studies or personal experimentation?", + "start_time": 3.015987557154163, + "end_time": 11.247461480056657, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_1_B.wav", + "silence_duration": 0.4037426591949791, + "is_interrupted": true, + "text_after_interrupt": "know that? Have you tried it yourself or is this something you've researched extensively through scientific studies or personal experimentation?" + }, + { + "speaker": "A", + "text": "Sorry, I just remembered—how do you know that? Is it based on personal experience or something you read?", + "original_text": "Sorry, I just remembered—how do you know that? Is it based on personal experience or something you read?", + "start_time": 4.606554450578199, + "end_time": 11.003651956247133, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_2_A.wav", + "silence_duration": 0.380874274961859, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, usually people think I'm a terrible singer, but after we all have a few beers, they say I sound a lot better!", + "original_text": "Well, usually people think I'm a terrible singer, but after we all have a few beers, they say I sound a lot better!", + "start_time": 11.755334154342373, + "end_time": 17.73447247633784, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_3_B.wav", + "silence_duration": 0.5078726742857165, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I heard that if you drink enough beer, you can speak foreign languages better. . .", + "original_text": "Well, I heard that if you drink enough beer, you can speak foreign languages better. . .", + "start_time": 18.11072182026905, + "end_time": 22.487683271516214, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_4_A.wav", + "silence_duration": 0.376249343931211, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Then after a few beers, you'll be singing in Taiwanese?", + "original_text": "Then after a few beers, you'll be singing in Taiwanese?", + "start_time": 23.081222272589166, + "end_time": 25.797956966466717, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_5_B.wav", + "silence_duration": 0.5935390010729523, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Maybe. . . But wait, I didn't catch how you knew people think you sing better after drinking. Was that just from your friends?", + "original_text": "Maybe. . . But wait, I didn't catch how you knew people think you sing better after drinking. Was that just from your friends?", + "start_time": 26.394222037072943, + "end_time": 33.96392725249245, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_6_A.wav", + "silence_duration": 0.5962650706062245, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, it's mostly just my friends who've noticed.", + "original_text": "Yeah, it's mostly just my friends who've noticed.", + "start_time": 34.45010872792128, + "end_time": 36.72566428347684, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--21/temp/line_7_B.wav", + "silence_duration": 0.4861814754288383, + "is_interrupted": false + } + ] + }, + "DialogSum--val--23": { + "original_text": "A: Amy, you don't look so well. What happened? \nB: Yes. I feel terrible. I have been coughing for the whole [interrupt] night, and I couldn't sleep at all because my throat feels incredibly sore and my head is pounding like there's a drum inside it. \nA: Morning? That sounds concerning. Do you feel anything else? \nB: Yes. I feel chilly and sluggish. \nA: Have you had similar feelings before? \nB: No. This is my first day abroad. I am not sure what is [interrupt] causing this, but I hope it's nothing serious like a viral infection or some kind of allergic reaction to the new environment. \nA: Wrong with you? It might just be the local climate not agreeing with you. I'll get you some medicine. \nB: Thank you very much.", + "cleaned_text": "A: Amy, you don't look so well. What happened? \nB:Yes. I feel terrible. I have been coughing for the whole night, and I couldn't sleep at all because my throat feels incredibly sore and my head is pounding like there's a drum inside it.\nA: Morning? That sounds concerning. Do you feel anything else? \nB: Yes. I feel chilly and sluggish. \nA: Have you had similar feelings before? \nB:No. This is my first day abroad. I am not sure what is causing this, but I hope it's nothing serious like a viral infection or some kind of allergic reaction to the new environment.\nA: Wrong with you? It might just be the local climate not agreeing with you. I'll get you some medicine. \nB: Thank you very much.", + "total_duration": 32.359591836734694, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Amy, you don't look so well. What happened?", + "original_text": "Amy, you don't look so well. What happened?", + "start_time": 0, + "end_time": 2.4961451247165534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. I feel terrible. I have been coughing for the whole", + "original_text": "Yes. I feel terrible. I have been coughing for the whole [interrupt] night, and I couldn't sleep at all because my throat feels incredibly sore and my head is pounding like there's a drum inside it.", + "start_time": 2.9526853253403806, + "end_time": 11.92719779699571, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_1_B.wav", + "silence_duration": 0.4565402006238273, + "is_interrupted": true, + "text_after_interrupt": "night, and I couldn't sleep at all because my throat feels incredibly sore and my head is pounding like there's a drum inside it." + }, + { + "speaker": "A", + "text": "Morning? That sounds concerning. Do you feel anything else?", + "original_text": "Morning? That sounds concerning. Do you feel anything else?", + "start_time": 6.2266989307825575, + "end_time": 10.104431357086412, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_2_A.wav", + "silence_duration": 0.3129817549685412, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. I feel chilly and sluggish.", + "original_text": "Yes. I feel chilly and sluggish.", + "start_time": 12.25117540840277, + "end_time": 14.190041621554697, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_3_B.wav", + "silence_duration": 0.32397761140705916, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Have you had similar feelings before?", + "original_text": "Have you had similar feelings before?", + "start_time": 14.767035134823601, + "end_time": 16.775561211921108, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_4_A.wav", + "silence_duration": 0.5769935132689052, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. This is my first day abroad. I am not sure what is", + "original_text": "No. This is my first day abroad. I am not sure what is [interrupt] causing this, but I hope it's nothing serious like a viral infection or some kind of allergic reaction to the new environment.", + "start_time": 17.120299703517414, + "end_time": 25.955492447281586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_5_B.wav", + "silence_duration": 0.34473849159630665, + "is_interrupted": true, + "text_after_interrupt": "causing this, but I hope it's nothing serious like a viral infection or some kind of allergic reaction to the new environment." + }, + { + "speaker": "A", + "text": "Wrong with you? It might just be the local climate not agreeing with you. I'll get you some medicine.", + "original_text": "Wrong with you? It might just be the local climate not agreeing with you. I'll get you some medicine.", + "start_time": 24.55436744981363, + "end_time": 30.846975159564195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_6_A.wav", + "silence_duration": 0.48984560974029084, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you very much.", + "original_text": "Thank you very much.", + "start_time": 31.279906584475818, + "end_time": 32.35963447563228, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--23/temp/line_7_B.wav", + "silence_duration": 0.43293142491162306, + "is_interrupted": false + } + ] + }, + "DialogSum--val--24": { + "original_text": "A: Would you like to order now, madam?\nB: Yes, please. I'd like the steak and mushrooms.\nA: How would you like your steak, rare, medium, or well-done?\nB: I'd like it well done, please.\nA: What kind of potatoes would you like to go with that, mashed, boiled, or baked?\nB: I think I'll have baked potatoes. And can I now have [interrupt] some extra butter on the side as well as a small portion of sour cream and chives to complement the potatoes perfectly?\nA: Sorry to jump in, did you mean baked potatoes, right?\nB: Yes, baked potatoes. And can I now have iced tea with lemon on the side, please?\nA: Good, and would you care for soup or salad to start with?\nB: I'd like cream onion soup, please.\nA: Will you have dessert to be, madam?\nB: I want to skip dessert. Oh, and just to confirm, you got the iced tea with lemon on the side, right?\nA: Yes, I've got that noted. That is all, thank you.", + "cleaned_text": "A: Would you like to order now, madam?\nB: Yes, please. I'd like the steak and mushrooms.\nA: How would you like your steak, rare, medium, or well-done?\nB: I'd like it well done, please.\nA: What kind of potatoes would you like to go with that, mashed, boiled, or baked?\nB:I think I'll have baked potatoes. And can I now have some extra butter on the side as well as a small portion of sour cream and chives to complement the potatoes perfectly?\nA: Sorry to jump in, did you mean baked potatoes, right?\nB: Yes, baked potatoes. And can I now have iced tea with lemon on the side, please?\nA: Good, and would you care for soup or salad to start with?\nB: I'd like cream onion soup, please.\nA: Will you have dessert to be, madam?\nB: I want to skip dessert. Oh, and just to confirm, you got the iced tea with lemon on the side, right?\nA: Yes, I've got that noted. That is all, thank you.", + "total_duration": 48.05673469387755, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Would you like to order now, madam?", + "original_text": "Would you like to order now, madam?", + "start_time": 0, + "end_time": 1.7298866213151927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, please. I'd like the steak and mushrooms.", + "original_text": "Yes, please. I'd like the steak and mushrooms.", + "start_time": 2.066080558955888, + "end_time": 4.480955842402601, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_1_B.wav", + "silence_duration": 0.3361939376406956, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How would you like your steak, rare, medium, or well-done?", + "original_text": "How would you like your steak, rare, medium, or well-done?", + "start_time": 5.026674289024623, + "end_time": 8.939236647301266, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_2_A.wav", + "silence_duration": 0.5457184466220218, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like it well done, please.", + "original_text": "I'd like it well done, please.", + "start_time": 9.396893688942564, + "end_time": 10.929410695745284, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_3_B.wav", + "silence_duration": 0.45765704164129806, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What kind of potatoes would you like to go with that, mashed, boiled, or baked?", + "original_text": "What kind of potatoes would you like to go with that, mashed, boiled, or baked?", + "start_time": 11.433875175668138, + "end_time": 15.903716445509408, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_4_A.wav", + "silence_duration": 0.5044644799228547, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think I'll have baked potatoes. And can I now have", + "original_text": "I think I'll have baked potatoes. And can I now have [interrupt] some extra butter on the side as well as a small portion of sour cream and chives to complement the potatoes perfectly?", + "start_time": 16.273672060121108, + "end_time": 24.505145983023603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_5_B.wav", + "silence_duration": 0.3699556146116989, + "is_interrupted": true, + "text_after_interrupt": "some extra butter on the side as well as a small portion of sour cream and chives to complement the potatoes perfectly?" + }, + { + "speaker": "A", + "text": "Sorry to jump in, did you mean baked potatoes, right?", + "original_text": "Sorry to jump in, did you mean baked potatoes, right?", + "start_time": 19.164556413862606, + "end_time": 23.04228884016646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_6_A.wav", + "silence_duration": 0.41424452363081876, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, baked potatoes. And can I now have iced tea with lemon on the side, please?", + "original_text": "Yes, baked potatoes. And can I now have iced tea with lemon on the side, please?", + "start_time": 24.957178569583903, + "end_time": 29.926248864368482, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_7_B.wav", + "silence_duration": 0.4520325865602986, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good, and would you care for soup or salad to start with?", + "original_text": "Good, and would you care for soup or salad to start with?", + "start_time": 30.231929793613414, + "end_time": 33.88907265075627, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_8_A.wav", + "silence_duration": 0.3056809292449319, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like cream onion soup, please.", + "original_text": "I'd like cream onion soup, please.", + "start_time": 34.33115820347459, + "end_time": 36.32807430324783, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_9_B.wav", + "silence_duration": 0.44208555271831695, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Will you have dessert to be, madam?", + "original_text": "Will you have dessert to be, madam?", + "start_time": 36.82706222709864, + "end_time": 38.74270848560204, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_10_A.wav", + "silence_duration": 0.49898792385080565, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I want to skip dessert. Oh, and just to confirm, you got the iced tea with lemon on the side, right?", + "original_text": "I want to skip dessert. Oh, and just to confirm, you got the iced tea with lemon on the side, right?", + "start_time": 39.06120107431222, + "end_time": 44.45984053009454, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_11_B.wav", + "silence_duration": 0.318492588710183, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I've got that noted. That is all, thank you.", + "original_text": "Yes, I've got that noted. That is all, thank you.", + "start_time": 44.78276576770211, + "end_time": 48.05677937314429, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--24/temp/line_12_A.wav", + "silence_duration": 0.3229252376075687, + "is_interrupted": false + } + ] + }, + "DialogSum--val--25": { + "original_text": "A: I've been working hard for a whole year. I really need a break.\nB: That's true. You need to take some time off to [interrupt] recharge and relax, maybe even travel somewhere new where you can experience different cultures and completely step away from your daily routine. You deserve it.\nA: Yes, exactly! I'm looking forward to my annual vacation.\nB: When are you going to take your vacation?\nA: Later this month. I can't wait to finally unwind and disconnect from work.\nB: Wait, later this month? That's so soon! I really envy you. You know I'm not taking my vacation until December.\nA: Oh, I was just about to say I can't [interrupt] wait! December sounds like a long time to hold out, especially when you've been working non-stop without any significant breaks since the beginning of the year.", + "cleaned_text": "A: I've been working hard for a whole year. I really need a break.\nB:That's true. You need to take some time off to recharge and relax, maybe even travel somewhere new where you can experience different cultures and completely step away from your daily routine. You deserve it.\nA: Yes, exactly! I'm looking forward to my annual vacation.\nB: When are you going to take your vacation?\nA: Later this month. I can't wait to finally unwind and disconnect from work.\nB: Wait, later this month? That's so soon! I really envy you. You know I'm not taking my vacation until December.\nA:Oh, I was just about to say I can't wait! December sounds like a long time to hold out, especially when you've been working non-stop without any significant breaks since the beginning of the year.", + "total_duration": 40.8568253968254, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I've been working hard for a whole year. I really need a break.", + "original_text": "I've been working hard for a whole year. I really need a break.", + "start_time": 0, + "end_time": 3.81968253968254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's true. You need to take some time off to", + "original_text": "That's true. You need to take some time off to [interrupt] recharge and relax, maybe even travel somewhere new where you can experience different cultures and completely step away from your daily routine. You deserve it.", + "start_time": 4.149722684262269, + "end_time": 15.086321323718051, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/temp/line_1_B.wav", + "silence_duration": 0.3300401445797288, + "is_interrupted": true, + "text_after_interrupt": "recharge and relax, maybe even travel somewhere new where you can experience different cultures and completely step away from your daily routine. You deserve it." + }, + { + "speaker": "A", + "text": "Yes, exactly! I'm looking forward to my annual vacation.", + "original_text": "Yes, exactly! I'm looking forward to my annual vacation.", + "start_time": 6.820017468842767, + "end_time": 10.871899555010568, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/temp/line_2_A.wav", + "silence_duration": 0.41163560913966146, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "When are you going to take your vacation?", + "original_text": "When are you going to take your vacation?", + "start_time": 15.471109357519007, + "end_time": 17.119726137564356, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/temp/line_3_B.wav", + "silence_duration": 0.38478803380095533, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Later this month. I can't wait to finally unwind and disconnect from work.", + "original_text": "Later this month. I can't wait to finally unwind and disconnect from work.", + "start_time": 17.70689957707136, + "end_time": 22.118690960291318, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/temp/line_4_A.wav", + "silence_duration": 0.5871734395070061, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait, later this month? That's so soon! I really envy you. You know I'm not taking my vacation until December.", + "original_text": "Wait, later this month? That's so soon! I really envy you. You know I'm not taking my vacation until December.", + "start_time": 22.518903044319433, + "end_time": 28.335501683775217, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/temp/line_5_B.wav", + "silence_duration": 0.40021208402811453, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was just about to say I can't", + "original_text": "Oh, I was just about to say I can't [interrupt] wait! December sounds like a long time to hold out, especially when you've been working non-stop without any significant breaks since the beginning of the year.", + "start_time": 28.88696266010039, + "end_time": 40.856849281415585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--25/temp/line_6_A.wav", + "silence_duration": 0.5514609763251755, + "is_interrupted": true, + "text_after_interrupt": "wait! December sounds like a long time to hold out, especially when you've been working non-stop without any significant breaks since the beginning of the year." + } + ] + }, + "DialogSum--val--26": { + "original_text": "A: Waiter, get me a rag, please. I have just spilled my [interrupt] coffee all over the table and it's starting to drip onto the floor which could make this area quite dangerous for other customers.\nB: Sorry to interrupt, but let me help you with that first. \nA: Thank you. Please bring me some paper napkins as well. \nB: Oh, right! Here you are. By the way, do you still need that rag?", + "cleaned_text": "A:Waiter, get me a rag, please. I have just spilled my coffee all over the table and it's starting to drip onto the floor which could make this area quite dangerous for other customers.\nB: Sorry to interrupt, but let me help you with that first. \nA: Thank you. Please bring me some paper napkins as well. \nB: Oh, right! Here you are. By the way, do you still need that rag?", + "total_duration": 18.0075283446712, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--26/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--26/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--26/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Waiter, get me a rag, please. I have just spilled my", + "original_text": "Waiter, get me a rag, please. I have just spilled my [interrupt] coffee all over the table and it's starting to drip onto the floor which could make this area quite dangerous for other customers.", + "start_time": 0, + "end_time": 10.39092970521542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--26/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "coffee all over the table and it's starting to drip onto the floor which could make this area quite dangerous for other customers." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but let me help you with that first.", + "original_text": "Sorry to interrupt, but let me help you with that first.", + "start_time": 3.308843537414966, + "end_time": 6.106848072562358, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--26/temp/line_1_B.wav", + "silence_duration": 0.4767408429851847, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you. Please bring me some paper napkins as well.", + "original_text": "Thank you. Please bring me some paper napkins as well.", + "start_time": 10.706388136683922, + "end_time": 13.806252082262153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--26/temp/line_2_A.wav", + "silence_duration": 0.31545843146850056, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! Here you are. By the way, do you still need that rag?", + "original_text": "Oh, right! Here you are. By the way, do you still need that rag?", + "start_time": 14.269147647858464, + "end_time": 18.007560346271163, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--26/temp/line_3_B.wav", + "silence_duration": 0.46289556559631095, + "is_interrupted": false + } + ] + }, + "DialogSum--val--27": { + "original_text": "A: What's wrong with you? \nB: I'm trying to send the instruction book by E-mail, but I failed many, many times. And there is something wrong with the net maybe. It's so [interrupt] frustrating because I need to get this sent out urgently and I'm worried I might miss the deadline if this keeps happening. \nA: Sorry to cut in, but have you tried restarting your router? Sometimes a quick reset can solve the issue. \nB: I haven't tried that yet, but I will. By the way, I am used to editing with Word 2003, and there are many pictures in the book. \nA: It's beyond question. You can save it the same as a document. \nB: I merely know how to send the direct letter. But I am not familiar with the attachment. \nA: It's the same as usual. The only difference lies in that you need to paste the book as an attachment. \nB: Can I mail the book if it is a large file? \nA: There are limitations to the capacity of an E-mail. Commonly it's no more than 4 MB. \nB: What if it exceeds the [interrupt] limit? I'm worried it might be too large to send and I don't know how to compress the file or split it into smaller parts to make it work. \nA: Oh, I almost forgot to mention, you can use cloud services like Google Drive or Dropbox for large files. But what were you asking about the capacity? \nB: Yes, I was asking what to do if the file exceeds the E-mail capacity.", + "cleaned_text": "A: What's wrong with you? \nB:I'm trying to send the instruction book by E-mail, but I failed many, many times. And there is something wrong with the net maybe. It's so frustrating because I need to get this sent out urgently and I'm worried I might miss the deadline if this keeps happening.\nA: Sorry to cut in, but have you tried restarting your router? Sometimes a quick reset can solve the issue. \nB: I haven't tried that yet, but I will. By the way, I am used to editing with Word 2003, and there are many pictures in the book. \nA: It's beyond question. You can save it the same as a document. \nB: I merely know how to send the direct letter. But I am not familiar with the attachment. \nA: It's the same as usual. The only difference lies in that you need to paste the book as an attachment. \nB: Can I mail the book if it is a large file? \nA: There are limitations to the capacity of an E-mail. Commonly it's no more than 4 MB. \nB:What if it exceeds the limit? I'm worried it might be too large to send and I don't know how to compress the file or split it into smaller parts to make it work.\nA: Oh, I almost forgot to mention, you can use cloud services like Google Drive or Dropbox for large files. But what were you asking about the capacity? \nB: Yes, I was asking what to do if the file exceeds the E-mail capacity.", + "total_duration": 68.53056689342404, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What's wrong with you?", + "original_text": "What's wrong with you?", + "start_time": 0, + "end_time": 1.2887074829931973, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm trying to send the instruction book by E-mail, but I failed many, many times. And there is something wrong with the net maybe. It's so", + "original_text": "I'm trying to send the instruction book by E-mail, but I failed many, many times. And there is something wrong with the net maybe. It's so [interrupt] frustrating because I need to get this sent out urgently and I'm worried I might miss the deadline if this keeps happening.", + "start_time": 1.7128329677593563, + "end_time": 14.367708251206068, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_1_B.wav", + "silence_duration": 0.4241254847661592, + "is_interrupted": true, + "text_after_interrupt": "frustrating because I need to get this sent out urgently and I'm worried I might miss the deadline if this keeps happening." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but have you tried restarting your router? Sometimes a quick reset can solve the issue.", + "original_text": "Sorry to cut in, but have you tried restarting your router? Sometimes a quick reset can solve the issue.", + "start_time": 9.363808024448698, + "end_time": 16.21369464576389, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_2_A.wav", + "silence_duration": 0.5880698370124955, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I haven't tried that yet, but I will. By the way, I am used to editing with Word 2003, and there are many pictures in the book.", + "original_text": "I haven't tried that yet, but I will. By the way, I am used to editing with Word 2003, and there are many pictures in the book.", + "start_time": 16.57979207978043, + "end_time": 23.673488224905146, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_3_B.wav", + "silence_duration": 0.3660974340165382, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's beyond question. You can save it the same as a document.", + "original_text": "It's beyond question. You can save it the same as a document.", + "start_time": 24.131792087274206, + "end_time": 27.568345375256065, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_4_A.wav", + "silence_duration": 0.45830386236905907, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I merely know how to send the direct letter. But I am not familiar with the attachment.", + "original_text": "I merely know how to send the direct letter. But I am not familiar with the attachment.", + "start_time": 28.064916417872436, + "end_time": 32.2212882999586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_5_B.wav", + "silence_duration": 0.4965710426163696, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's the same as usual. The only difference lies in that you need to paste the book as an attachment.", + "original_text": "It's the same as usual. The only difference lies in that you need to paste the book as an attachment.", + "start_time": 32.611534361628586, + "end_time": 38.509402842354206, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_6_A.wav", + "silence_duration": 0.3902460616699873, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Can I mail the book if it is a large file?", + "original_text": "Can I mail the book if it is a large file?", + "start_time": 39.10318455188124, + "end_time": 41.192980470248585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_7_B.wav", + "silence_duration": 0.5937817095270386, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There are limitations to the capacity of an E-mail. Commonly it's no more than 4 MB.", + "original_text": "There are limitations to the capacity of an E-mail. Commonly it's no more than 4 MB.", + "start_time": 41.5961071655085, + "end_time": 47.528805578206914, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_8_A.wav", + "silence_duration": 0.4031266952599107, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What if it exceeds the", + "original_text": "What if it exceeds the [interrupt] limit? I'm worried it might be too large to send and I don't know how to compress the file or split it into smaller parts to make it work.", + "start_time": 47.96416012261519, + "end_time": 56.21885400016621, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_9_B.wav", + "silence_duration": 0.43535454440827515, + "is_interrupted": true, + "text_after_interrupt": "limit? I'm worried it might be too large to send and I don't know how to compress the file or split it into smaller parts to make it work." + }, + { + "speaker": "A", + "text": "Oh, I almost forgot to mention, you can use cloud services like Google Drive or Dropbox for large files. But what were you asking about the capacity?", + "original_text": "Oh, I almost forgot to mention, you can use cloud services like Google Drive or Dropbox for large files. But what were you asking about the capacity?", + "start_time": 54.788441735514574, + "end_time": 64.2041333454919, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_10_A.wav", + "silence_duration": 0.40961852357849676, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I was asking what to do if the file exceeds the E-mail capacity.", + "original_text": "Yes, I was asking what to do if the file exceeds the E-mail capacity.", + "start_time": 64.71091401444582, + "end_time": 68.53059655412837, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--27/temp/line_11_B.wav", + "silence_duration": 0.5067806689539215, + "is_interrupted": false + } + ] + }, + "DialogSum--val--28": { + "original_text": "A: Bill, will you be free at noon? \nB: Yes. What can I do for you? \nA: We need a new filing cabinet in the office. Could you go downtown with me after lunch? \nB: All right. Have you got an idea about what type to [interrupt] consider? I was thinking about something that matches the current office decor while also providing additional storage space for our growing document collection. \nA: Sorry to cut you off, but I just realized—do we have enough space in the office for another cabinet? \nB: Good point. Yes, we do have space. I was asking if you had an idea about what type to buy? \nA: Yes, the same as the one we have. And we also need some small articles in the office, such as pens, clips, erasers and sticky notes. \nB: Can you remember them all?", + "cleaned_text": "A: Bill, will you be free at noon? \nB: Yes. What can I do for you? \nA: We need a new filing cabinet in the office. Could you go downtown with me after lunch? \nB:All right. Have you got an idea about what type to consider? I was thinking about something that matches the current office decor while also providing additional storage space for our growing document collection.\nA: Sorry to cut you off, but I just realized—do we have enough space in the office for another cabinet? \nB: Good point. Yes, we do have space. I was asking if you had an idea about what type to buy? \nA: Yes, the same as the one we have. And we also need some small articles in the office, such as pens, clips, erasers and sticky notes. \nB: Can you remember them all?", + "total_duration": 37.33963718820862, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Bill, will you be free at noon?", + "original_text": "Bill, will you be free at noon?", + "start_time": 0, + "end_time": 1.7531065759637188, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. What can I do for you?", + "original_text": "Yes. What can I do for you?", + "start_time": 2.222715914359732, + "end_time": 3.8713326944050834, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_1_B.wav", + "silence_duration": 0.46960933839601315, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We need a new filing cabinet in the office. Could you go downtown with me after lunch?", + "original_text": "We need a new filing cabinet in the office. Could you go downtown with me after lunch?", + "start_time": 4.255675346617043, + "end_time": 9.41050527858983, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_2_A.wav", + "silence_duration": 0.3843426522119592, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right. Have you got an idea about what type to", + "original_text": "All right. Have you got an idea about what type to [interrupt] consider? I was thinking about something that matches the current office decor while also providing additional storage space for our growing document collection.", + "start_time": 9.818565011223319, + "end_time": 19.97729516995348, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_3_B.wav", + "silence_duration": 0.4080597326334878, + "is_interrupted": true, + "text_after_interrupt": "consider? I was thinking about something that matches the current office decor while also providing additional storage space for our growing document collection." + }, + { + "speaker": "A", + "text": "Sorry to cut you off, but I just realized—do we have enough space in the office for another cabinet?", + "original_text": "Sorry to cut you off, but I just realized—do we have enough space in the office for another cabinet?", + "start_time": 12.61656954637071, + "end_time": 18.653757754987492, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_4_A.wav", + "silence_duration": 0.4262985178707538, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good point. Yes, we do have space. I was asking if you had an idea about what type to buy?", + "original_text": "Good point. Yes, we do have space. I was asking if you had an idea about what type to buy?", + "start_time": 20.446922793317285, + "end_time": 26.344791274042908, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_5_B.wav", + "silence_duration": 0.46962762336380637, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, the same as the one we have. And we also need some small articles in the office, such as pens, clips, erasers and sticky notes.", + "original_text": "Yes, the same as the one we have. And we also need some small articles in the office, such as pens, clips, erasers and sticky notes.", + "start_time": 26.919091223559967, + "end_time": 35.928433627188085, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_6_A.wav", + "silence_duration": 0.5742999495170599, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Can you remember them all?", + "original_text": "Can you remember them all?", + "start_time": 36.248339776699076, + "end_time": 37.339677645179805, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--28/temp/line_7_B.wav", + "silence_duration": 0.3199061495109927, + "is_interrupted": false + } + ] + }, + "DialogSum--val--29": { + "original_text": "A: Do you know anything about health food?\nB: It is so popular among people to preserve health now, so I read some books about health food and learned about various nutritional benefits and preparation methods.\nA: Can you give me some examples?\nB: Drinking warm and fresh water in the morning on wakening up is one of [interrupt] the simplest yet effective practices for maintaining good health as it helps kickstart your metabolism and flush out toxins accumulated overnight.\nA: Wait, why specifically warm water? I've always heard about drinking water in the morning, but why does the temperature matter?\nB: Warm water can be good for your stomach, which is empty at that moment. And freshness can keep the water active to clean your digestive system. I was also going to mention yogurt [interrupt] as another beneficial food that supports gut health and boosts immunity through its probiotic content and essential nutrients that aid in digestion and nutrient absorption.\nA: Oh, yogurt! I've heard it's great for digestion. But what makes it so special compared to other dairy products?\nB: Yogurt has protein, vitamins, and it's acidic. If you drink it every day, your stomach will be more comfortable, and it can also help balance the gut flora, which is essential for overall health and can even improve mental wellbeing through the gut-brain connection.", + "cleaned_text": "A: Do you know anything about health food?\nB: It is so popular among people to preserve health now, so I read some books about health food and learned about various nutritional benefits and preparation methods.\nA: Can you give me some examples?\nB:Drinking warm and fresh water in the morning on wakening up is one of the simplest yet effective practices for maintaining good health as it helps kickstart your metabolism and flush out toxins accumulated overnight.\nA: Wait, why specifically warm water? I've always heard about drinking water in the morning, but why does the temperature matter?\nB:Warm water can be good for your stomach, which is empty at that moment. And freshness can keep the water active to clean your digestive system. I was also going to mention yogurt as another beneficial food that supports gut health and boosts immunity through its probiotic content and essential nutrients that aid in digestion and nutrient absorption.\nA: Oh, yogurt! I've heard it's great for digestion. But what makes it so special compared to other dairy products?\nB: Yogurt has protein, vitamins, and it's acidic. If you drink it every day, your stomach will be more comfortable, and it can also help balance the gut flora, which is essential for overall health and can even improve mental wellbeing through the gut-brain connection.", + "total_duration": 62.695736961451246, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you know anything about health food?", + "original_text": "Do you know anything about health food?", + "start_time": 0, + "end_time": 2.0317460317460316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It is so popular among people to preserve health now, so I read some books about health food and learned about various nutritional benefits and preparation methods.", + "original_text": "It is so popular among people to preserve health now, so I read some books about health food and learned about various nutritional benefits and preparation methods.", + "start_time": 2.4067624238589795, + "end_time": 10.940095757192314, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_1_B.wav", + "silence_duration": 0.3750163921129481, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can you give me some examples?", + "original_text": "Can you give me some examples?", + "start_time": 11.358827002869516, + "end_time": 13.08871362418471, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_2_A.wav", + "silence_duration": 0.4187312456772015, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Drinking warm and fresh water in the morning on wakening up is one of", + "original_text": "Drinking warm and fresh water in the morning on wakening up is one of [interrupt] the simplest yet effective practices for maintaining good health as it helps kickstart your metabolism and flush out toxins accumulated overnight.", + "start_time": 13.494716110092993, + "end_time": 25.17435329830161, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_3_B.wav", + "silence_duration": 0.406002485908284, + "is_interrupted": true, + "text_after_interrupt": "the simplest yet effective practices for maintaining good health as it helps kickstart your metabolism and flush out toxins accumulated overnight." + }, + { + "speaker": "A", + "text": "Wait, why specifically warm water? I've always heard about drinking water in the morning, but why does the temperature matter?", + "original_text": "Wait, why specifically warm water? I've always heard about drinking water in the morning, but why does the temperature matter?", + "start_time": 17.56981815090932, + "end_time": 25.185963275625873, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_4_A.wav", + "silence_duration": 0.48920011313051615, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Warm water can be good for your stomach, which is empty at that moment. And freshness can keep the water active to clean your digestive system. I was also going to mention yogurt", + "original_text": "Warm water can be good for your stomach, which is empty at that moment. And freshness can keep the water active to clean your digestive system. I was also going to mention yogurt [interrupt] as another beneficial food that supports gut health and boosts immunity through its probiotic content and essential nutrients that aid in digestion and nutrient absorption.", + "start_time": 25.677377039126732, + "end_time": 43.48708225454624, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_5_B.wav", + "silence_duration": 0.4914137635008584, + "is_interrupted": true, + "text_after_interrupt": "as another beneficial food that supports gut health and boosts immunity through its probiotic content and essential nutrients that aid in digestion and nutrient absorption." + }, + { + "speaker": "A", + "text": "Oh, yogurt! I've heard it's great for digestion. But what makes it so special compared to other dairy products?", + "original_text": "Oh, yogurt! I've heard it's great for digestion. But what makes it so special compared to other dairy products?", + "start_time": 42.539483527501304, + "end_time": 48.91336107852171, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_6_A.wav", + "silence_duration": 0.4540977020256022, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yogurt has protein, vitamins, and it's acidic. If you drink it every day, your stomach will be more comfortable, and it can also help balance the gut flora, which is essential for overall health and can even improve mental wellbeing through the gut-brain connection.", + "original_text": "Yogurt has protein, vitamins, and it's acidic. If you drink it every day, your stomach will be more comfortable, and it can also help balance the gut flora, which is essential for overall health and can even improve mental wellbeing through the gut-brain connection.", + "start_time": 49.32104819670262, + "end_time": 62.695742074253644, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--29/temp/line_7_B.wav", + "silence_duration": 0.4076871181809073, + "is_interrupted": false + } + ] + }, + "DialogSum--val--30": { + "original_text": "A: The bridegroom looks a bit nervous. \nB: On this occasion, most people do. \nA: Oh, they are playing the wedding March. Here they [interrupt] come, walking down the aisle together with such grace and poise despite the obvious emotions of the moment. \nB: She is a beautiful bride, isn't she? \nA: Yes, she is. I am so happy for them. \nB: Are you crying? \nA: Yes, I always cry at weddings. Harris and Anne are perfect for each other, and it's just so touching to see them finally tie the knot. \nB: You know, Harris mentioned something about their honeymoon plans. Did you hear where they're going? \nA: I didn't catch that. But yes, Harris and Anne are perfect for each other. \nB: Yes, they are. \nA: You and Tom also make a great couple. \nB: In fact, we are beginning to make preparations. \nA: For the wedding?", + "cleaned_text": "A: The bridegroom looks a bit nervous. \nB: On this occasion, most people do. \nA:Oh, they are playing the wedding March. Here they come, walking down the aisle together with such grace and poise despite the obvious emotions of the moment.\nB: She is a beautiful bride, isn't she? \nA: Yes, she is. I am so happy for them. \nB: Are you crying? \nA: Yes, I always cry at weddings. Harris and Anne are perfect for each other, and it's just so touching to see them finally tie the knot. \nB: You know, Harris mentioned something about their honeymoon plans. Did you hear where they're going? \nA: I didn't catch that. But yes, Harris and Anne are perfect for each other. \nB: Yes, they are. \nA: You and Tom also make a great couple. \nB: In fact, we are beginning to make preparations. \nA: For the wedding?", + "total_duration": 44.989342403628115, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The bridegroom looks a bit nervous.", + "original_text": "The bridegroom looks a bit nervous.", + "start_time": 0, + "end_time": 1.9969160997732427, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "On this occasion, most people do.", + "original_text": "On this occasion, most people do.", + "start_time": 2.352948362504943, + "end_time": 4.048005051847347, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_1_B.wav", + "silence_duration": 0.3560322627317003, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, they are playing the wedding March. Here they", + "original_text": "Oh, they are playing the wedding March. Here they [interrupt] come, walking down the aisle together with such grace and poise despite the obvious emotions of the moment.", + "start_time": 4.409173262359543, + "end_time": 13.766814985715552, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_2_A.wav", + "silence_duration": 0.36116821051219616, + "is_interrupted": true, + "text_after_interrupt": "come, walking down the aisle together with such grace and poise despite the obvious emotions of the moment." + }, + { + "speaker": "B", + "text": "She is a beautiful bride, isn't she?", + "original_text": "She is a beautiful bride, isn't she?", + "start_time": 6.9285383417246225, + "end_time": 8.681644917688342, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_3_B.wav", + "silence_duration": 0.30713854792213785, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, she is. I am so happy for them.", + "original_text": "Yes, she is. I am so happy for them.", + "start_time": 14.312794298079375, + "end_time": 16.866989309417242, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_4_A.wav", + "silence_duration": 0.5459793123638237, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Are you crying?", + "original_text": "Are you crying?", + "start_time": 17.334988272621306, + "end_time": 18.22895652658956, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_5_B.wav", + "silence_duration": 0.4679989632040641, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I always cry at weddings. Harris and Anne are perfect for each other, and it's just so touching to see them finally tie the knot.", + "original_text": "Yes, I always cry at weddings. Harris and Anne are perfect for each other, and it's just so touching to see them finally tie the knot.", + "start_time": 18.784185544959158, + "end_time": 26.899559694619022, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_6_A.wav", + "silence_duration": 0.5552290183695974, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You know, Harris mentioned something about their honeymoon plans. Did you hear where they're going?", + "original_text": "You know, Harris mentioned something about their honeymoon plans. Did you hear where they're going?", + "start_time": 27.34769686565487, + "end_time": 31.724658316902037, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_7_B.wav", + "silence_duration": 0.4481371710358486, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I didn't catch that. But yes, Harris and Anne are perfect for each other.", + "original_text": "I didn't catch that. But yes, Harris and Anne are perfect for each other.", + "start_time": 32.274734398552255, + "end_time": 36.88389539628468, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_8_A.wav", + "silence_duration": 0.5500760816502145, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, they are.", + "original_text": "Yes, they are.", + "start_time": 37.35120030328594, + "end_time": 38.21033862528141, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_9_B.wav", + "silence_duration": 0.4673049070012617, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You and Tom also make a great couple.", + "original_text": "You and Tom also make a great couple.", + "start_time": 38.59331515698206, + "end_time": 40.78760087126777, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_10_A.wav", + "silence_duration": 0.38297653170065143, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "In fact, we are beginning to make preparations.", + "original_text": "In fact, we are beginning to make preparations.", + "start_time": 41.25375246570231, + "end_time": 43.61057786252771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_11_B.wav", + "silence_duration": 0.46615159443453896, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "For the wedding?", + "original_text": "For the wedding?", + "start_time": 44.199877494173855, + "end_time": 44.98935595222374, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--30/temp/line_12_A.wav", + "silence_duration": 0.5892996316461445, + "is_interrupted": false + } + ] + }, + "DialogSum--val--31": { + "original_text": "A: We've been cramming for tomorrow's history exam since early this morning. What do you say we take a break and listen to some music, okay? \nB: Now that you mention it, I'm getting a little bummed-out from studying nonstop, too. Listening to some music for a while would [interrupt] definitely help us unwind a bit before diving back into the books, especially since we've been at this for hours and our brains need some time to process all this information. \nA: Sorry to cut in, but do you think taking a break now might mess up our momentum? I mean, we still have a lot of material to cover. \nB: I get what you're saying, but I think a short break could actually help us recharge. While you're picking out a record to play, I'll grab a couple of beers out of the refrigerator. \nA: You sure have a lot of discs here. \nB: Yeah, I've got everything from rock n'roll to the latest new - wave stuff. \nA: To tell you the truth, I'm strictly into classical music. You don't happen to have any Bach or Mozart, do you? \nB: Sorry, my taste in music doesn't go back any further than the 1960's. Music written before then is just history to me. \nA: Speaking of history, you mentioned taking a break earlier, but do you think we should get back to the books soon? We've got an exam tomorrow, remember?", + "cleaned_text": "A: We've been cramming for tomorrow's history exam since early this morning. What do you say we take a break and listen to some music, okay? \nB:Now that you mention it, I'm getting a little bummed-out from studying nonstop, too. Listening to some music for a while would definitely help us unwind a bit before diving back into the books, especially since we've been at this for hours and our brains need some time to process all this information.\nA: Sorry to cut in, but do you think taking a break now might mess up our momentum? I mean, we still have a lot of material to cover. \nB: I get what you're saying, but I think a short break could actually help us recharge. While you're picking out a record to play, I'll grab a couple of beers out of the refrigerator. \nA: You sure have a lot of discs here. \nB: Yeah, I've got everything from rock n'roll to the latest new - wave stuff. \nA: To tell you the truth, I'm strictly into classical music. You don't happen to have any Bach or Mozart, do you? \nB: Sorry, my taste in music doesn't go back any further than the 1960's. Music written before then is just history to me. \nA: Speaking of history, you mentioned taking a break earlier, but do you think we should get back to the books soon? We've got an exam tomorrow, remember?", + "total_duration": 61.76947845804989, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "We've been cramming for tomorrow's history exam since early this morning. What do you say we take a break and listen to some music, okay?", + "original_text": "We've been cramming for tomorrow's history exam since early this morning. What do you say we take a break and listen to some music, okay?", + "start_time": 0, + "end_time": 7.75546485260771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Now that you mention it, I'm getting a little bummed-out from studying nonstop, too. Listening to some music for a while would", + "original_text": "Now that you mention it, I'm getting a little bummed-out from studying nonstop, too. Listening to some music for a while would [interrupt] definitely help us unwind a bit before diving back into the books, especially since we've been at this for hours and our brains need some time to process all this information.", + "start_time": 8.220292300061768, + "end_time": 22.814033796660407, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_1_B.wav", + "silence_duration": 0.464827447454058, + "is_interrupted": true, + "text_after_interrupt": "definitely help us unwind a bit before diving back into the books, especially since we've been at this for hours and our brains need some time to process all this information." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but do you think taking a break now might mess up our momentum? I mean, we still have a lot of material to cover.", + "original_text": "Sorry to cut in, but do you think taking a break now might mess up our momentum? I mean, we still have a lot of material to cover.", + "start_time": 14.512900009812334, + "end_time": 22.686324046093514, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_2_A.wav", + "silence_duration": 0.5826149540711384, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I get what you're saying, but I think a short break could actually help us recharge. While you're picking out a record to play, I'll grab a couple of beers out of the refrigerator.", + "original_text": "I get what you're saying, but I think a short break could actually help us recharge. While you're picking out a record to play, I'll grab a couple of beers out of the refrigerator.", + "start_time": 23.251854379084616, + "end_time": 31.78518771241795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_3_B.wav", + "silence_duration": 0.4378205824242102, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You sure have a lot of discs here.", + "original_text": "You sure have a lot of discs here.", + "start_time": 32.29813036964989, + "end_time": 34.236996582801815, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_4_A.wav", + "silence_duration": 0.512942657231936, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I've got everything from rock n'roll to the latest new - wave stuff.", + "original_text": "Yeah, I've got everything from rock n'roll to the latest new - wave stuff.", + "start_time": 34.55113366092989, + "end_time": 38.52174590582785, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_5_B.wav", + "silence_duration": 0.31413707812807795, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "To tell you the truth, I'm strictly into classical music. You don't happen to have any Bach or Mozart, do you?", + "original_text": "To tell you the truth, I'm strictly into classical music. You don't happen to have any Bach or Mozart, do you?", + "start_time": 38.99915039580369, + "end_time": 45.477517742742464, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_6_A.wav", + "silence_duration": 0.47740448997583806, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry, my taste in music doesn't go back any further than the 1960's. Music written before then is just history to me.", + "original_text": "Sorry, my taste in music doesn't go back any further than the 1960's. Music written before then is just history to me.", + "start_time": 45.97036776101941, + "end_time": 52.90152422360445, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_7_B.wav", + "silence_duration": 0.4928500182769463, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Speaking of history, you mentioned taking a break earlier, but do you think we should get back to the books soon? We've got an exam tomorrow, remember?", + "original_text": "Speaking of history, you mentioned taking a break earlier, but do you think we should get back to the books soon? We've got an exam tomorrow, remember?", + "start_time": 53.375482086646656, + "end_time": 61.76949569208883, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--31/temp/line_8_A.wav", + "silence_duration": 0.473957863042211, + "is_interrupted": false + } + ] + }, + "DialogSum--val--32": { + "original_text": "A: Excuse me. Have you got any books on genetic engineering? I've looked for them everywhere, but I can't find [interrupt] any in the usual sections, and I'm starting to wonder if they're out of stock or if they've been moved to a different location entirely. \nB: Sorry to interrupt, but did you check the new arrivals section? Sometimes we place popular topics like genetic engineering there because they tend to attract more attention when displayed prominently. \nA: I haven't checked there yet. But if they're not there, could you tell me if you've got any on this shelf? \nB: I'm not sure if we've got any now. Books of that kind are on this shelf. Well, I'm afraid we've sold [interrupt] most of them recently because they're in high demand among university students and researchers working on cutting-edge biotechnology projects. \nA: Oh, that's disappointing! But just to clarify, do you usually restock these books regularly? \nB: Yes, we do. Come some time next week if you like. I think we'll have got some by then as our new shipment is expected to arrive within the next few days.", + "cleaned_text": "A:Excuse me. Have you got any books on genetic engineering? I've looked for them everywhere, but I can't find any in the usual sections, and I'm starting to wonder if they're out of stock or if they've been moved to a different location entirely.\nB: Sorry to interrupt, but did you check the new arrivals section? Sometimes we place popular topics like genetic engineering there because they tend to attract more attention when displayed prominently. \nA: I haven't checked there yet. But if they're not there, could you tell me if you've got any on this shelf? \nB:I'm not sure if we've got any now. Books of that kind are on this shelf. Well, I'm afraid we've sold most of them recently because they're in high demand among university students and researchers working on cutting-edge biotechnology projects.\nA: Oh, that's disappointing! But just to clarify, do you usually restock these books regularly? \nB: Yes, we do. Come some time next week if you like. I think we'll have got some by then as our new shipment is expected to arrive within the next few days.", + "total_duration": 50.88775510204081, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. Have you got any books on genetic engineering? I've looked for them everywhere, but I can't find", + "original_text": "Excuse me. Have you got any books on genetic engineering? I've looked for them everywhere, but I can't find [interrupt] any in the usual sections, and I'm starting to wonder if they're out of stock or if they've been moved to a different location entirely.", + "start_time": 0, + "end_time": 14.373151927437641, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "any in the usual sections, and I'm starting to wonder if they're out of stock or if they've been moved to a different location entirely." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but did you check the new arrivals section? Sometimes we place popular topics like genetic engineering there because they tend to attract more attention when displayed prominently.", + "original_text": "Sorry to interrupt, but did you check the new arrivals section? Sometimes we place popular topics like genetic engineering there because they tend to attract more attention when displayed prominently.", + "start_time": 6.873106575963718, + "end_time": 16.92734693877551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/temp/line_1_B.wav", + "silence_duration": 0.5689115342670511, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I haven't checked there yet. But if they're not there, could you tell me if you've got any on this shelf?", + "original_text": "I haven't checked there yet. But if they're not there, could you tell me if you've got any on this shelf?", + "start_time": 17.52728706286393, + "end_time": 23.204565974428554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/temp/line_2_A.wav", + "silence_duration": 0.5999401240884199, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm not sure if we've got any now. Books of that kind are on this shelf. Well, I'm afraid we've sold", + "original_text": "I'm not sure if we've got any now. Books of that kind are on this shelf. Well, I'm afraid we've sold [interrupt] most of them recently because they're in high demand among university students and researchers working on cutting-edge biotechnology projects.", + "start_time": 23.608516485806177, + "end_time": 36.18212192798305, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/temp/line_3_B.wav", + "silence_duration": 0.4039505113776219, + "is_interrupted": true, + "text_after_interrupt": "most of them recently because they're in high demand among university students and researchers working on cutting-edge biotechnology projects." + }, + { + "speaker": "A", + "text": "Oh, that's disappointing! But just to clarify, do you usually restock these books regularly?", + "original_text": "Oh, that's disappointing! But just to clarify, do you usually restock these books regularly?", + "start_time": 37.15949570450177, + "end_time": 43.09219411720019, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/temp/line_4_A.wav", + "silence_duration": 0.5051156987174228, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, we do. Come some time next week if you like. I think we'll have got some by then as our new shipment is expected to arrive within the next few days.", + "original_text": "Yes, we do. Come some time next week if you like. I think we'll have got some by then as our new shipment is expected to arrive within the next few days.", + "start_time": 43.596700044626026, + "end_time": 50.88776580426321, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--32/temp/line_5_B.wav", + "silence_duration": 0.5045059274258404, + "is_interrupted": false + } + ] + }, + "DialogSum--val--33": { + "original_text": "A: Excuse me. Does this bus go to the National Library of China? \nB: Yes, there are three stops [interrupt] before you get there, so it won't take too long. The first one is at the shopping district, then the city park, and finally the library stop which has a distinctive red brick building right across from it. \nA: Oh, great! How long is the ride? \nB: Well, you will get there in about a quarter of an hour if the traffic isn't too congested, but usually, at this time, it's quite clear. \nA: Sorry to cut in, but could you also let me know when we get to the stop? I'm a stranger here. \nB: Sure, madam. I'll remind you. By the way, I was about to say, the traffic isn't too heavy around this time, so it should be a smooth ride.", + "cleaned_text": "A: Excuse me. Does this bus go to the National Library of China? \nB:Yes, there are three stops before you get there, so it won't take too long. The first one is at the shopping district, then the city park, and finally the library stop which has a distinctive red brick building right across from it.\nA: Oh, great! How long is the ride? \nB: Well, you will get there in about a quarter of an hour if the traffic isn't too congested, but usually, at this time, it's quite clear. \nA: Sorry to cut in, but could you also let me know when we get to the stop? I'm a stranger here. \nB: Sure, madam. I'll remind you. By the way, I was about to say, the traffic isn't too heavy around this time, so it should be a smooth ride.", + "total_duration": 37.31301587301587, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. Does this bus go to the National Library of China?", + "original_text": "Excuse me. Does this bus go to the National Library of China?", + "start_time": 0, + "end_time": 3.657142857142857, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, there are three stops", + "original_text": "Yes, there are three stops [interrupt] before you get there, so it won't take too long. The first one is at the shopping district, then the city park, and finally the library stop which has a distinctive red brick building right across from it.", + "start_time": 4.20295332342336, + "end_time": 15.673610919795243, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/temp/line_1_B.wav", + "silence_duration": 0.5458104662805028, + "is_interrupted": true, + "text_after_interrupt": "before you get there, so it won't take too long. The first one is at the shopping district, then the city park, and finally the library stop which has a distinctive red brick building right across from it." + }, + { + "speaker": "A", + "text": "Oh, great! How long is the ride?", + "original_text": "Oh, great! How long is the ride?", + "start_time": 5.6193705569834504, + "end_time": 7.98780593113311, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/temp/line_2_A.wav", + "silence_duration": 0.43083118438249, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, you will get there in about a quarter of an hour if the traffic isn't too congested, but usually, at this time, it's quite clear.", + "original_text": "Well, you will get there in about a quarter of an hour if the traffic isn't too congested, but usually, at this time, it's quite clear.", + "start_time": 16.192835152186188, + "end_time": 22.72925238574628, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/temp/line_3_B.wav", + "silence_duration": 0.5192242323909443, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry to cut in, but could you also let me know when we get to the stop? I'm a stranger here.", + "original_text": "Sorry to cut in, but could you also let me know when we get to the stop? I'm a stranger here.", + "start_time": 23.158476791032143, + "end_time": 29.474304455431238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/temp/line_4_A.wav", + "silence_duration": 0.4292244052858639, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, madam. I'll remind you. By the way, I was about to say, the traffic isn't too heavy around this time, so it should be a smooth ride.", + "original_text": "Sure, madam. I'll remind you. By the way, I was about to say, the traffic isn't too heavy around this time, so it should be a smooth ride.", + "start_time": 30.05680628280339, + "end_time": 37.31304211046779, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--33/temp/line_5_B.wav", + "silence_duration": 0.582501827372151, + "is_interrupted": false + } + ] + }, + "DialogSum--val--35": { + "original_text": "A: Good afternoon, Dr. Anderson's office. \nB: Hello, my name is John Keat, and I was hoping I could come in today to see the doctor. \nA: Are you a patient of Dr. Anderson? \nB: Well, no. I'm at a convention from Mexico and the manager of the hotel where I'm staying suggested that I [interrupt] visit your office because of Dr. Anderson's reputation for treating ear-related issues, particularly his innovative approaches to tinnitus and other auditory disorders that many other specialists struggle with. \nA: Sorry to jump in, but just to clarify, are you experiencing something urgent that needs immediate attention? \nB: Yes, actually. I've got this ringing in my ears. It's so terrible that I can hardly hear people talking now. \nA: Are you in any pain or is there any fluid? \nB: No discharge, just a slight earache. \nA: Does the pain happen all the time, or once in a while? \nB: It has been aching for two days and it's never stopped. I thought it might be due to my flying in the air, and after some rest it'll be all gone. But who knows it's getting worse. I need to see the doctor. \nA: The doctor will be busy at the hospital until this evening. The earliest you could see him would be tomorrow morning at ten. \nB: The time is good for me. I'll come in then if that's okay. Oh, and about what I was saying earlier—the hotel manager suggested I call your office because of Dr. Anderson's expertise.", + "cleaned_text": "A: Good afternoon, Dr. Anderson's office. \nB: Hello, my name is John Keat, and I was hoping I could come in today to see the doctor. \nA: Are you a patient of Dr. Anderson? \nB:Well, no. I'm at a convention from Mexico and the manager of the hotel where I'm staying suggested that I visit your office because of Dr. Anderson's reputation for treating ear-related issues, particularly his innovative approaches to tinnitus and other auditory disorders that many other specialists struggle with.\nA: Sorry to jump in, but just to clarify, are you experiencing something urgent that needs immediate attention? \nB: Yes, actually. I've got this ringing in my ears. It's so terrible that I can hardly hear people talking now. \nA: Are you in any pain or is there any fluid? \nB: No discharge, just a slight earache. \nA: Does the pain happen all the time, or once in a while? \nB: It has been aching for two days and it's never stopped. I thought it might be due to my flying in the air, and after some rest it'll be all gone. But who knows it's getting worse. I need to see the doctor. \nA: The doctor will be busy at the hospital until this evening. The earliest you could see him would be tomorrow morning at ten. \nB: The time is good for me. I'll come in then if that's okay. Oh, and about what I was saying earlier—the hotel manager suggested I call your office because of Dr. Anderson's expertise.", + "total_duration": 72.12390022675737, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good afternoon, Dr. Anderson's office.", + "original_text": "Good afternoon, Dr. Anderson's office.", + "start_time": 0, + "end_time": 2.8908843537414968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hello, my name is John Keat, and I was hoping I could come in today to see the doctor.", + "original_text": "Hello, my name is John Keat, and I was hoping I could come in today to see the doctor.", + "start_time": 3.345963366329001, + "end_time": 8.280203729140792, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_1_B.wav", + "silence_duration": 0.45507901258750416, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you a patient of Dr. Anderson?", + "original_text": "Are you a patient of Dr. Anderson?", + "start_time": 8.709140289435396, + "end_time": 10.740886321181428, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_2_A.wav", + "silence_duration": 0.42893656029460375, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, no. I'm at a convention from Mexico and the manager of the hotel where I'm staying suggested that I", + "original_text": "Well, no. I'm at a convention from Mexico and the manager of the hotel where I'm staying suggested that I [interrupt] visit your office because of Dr. Anderson's reputation for treating ear-related issues, particularly his innovative approaches to tinnitus and other auditory disorders that many other specialists struggle with.", + "start_time": 11.111150215447726, + "end_time": 27.70180781181961, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_3_B.wav", + "silence_duration": 0.3702638942662988, + "is_interrupted": true, + "text_after_interrupt": "visit your office because of Dr. Anderson's reputation for treating ear-related issues, particularly his innovative approaches to tinnitus and other auditory disorders that many other specialists struggle with." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but just to clarify, are you experiencing something urgent that needs immediate attention?", + "original_text": "Sorry to jump in, but just to clarify, are you experiencing something urgent that needs immediate attention?", + "start_time": 16.660719376445456, + "end_time": 23.231966541978338, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_4_A.wav", + "silence_duration": 0.5774263870010232, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, actually. I've got this ringing in my ears. It's so terrible that I can hardly hear people talking now.", + "original_text": "Yes, actually. I've got this ringing in my ears. It's so terrible that I can hardly hear people talking now.", + "start_time": 28.060040828724194, + "end_time": 33.830199558882924, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_5_B.wav", + "silence_duration": 0.358233016904586, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you in any pain or is there any fluid?", + "original_text": "Are you in any pain or is there any fluid?", + "start_time": 34.27674049198228, + "end_time": 37.49270421080314, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_6_A.wav", + "silence_duration": 0.4465409330993539, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No discharge, just a slight earache.", + "original_text": "No discharge, just a slight earache.", + "start_time": 37.81693759612685, + "end_time": 40.33630267549193, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_7_B.wav", + "silence_duration": 0.32423338532371104, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Does the pain happen all the time, or once in a while?", + "original_text": "Does the pain happen all the time, or once in a while?", + "start_time": 40.67315966801724, + "end_time": 44.132932910647625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_8_A.wav", + "silence_duration": 0.33685699252531476, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It has been aching for two days and it's never stopped. I thought it might be due to my flying in the air, and after some rest it'll be all gone. But who knows it's getting worse. I need to see the doctor.", + "original_text": "It has been aching for two days and it's never stopped. I thought it might be due to my flying in the air, and after some rest it'll be all gone. But who knows it's getting worse. I need to see the doctor.", + "start_time": 44.50365495299721, + "end_time": 54.25603590537816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_9_B.wav", + "silence_duration": 0.3707220423495823, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The doctor will be busy at the hospital until this evening. The earliest you could see him would be tomorrow morning at ten.", + "original_text": "The doctor will be busy at the hospital until this evening. The earliest you could see him would be tomorrow morning at ten.", + "start_time": 54.56314370364475, + "end_time": 61.48269018890552, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_10_A.wav", + "silence_duration": 0.30710779826658696, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The time is good for me. I'll come in then if that's okay. Oh, and about what I was saying earlier—the hotel manager suggested I call your office because of Dr. Anderson's expertise.", + "original_text": "The time is good for me. I'll come in then if that's okay. Oh, and about what I was saying earlier—the hotel manager suggested I call your office because of Dr. Anderson's expertise.", + "start_time": 61.98843494290497, + "end_time": 72.12394514698661, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--35/temp/line_11_B.wav", + "silence_duration": 0.5057447539994502, + "is_interrupted": false + } + ] + }, + "DialogSum--val--36": { + "original_text": "A: The hike will last for 2 hours. We'll start at sea level and then climb up a few hills. Are you sure you're prepared for the elevation change? It can be a bit challenging if you're not used to it.\nB: Ready? Absolutely! The one-hour yoga class this morning really made me full of energy. I'm feeling so good. I bet I can race you up those hills.\nA: That won't be necessary. We want to take our time to enjoy the sights along the way. We'll point out certain plants, some of the insects, and [interrupt] even talk about the local wildlife including birds, small mammals, and reptiles, but don't worry, we'll keep an eye out for anything unusual while making sure everyone stays safe and comfortable throughout the journey.\nB: Wait, did you say something about snakes? Uh, I definitely will be racing you up the hill!", + "cleaned_text": "A: The hike will last for 2 hours. We'll start at sea level and then climb up a few hills. Are you sure you're prepared for the elevation change? It can be a bit challenging if you're not used to it.\nB: Ready? Absolutely! The one-hour yoga class this morning really made me full of energy. I'm feeling so good. I bet I can race you up those hills.\nA:That won't be necessary. We want to take our time to enjoy the sights along the way. We'll point out certain plants, some of the insects, and even talk about the local wildlife including birds, small mammals, and reptiles, but don't worry, we'll keep an eye out for anything unusual while making sure everyone stays safe and comfortable throughout the journey.\nB: Wait, did you say something about snakes? Uh, I definitely will be racing you up the hill!", + "total_duration": 33.91061224489796, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--36/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--36/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--36/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The hike will last for 2 hours. We'll start at sea level and then climb up a few hills. Are you sure you're prepared for the elevation change? It can be a bit challenging if you're not used to it.", + "original_text": "The hike will last for 2 hours. We'll start at sea level and then climb up a few hills. Are you sure you're prepared for the elevation change? It can be a bit challenging if you're not used to it.", + "start_time": 0, + "end_time": 11.38938775510204, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--36/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ready? Absolutely! The one-hour yoga class this morning really made me full of energy. I'm feeling so good. I bet I can race you up those hills.", + "original_text": "Ready? Absolutely! The one-hour yoga class this morning really made me full of energy. I'm feeling so good. I bet I can race you up those hills.", + "start_time": 11.900056197897532, + "end_time": 19.818060733044923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--36/temp/line_1_B.wav", + "silence_duration": 0.5106684427954917, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That won't be necessary. We want to take our time to enjoy the sights along the way. We'll point out certain plants, some of the insects, and", + "original_text": "That won't be necessary. We want to take our time to enjoy the sights along the way. We'll point out certain plants, some of the insects, and [interrupt] even talk about the local wildlife including birds, small mammals, and reptiles, but don't worry, we'll keep an eye out for anything unusual while making sure everyone stays safe and comfortable throughout the journey.", + "start_time": 20.245687968802475, + "end_time": 40.73729794612674, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--36/temp/line_2_A.wav", + "silence_duration": 0.4276272357575511, + "is_interrupted": true, + "text_after_interrupt": "even talk about the local wildlife including birds, small mammals, and reptiles, but don't worry, we'll keep an eye out for anything unusual while making sure everyone stays safe and comfortable throughout the journey." + }, + { + "speaker": "B", + "text": "Wait, did you say something about snakes? Uh, I definitely will be racing you up the hill!", + "original_text": "Wait, did you say something about snakes? Uh, I definitely will be racing you up the hill!", + "start_time": 29.034440803269597, + "end_time": 33.91063127946008, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--36/temp/line_3_B.wav", + "silence_duration": 0.3251286523422243, + "is_interrupted": false + } + ] + }, + "DialogSum--val--37": { + "original_text": "A: Anne, thanks so much for introducing me to Caroline! Our first date went so well. I'm so excited to be in love right [interrupt] now, it feels like everything just clicked between us and I can't stop thinking about her beautiful smile and the way she laughs at my jokes.\nB: Sorry to interrupt, but just to clarify, are you sure it wasn't just the excitement of the first date? Sometimes it takes a bit longer to really know someone.\nA: I get that, but I really feel like we connected on a deeper level. I even want to climb the highest mountain and shout, Caroline, will you marry [interrupt] me someday, but I know I need to be patient and let things develop naturally over time while we explore our shared interests and values.\nB: Wow, you'd better not. Before you ask her to marry you, maybe you should ask her out on a second date. Only one date is not enough for you to know each other well.\nA: You're right, I should definitely take it slow. But did I mention how amazing our first date was? It felt like we had known each other forever.", + "cleaned_text": "A:Anne, thanks so much for introducing me to Caroline! Our first date went so well. I'm so excited to be in love right now, it feels like everything just clicked between us and I can't stop thinking about her beautiful smile and the way she laughs at my jokes.\nB: Sorry to interrupt, but just to clarify, are you sure it wasn't just the excitement of the first date? Sometimes it takes a bit longer to really know someone.\nA:I get that, but I really feel like we connected on a deeper level. I even want to climb the highest mountain and shout, Caroline, will you marry me someday, but I know I need to be patient and let things develop naturally over time while we explore our shared interests and values.\nB: Wow, you'd better not. Before you ask her to marry you, maybe you should ask her out on a second date. Only one date is not enough for you to know each other well.\nA: You're right, I should definitely take it slow. But did I mention how amazing our first date was? It felt like we had known each other forever.", + "total_duration": 50.83555555555556, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Anne, thanks so much for introducing me to Caroline! Our first date went so well. I'm so excited to be in love right", + "original_text": "Anne, thanks so much for introducing me to Caroline! Our first date went so well. I'm so excited to be in love right [interrupt] now, it feels like everything just clicked between us and I can't stop thinking about her beautiful smile and the way she laughs at my jokes.", + "start_time": 0, + "end_time": 15.534149659863946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "now, it feels like everything just clicked between us and I can't stop thinking about her beautiful smile and the way she laughs at my jokes." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but just to clarify, are you sure it wasn't just the excitement of the first date? Sometimes it takes a bit longer to really know someone.", + "original_text": "Sorry to interrupt, but just to clarify, are you sure it wasn't just the excitement of the first date? Sometimes it takes a bit longer to really know someone.", + "start_time": 7.233015873015873, + "end_time": 15.348390022675737, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/temp/line_1_B.wav", + "silence_duration": 0.46592863051738964, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I get that, but I really feel like we connected on a deeper level. I even want to climb the highest mountain and shout, Caroline, will you marry", + "original_text": "I get that, but I really feel like we connected on a deeper level. I even want to climb the highest mountain and shout, Caroline, will you marry [interrupt] me someday, but I know I need to be patient and let things develop naturally over time while we explore our shared interests and values.", + "start_time": 15.985416851743429, + "end_time": 33.48165267940783, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/temp/line_2_A.wav", + "silence_duration": 0.45126719187948283, + "is_interrupted": true, + "text_after_interrupt": "me someday, but I know I need to be patient and let things develop naturally over time while we explore our shared interests and values." + }, + { + "speaker": "B", + "text": "Wow, you'd better not. Before you ask her to marry you, maybe you should ask her out on a second date. Only one date is not enough for you to know each other well.", + "original_text": "Wow, you'd better not. Before you ask her to marry you, maybe you should ask her out on a second date. Only one date is not enough for you to know each other well.", + "start_time": 33.75724698138683, + "end_time": 41.930671017668004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/temp/line_3_B.wav", + "silence_duration": 0.30978769092873754, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're right, I should definitely take it slow. But did I mention how amazing our first date was? It felt like we had known each other forever.", + "original_text": "You're right, I should definitely take it slow. But did I mention how amazing our first date was? It felt like we had known each other forever.", + "start_time": 42.25579267605772, + "end_time": 50.83556591868811, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--37/temp/line_4_A.wav", + "silence_duration": 0.32512165838972235, + "is_interrupted": false + } + ] + }, + "DialogSum--val--38": { + "original_text": "A: Can I help you? \nB: Yes. Are there any spare rooms here? \nA: Would you be interested in a three-bedroom flat? I have a few [interrupt] smaller units available if you're looking for something cozier, including some lovely studio apartments with modern amenities and great natural lighting that might suit your needs perfectly. \nB: Sorry to cut in, but three bedrooms might be too much for me. Do you have anything smaller? \nA: I understand. We do have some smaller options. But you mentioned you don't have much furniture—did you want to discuss any furnished options? \nB: Oh, I hadn't thought about that. A furnished place could be convenient. What do you have available?", + "cleaned_text": "A: Can I help you? \nB: Yes. Are there any spare rooms here? \nA:Would you be interested in a three-bedroom flat? I have a few smaller units available if you're looking for something cozier, including some lovely studio apartments with modern amenities and great natural lighting that might suit your needs perfectly.\nB: Sorry to cut in, but three bedrooms might be too much for me. Do you have anything smaller? \nA: I understand. We do have some smaller options. But you mentioned you don't have much furniture—did you want to discuss any furnished options? \nB: Oh, I hadn't thought about that. A furnished place could be convenient. What do you have available?", + "total_duration": 33.82507936507937, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can I help you?", + "original_text": "Can I help you?", + "start_time": 0, + "end_time": 0.8707482993197279, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. Are there any spare rooms here?", + "original_text": "Yes. Are there any spare rooms here?", + "start_time": 1.3664179224311492, + "end_time": 3.885783001796229, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/temp/line_1_B.wav", + "silence_duration": 0.4956696231114214, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Would you be interested in a three-bedroom flat? I have a few", + "original_text": "Would you be interested in a three-bedroom flat? I have a few [interrupt] smaller units available if you're looking for something cozier, including some lovely studio apartments with modern amenities and great natural lighting that might suit your needs perfectly.", + "start_time": 4.241584522683672, + "end_time": 19.497094726765305, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/temp/line_2_A.wav", + "silence_duration": 0.35580152088744305, + "is_interrupted": true, + "text_after_interrupt": "smaller units available if you're looking for something cozier, including some lovely studio apartments with modern amenities and great natural lighting that might suit your needs perfectly." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but three bedrooms might be too much for me. Do you have anything smaller?", + "original_text": "Sorry to cut in, but three bedrooms might be too much for me. Do you have anything smaller?", + "start_time": 8.734645747173467, + "end_time": 13.529566382094101, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/temp/line_3_B.wav", + "silence_duration": 0.5640911319697642, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I understand. We do have some smaller options. But you mentioned you don't have much furniture—did you want to discuss any furnished options?", + "original_text": "I understand. We do have some smaller options. But you mentioned you don't have much furniture—did you want to discuss any furnished options?", + "start_time": 19.987864441953835, + "end_time": 28.207728387532065, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/temp/line_4_A.wav", + "silence_duration": 0.4907697151885324, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I hadn't thought about that. A furnished place could be convenient. What do you have available?", + "original_text": "Oh, I hadn't thought about that. A furnished place could be convenient. What do you have available?", + "start_time": 28.728310724560874, + "end_time": 33.82509076991235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--38/temp/line_5_B.wav", + "silence_duration": 0.5205823370288085, + "is_interrupted": false + } + ] + }, + "DialogSum--val--39": { + "original_text": "A: I'm sorry. That's all very unfortunate. I'm sure something can be done. I will put you through to our legal consultant, Mrs. Schroder. One moment, please. (dialing sound...) Hello, Mr. Cruise? Thank you for waiting. I'm awfully sorry, but Mrs. Schroder is having a meeting right now. Could she call you [interrupt] back later this afternoon, perhaps around 3 PM? She usually finishes her meetings by then and will have ample time to address your concerns thoroughly and provide the proper legal guidance you require.\nB: I'm sorry to interrupt, but are you sure this isn't just another delay tactic? I really need this resolved as soon as possible.\nA: I completely understand your concern, sir. I assure you, it's not a delay tactic. I have noted your complaint, and I will urge Mrs. Schroder to call you back as soon as possible. Could I have your phone number, please?\nB: Yes. It's 0181 945 8719. By the way, you were about to say when Mrs. Schroder could call me back?\nA: Oh, right. She should be able to call you later this afternoon.", + "cleaned_text": "A:I'm sorry. That's all very unfortunate. I'm sure something can be done. I will put you through to our legal consultant, Mrs. Schroder. One moment, please. (dialing sound...) Hello, Mr. Cruise? Thank you for waiting. I'm awfully sorry, but Mrs. Schroder is having a meeting right now. Could she call you back later this afternoon, perhaps around 3 PM? She usually finishes her meetings by then and will have ample time to address your concerns thoroughly and provide the proper legal guidance you require.\nB: I'm sorry to interrupt, but are you sure this isn't just another delay tactic? I really need this resolved as soon as possible.\nA: I completely understand your concern, sir. I assure you, it's not a delay tactic. I have noted your complaint, and I will urge Mrs. Schroder to call you back as soon as possible. Could I have your phone number, please?\nB: Yes. It's 0181 945 8719. By the way, you were about to say when Mrs. Schroder could call me back?\nA: Oh, right. She should be able to call you later this afternoon.", + "total_duration": 58.05578231292517, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm sorry. That's all very unfortunate. I'm sure something can be done. I will put you through to our legal consultant, Mrs. Schroder. One moment, please. (dialing sound...) Hello, Mr. Cruise? Thank you for waiting. I'm awfully sorry, but Mrs. Schroder is having a meeting right now. Could she call you", + "original_text": "I'm sorry. That's all very unfortunate. I'm sure something can be done. I will put you through to our legal consultant, Mrs. Schroder. One moment, please. (dialing sound...) Hello, Mr. Cruise? Thank you for waiting. I'm awfully sorry, but Mrs. Schroder is having a meeting right now. Could she call you [interrupt] back later this afternoon, perhaps around 3 PM? She usually finishes her meetings by then and will have ample time to address your concerns thoroughly and provide the proper legal guidance you require.", + "start_time": 0, + "end_time": 31.381768707482994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "back later this afternoon, perhaps around 3 PM? She usually finishes her meetings by then and will have ample time to address your concerns thoroughly and provide the proper legal guidance you require." + }, + { + "speaker": "B", + "text": "I'm sorry to interrupt, but are you sure this isn't just another delay tactic? I really need this resolved as soon as possible.", + "original_text": "I'm sorry to interrupt, but are you sure this isn't just another delay tactic? I really need this resolved as soon as possible.", + "start_time": 18.332154195011338, + "end_time": 24.76408163265306, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/temp/line_1_B.wav", + "silence_duration": 0.35475452962427056, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I completely understand your concern, sir. I assure you, it's not a delay tactic. I have noted your complaint, and I will urge Mrs. Schroder to call you back as soon as possible. Could I have your phone number, please?", + "original_text": "I completely understand your concern, sir. I assure you, it's not a delay tactic. I have noted your complaint, and I will urge Mrs. Schroder to call you back as soon as possible. Could I have your phone number, please?", + "start_time": 31.723628679523607, + "end_time": 44.35528400832179, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/temp/line_2_A.wav", + "silence_duration": 0.3418599720406132, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. It's 0181 945 8719. By the way, you were about to say when Mrs. Schroder could call me back?", + "original_text": "Yes. It's 0181 945 8719. By the way, you were about to say when Mrs. Schroder could call me back?", + "start_time": 44.658534565502954, + "end_time": 53.853636606319284, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/temp/line_3_B.wav", + "silence_duration": 0.3032505571811626, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right. She should be able to call you later this afternoon.", + "original_text": "Oh, right. She should be able to call you later this afternoon.", + "start_time": 54.17807296736505, + "end_time": 58.055805393668905, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--39/temp/line_4_A.wav", + "silence_duration": 0.32443636104576, + "is_interrupted": false + } + ] + }, + "DialogSum--val--41": { + "original_text": "A: Adam, could you show me around the school? \nB: No problem. \nA: What's the tallest building? \nB: You mean the white building near the playground? \nA: Yes. \nB: That is the library. And it has more than 1,000,000 [interrupt] rare and valuable collections that are often used for research purposes by both students and visiting scholars from around the world. \nA: Sorry to interrupt, but is it open to students all year round? \nB: Yes, it's open year-round. By the way, I was mentioning that the library has more than 1,000,000 books. \nA: That's impressive! What's the building to the south of the library? \nB: You know, our school is divided into two parts, the junior high school and the senior high school. That is the new classroom building for our senior high school. \nA: Is there a swimming pool in your school? \nB: Yes. There is a large swimming pool, but it is only available in the summer, when the weather is warm enough for outdoor activities. \nA: Oh, only in summer? \nB: Exactly, only in summer. \nA: I do envy you. And I hope I can enter your school one day. \nB: I believe that you can make your dream come true.", + "cleaned_text": "A: Adam, could you show me around the school? \nB: No problem. \nA: What's the tallest building? \nB: You mean the white building near the playground? \nA: Yes. \nB:That is the library. And it has more than 1,000,000 rare and valuable collections that are often used for research purposes by both students and visiting scholars from around the world.\nA: Sorry to interrupt, but is it open to students all year round? \nB: Yes, it's open year-round. By the way, I was mentioning that the library has more than 1,000,000 books. \nA: That's impressive! What's the building to the south of the library? \nB: You know, our school is divided into two parts, the junior high school and the senior high school. That is the new classroom building for our senior high school. \nA: Is there a swimming pool in your school? \nB: Yes. There is a large swimming pool, but it is only available in the summer, when the weather is warm enough for outdoor activities. \nA: Oh, only in summer? \nB: Exactly, only in summer. \nA: I do envy you. And I hope I can enter your school one day. \nB: I believe that you can make your dream come true.", + "total_duration": 57.40866213151927, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Adam, could you show me around the school?", + "original_text": "Adam, could you show me around the school?", + "start_time": 0, + "end_time": 2.36843537414966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem.", + "original_text": "No problem.", + "start_time": 2.7065660147277266, + "end_time": 3.542484382074665, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_1_B.wav", + "silence_duration": 0.33813064057806674, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What's the tallest building?", + "original_text": "What's the tallest building?", + "start_time": 3.9112372764419794, + "end_time": 5.490194192541752, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_2_A.wav", + "silence_duration": 0.3687528943673142, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You mean the white building near the playground?", + "original_text": "You mean the white building near the playground?", + "start_time": 6.0090145310848975, + "end_time": 8.122030404100771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_3_B.wav", + "silence_duration": 0.5188203385431458, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes.", + "original_text": "Yes.", + "start_time": 8.55617753042923, + "end_time": 9.229556215236485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_4_A.wav", + "silence_duration": 0.43414712632845887, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That is the library. And it has more than 1,000,000", + "original_text": "That is the library. And it has more than 1,000,000 [interrupt] rare and valuable collections that are often used for research purposes by both students and visiting scholars from around the world.", + "start_time": 9.712146354875859, + "end_time": 18.6518288945584, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_5_B.wav", + "silence_duration": 0.482590139639374, + "is_interrupted": true, + "text_after_interrupt": "rare and valuable collections that are often used for research purposes by both students and visiting scholars from around the world." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but is it open to students all year round?", + "original_text": "Sorry to interrupt, but is it open to students all year round?", + "start_time": 12.788790345805564, + "end_time": 16.701352704082208, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_6_A.wav", + "silence_duration": 0.481508930145353, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's open year-round. By the way, I was mentioning that the library has more than 1,000,000 books.", + "original_text": "Yes, it's open year-round. By the way, I was mentioning that the library has more than 1,000,000 books.", + "start_time": 19.14365653258195, + "end_time": 24.76288555752526, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_7_B.wav", + "silence_duration": 0.491827638023552, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's impressive! What's the building to the south of the library?", + "original_text": "That's impressive! What's the building to the south of the library?", + "start_time": 25.119877119816415, + "end_time": 28.99760954612027, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_8_A.wav", + "silence_duration": 0.3569915622911549, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You know, our school is divided into two parts, the junior high school and the senior high school. That is the new classroom building for our senior high school.", + "original_text": "You know, our school is divided into two parts, the junior high school and the senior high school. That is the new classroom building for our senior high school.", + "start_time": 29.417314767819285, + "end_time": 37.01023993788731, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_9_B.wav", + "silence_duration": 0.4197052216990145, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is there a swimming pool in your school?", + "original_text": "Is there a swimming pool in your school?", + "start_time": 37.513748021659666, + "end_time": 39.46422421213585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_10_A.wav", + "silence_duration": 0.5035080837723496, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. There is a large swimming pool, but it is only available in the summer, when the weather is warm enough for outdoor activities.", + "original_text": "Yes. There is a large swimming pool, but it is only available in the summer, when the weather is warm enough for outdoor activities.", + "start_time": 39.91682683951088, + "end_time": 46.23265450390998, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_11_B.wav", + "silence_duration": 0.45260262737502943, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, only in summer?", + "original_text": "Oh, only in summer?", + "start_time": 46.760094538797645, + "end_time": 48.21134170433052, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_12_A.wav", + "silence_duration": 0.527440034887666, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Exactly, only in summer.", + "original_text": "Exactly, only in summer.", + "start_time": 48.787016821357284, + "end_time": 50.67944312521216, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_13_B.wav", + "silence_duration": 0.5756751170267604, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I do envy you. And I hope I can enter your school one day.", + "original_text": "I do envy you. And I hope I can enter your school one day.", + "start_time": 51.23939647745034, + "end_time": 54.76882958402631, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_14_A.wav", + "silence_duration": 0.559953352238183, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I believe that you can make your dream come true.", + "original_text": "I believe that you can make your dream come true.", + "start_time": 55.24923716474116, + "end_time": 57.408692947054085, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--41/temp/line_15_B.wav", + "silence_duration": 0.4804075807148551, + "is_interrupted": false + } + ] + }, + "DialogSum--val--42": { + "original_text": "A: Excuse me. I'm a stranger here and lost my way. \nB: Can I help you? \nA: Sure. Can I get to the central department stall this way? \nB: Uh... Yes. Turn right, then take the second turning on your [interrupt] left, and you'll see a large shopping complex with distinctive blue signage where you should continue straight past the fountain until you reach the central department stall. \nA: Sorry to cut in, but I just realized I might also need to stop by the national bank. Do you know where that is? \nB: Yes, it's on this street. Keep walking for two blocks and it's on the corner on the right. But about the department stall, after you take the second left, it's about a fifteen-minute walk. \nA: Got it, thanks very much. \nB: You are welcome. Good luck.", + "cleaned_text": "A: Excuse me. I'm a stranger here and lost my way. \nB: Can I help you? \nA: Sure. Can I get to the central department stall this way? \nB:Uh... Yes. Turn right, then take the second turning on your left, and you'll see a large shopping complex with distinctive blue signage where you should continue straight past the fountain until you reach the central department stall.\nA: Sorry to cut in, but I just realized I might also need to stop by the national bank. Do you know where that is? \nB: Yes, it's on this street. Keep walking for two blocks and it's on the corner on the right. But about the department stall, after you take the second left, it's about a fifteen-minute walk. \nA: Got it, thanks very much. \nB: You are welcome. Good luck.", + "total_duration": 35.471927437641725, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. I'm a stranger here and lost my way.", + "original_text": "Excuse me. I'm a stranger here and lost my way.", + "start_time": 0, + "end_time": 3.7384126984126986, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Can I help you?", + "original_text": "Can I help you?", + "start_time": 4.315387128086339, + "end_time": 5.151305495433278, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_1_B.wav", + "silence_duration": 0.5769744296736403, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure. Can I get to the central department stall this way?", + "original_text": "Sure. Can I get to the central department stall this way?", + "start_time": 5.491835439549449, + "end_time": 8.463989634560788, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_2_A.wav", + "silence_duration": 0.34052994411617077, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Uh... Yes. Turn right, then take the second turning on your", + "original_text": "Uh... Yes. Turn right, then take the second turning on your [interrupt] left, and you'll see a large shopping complex with distinctive blue signage where you should continue straight past the fountain until you reach the central department stall.", + "start_time": 9.034615338934943, + "end_time": 21.38763121195082, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_3_B.wav", + "silence_duration": 0.5706257043741554, + "is_interrupted": true, + "text_after_interrupt": "left, and you'll see a large shopping complex with distinctive blue signage where you should continue straight past the fountain until you reach the central department stall." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but I just realized I might also need to stop by the national bank. Do you know where that is?", + "original_text": "Sorry to cut in, but I just realized I might also need to stop by the national bank. Do you know where that is?", + "start_time": 13.086497425102744, + "end_time": 19.79706431852678, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_4_A.wav", + "silence_duration": 0.49721058355430914, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's on this street. Keep walking for two blocks and it's on the corner on the right. But about the department stall, after you take the second left, it's about a fifteen-minute walk.", + "original_text": "Yes, it's on this street. Keep walking for two blocks and it's on the corner on the right. But about the department stall, after you take the second left, it's about a fifteen-minute walk.", + "start_time": 21.8717577492355, + "end_time": 31.148129631321666, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_5_B.wav", + "silence_duration": 0.48412653728468047, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it, thanks very much.", + "original_text": "Got it, thanks very much.", + "start_time": 31.724093963138102, + "end_time": 33.442370607129035, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_6_A.wav", + "silence_duration": 0.5759643318164369, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You are welcome. Good luck.", + "original_text": "You are welcome. Good luck.", + "start_time": 33.97424316577376, + "end_time": 35.47193024060369, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--42/temp/line_7_B.wav", + "silence_duration": 0.5318725586447242, + "is_interrupted": false + } + ] + }, + "DialogSum--val--43": { + "original_text": "A: Some people pile on their agonise and try to seek other's sympathy by telling them how miserable they [interrupt] feel, hoping to get something out of it. It's a manipulative tactic that preys on people's kindness and often leaves the giver feeling used and disappointed.\nB: Yeah, and it's really frustrating because they often take advantage of other people's hospitality and generosity.\nA: Exactly. I was fooled once. A lady told me she needed some money to keep the pot boiling. So I gave her some money and bailed her out of the situation. But later I learned that she had [interrupt] used the money for something completely different, something I would never have supported. She threw an extravagant party with expensive alcohol and gourmet food while claiming to be struggling to feed her children.\nB: Lied to you, right? That's terrible. But you know, you should have seen through her. It sounds like you were still a bit wet behind the ears back then.\nA: Yeah, I guess so. But I never got to tell you what she actually did with the money... She spent it on a lavish dinner for herself, rather than on the essentials she claimed she needed. The worst part was she posted pictures of the party on social media without a care in the world.", + "cleaned_text": "A:Some people pile on their agonise and try to seek other's sympathy by telling them how miserable they feel, hoping to get something out of it. It's a manipulative tactic that preys on people's kindness and often leaves the giver feeling used and disappointed.\nB: Yeah, and it's really frustrating because they often take advantage of other people's hospitality and generosity.\nA:Exactly. I was fooled once. A lady told me she needed some money to keep the pot boiling. So I gave her some money and bailed her out of the situation. But later I learned that she had used the money for something completely different, something I would never have supported. She threw an extravagant party with expensive alcohol and gourmet food while claiming to be struggling to feed her children.\nB: Lied to you, right? That's terrible. But you know, you should have seen through her. It sounds like you were still a bit wet behind the ears back then.\nA: Yeah, I guess so. But I never got to tell you what she actually did with the money... She spent it on a lavish dinner for herself, rather than on the essentials she claimed she needed. The worst part was she posted pictures of the party on social media without a care in the world.", + "total_duration": 56.87469387755102, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Some people pile on their agonise and try to seek other's sympathy by telling them how miserable they", + "original_text": "Some people pile on their agonise and try to seek other's sympathy by telling them how miserable they [interrupt] feel, hoping to get something out of it. It's a manipulative tactic that preys on people's kindness and often leaves the giver feeling used and disappointed.", + "start_time": 0, + "end_time": 14.837551020408164, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "feel, hoping to get something out of it. It's a manipulative tactic that preys on people's kindness and often leaves the giver feeling used and disappointed." + }, + { + "speaker": "B", + "text": "Yeah, and it's really frustrating because they often take advantage of other people's hospitality and generosity.", + "original_text": "Yeah, and it's really frustrating because they often take advantage of other people's hospitality and generosity.", + "start_time": 6.478367346938776, + "end_time": 12.07437641723356, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/temp/line_1_B.wav", + "silence_duration": 0.42388688110802625, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Exactly. I was fooled once. A lady told me she needed some money to keep the pot boiling. So I gave her some money and bailed her out of the situation. But later I learned that she had", + "original_text": "Exactly. I was fooled once. A lady told me she needed some money to keep the pot boiling. So I gave her some money and bailed her out of the situation. But later I learned that she had [interrupt] used the money for something completely different, something I would never have supported. She threw an extravagant party with expensive alcohol and gourmet food while claiming to be struggling to feed her children.", + "start_time": 15.185866361444122, + "end_time": 38.13879153151215, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/temp/line_2_A.wav", + "silence_duration": 0.34831534103595846, + "is_interrupted": true, + "text_after_interrupt": "used the money for something completely different, something I would never have supported. She threw an extravagant party with expensive alcohol and gourmet food while claiming to be struggling to feed her children." + }, + { + "speaker": "B", + "text": "Lied to you, right? That's terrible. But you know, you should have seen through her. It sounds like you were still a bit wet behind the ears back then.", + "original_text": "Lied to you, right? That's terrible. But you know, you should have seen through her. It sounds like you were still a bit wet behind the ears back then.", + "start_time": 32.706299613562976, + "end_time": 39.66067603079654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/temp/line_3_B.wav", + "silence_duration": 0.3594985611086551, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, I guess so. But I never got to tell you what she actually did with the money... She spent it on a lavish dinner for herself, rather than on the essentials she claimed she needed. The worst part was she posted pictures of the party on social media without a care in the world.", + "original_text": "Yeah, I guess so. But I never got to tell you what she actually did with the money... She spent it on a lavish dinner for herself, rather than on the essentials she claimed she needed. The worst part was she posted pictures of the party on social media without a care in the world.", + "start_time": 39.98220583676241, + "end_time": 56.87472284356513, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--43/temp/line_4_A.wav", + "silence_duration": 0.3215298059658768, + "is_interrupted": false + } + ] + }, + "DialogSum--val--44": { + "original_text": "A: I'm looking for a pan I can use in my kitchen.\nB: What size pan were you thinking of?\nA: I've already got a small pan. I need a big [interrupt] one for cooking larger meals, especially when I have guests over, because I frequently host dinner parties and need something that can handle multiple servings at once.\nB: Sorry to jump in, but do you have any material preference? Like non-stick or stainless steel?\nA: I was actually thinking of a non-stick one. But I haven't mentioned the size yet. I need a big one.\nB: Well, this one might work for you.\nA: Oh, no, that's way too heavy a pan for me.\nB: Here, lift this aluminum pan. It's the same size.\nA: Yes, it's very lightweight. But I don't want this aluminum handle.\nB: Here's a similar aluminum pan. But it has a heat-resistant handle.\nA: Oh, this feels very nice. It's perfect. I'll take it.\nB: I knew we'd find the right pan sooner or later. How would you like to [interrupt] pay for it? We accept cash, card, or mobile payments, and you can also sign up for our loyalty program to get discounts on future purchases.\nA: Oh, before that, I need a lid for this pan.\nB: No problem. Here's the lid that comes with the pan.", + "cleaned_text": "A: I'm looking for a pan I can use in my kitchen.\nB: What size pan were you thinking of?\nA:I've already got a small pan. I need a big one for cooking larger meals, especially when I have guests over, because I frequently host dinner parties and need something that can handle multiple servings at once.\nB: Sorry to jump in, but do you have any material preference? Like non-stick or stainless steel?\nA: I was actually thinking of a non-stick one. But I haven't mentioned the size yet. I need a big one.\nB: Well, this one might work for you.\nA: Oh, no, that's way too heavy a pan for me.\nB: Here, lift this aluminum pan. It's the same size.\nA: Yes, it's very lightweight. But I don't want this aluminum handle.\nB: Here's a similar aluminum pan. But it has a heat-resistant handle.\nA: Oh, this feels very nice. It's perfect. I'll take it.\nB:I knew we'd find the right pan sooner or later. How would you like to pay for it? We accept cash, card, or mobile payments, and you can also sign up for our loyalty program to get discounts on future purchases.\nA: Oh, before that, I need a lid for this pan.\nB: No problem. Here's the lid that comes with the pan.", + "total_duration": 63.51387755102041, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm looking for a pan I can use in my kitchen.", + "original_text": "I'm looking for a pan I can use in my kitchen.", + "start_time": 0, + "end_time": 2.7399546485260773, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What size pan were you thinking of?", + "original_text": "What size pan were you thinking of?", + "start_time": 3.318079206099183, + "end_time": 5.094405736711428, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_1_B.wav", + "silence_duration": 0.578124557573106, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I've already got a small pan. I need a big", + "original_text": "I've already got a small pan. I need a big [interrupt] one for cooking larger meals, especially when I have guests over, because I frequently host dinner parties and need something that can handle multiple servings at once.", + "start_time": 5.472995431782411, + "end_time": 18.371680239038646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_2_A.wav", + "silence_duration": 0.37858969507098317, + "is_interrupted": true, + "text_after_interrupt": "one for cooking larger meals, especially when I have guests over, because I frequently host dinner parties and need something that can handle multiple servings at once." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you have any material preference? Like non-stick or stainless steel?", + "original_text": "Sorry to jump in, but do you have any material preference? Like non-stick or stainless steel?", + "start_time": 8.445149626793748, + "end_time": 13.658029445387854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_3_B.wav", + "silence_duration": 0.5239187498206239, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was actually thinking of a non-stick one. But I haven't mentioned the size yet. I need a big one.", + "original_text": "I was actually thinking of a non-stick one. But I haven't mentioned the size yet. I need a big one.", + "start_time": 18.93038060330449, + "end_time": 24.909518925299952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_4_A.wav", + "silence_duration": 0.5587003642658412, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, this one might work for you.", + "original_text": "Well, this one might work for you.", + "start_time": 25.42644292305652, + "end_time": 27.237599385641555, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_5_B.wav", + "silence_duration": 0.5169239977565669, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, no, that's way too heavy a pan for me.", + "original_text": "Oh, no, that's way too heavy a pan for me.", + "start_time": 27.60194703056834, + "end_time": 30.481221406985572, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_6_A.wav", + "silence_duration": 0.3643476449267847, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here, lift this aluminum pan. It's the same size.", + "original_text": "Here, lift this aluminum pan. It's the same size.", + "start_time": 30.823906584183803, + "end_time": 33.99343039370761, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_7_B.wav", + "silence_duration": 0.3426851771982313, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it's very lightweight. But I don't want this aluminum handle.", + "original_text": "Yes, it's very lightweight. But I don't want this aluminum handle.", + "start_time": 34.58040121644136, + "end_time": 38.85287287177016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_8_A.wav", + "silence_duration": 0.5869708227337471, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here's a similar aluminum pan. But it has a heat-resistant handle.", + "original_text": "Here's a similar aluminum pan. But it has a heat-resistant handle.", + "start_time": 39.35650727454284, + "end_time": 43.24584967817096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_9_B.wav", + "silence_duration": 0.5036344027726806, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, this feels very nice. It's perfect. I'll take it.", + "original_text": "Oh, this feels very nice. It's perfect. I'll take it.", + "start_time": 43.66906849472611, + "end_time": 47.40748119313881, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_10_A.wav", + "silence_duration": 0.4232188165551489, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I knew we'd find the right pan sooner or later. How would you like to", + "original_text": "I knew we'd find the right pan sooner or later. How would you like to [interrupt] pay for it? We accept cash, card, or mobile payments, and you can also sign up for our loyalty program to get discounts on future purchases.", + "start_time": 47.74784966331664, + "end_time": 59.183677327715735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_11_B.wav", + "silence_duration": 0.34036847017783795, + "is_interrupted": true, + "text_after_interrupt": "pay for it? We accept cash, card, or mobile payments, and you can also sign up for our loyalty program to get discounts on future purchases." + }, + { + "speaker": "A", + "text": "Oh, before that, I need a lid for this pan.", + "original_text": "Oh, before that, I need a lid for this pan.", + "start_time": 57.77708555645126, + "end_time": 60.366110499761916, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_12_A.wav", + "silence_duration": 0.4256164625533818, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem. Here's the lid that comes with the pan.", + "original_text": "No problem. Here's the lid that comes with the pan.", + "start_time": 60.68106233476157, + "end_time": 63.51389680188175, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--44/temp/line_13_B.wav", + "silence_duration": 0.31495183499965174, + "is_interrupted": false + } + ] + }, + "DialogSum--val--45": { + "original_text": "A: Come in, come in! \nB: Hi, Gary, what happened? I was waiting for you at the theater. Why didn't you meet me [interrupt] I was getting worried when you didn't show up and started thinking something might have happened to you on the way here. \nA: I thought we were supposed to meet here. \nB: Don't you know our movie starts at seven? And we were going to meet at the theater at five to seven. Then it doesn't make sense to meet at the apartment. \nA: I'm sorry. We must have misunderstood each other. I was going to mention that I thought we had a different plan, but I guess I should have confirmed it with you earlier. \nB: Why don't you try to be clearer about your intentions [interrupt] next time, so we don't end up in situations like this? It's really frustrating when we keep having these miscommunications about our plans. \nA: You're right, I should've been more specific. But just to clarify, did you mean we were supposed to meet at the theater right before the movie started, or did I miss something else? \nB: We were definitely supposed to meet at the theater at five to seven. But it's okay. I don't want to go now. We've already missed ten minutes of the movie. I don't want to see a movie without watching the beginning.", + "cleaned_text": "A: Come in, come in! \nB:Hi, Gary, what happened? I was waiting for you at the theater. Why didn't you meet me I was getting worried when you didn't show up and started thinking something might have happened to you on the way here.\nA: I thought we were supposed to meet here. \nB: Don't you know our movie starts at seven? And we were going to meet at the theater at five to seven. Then it doesn't make sense to meet at the apartment. \nA: I'm sorry. We must have misunderstood each other. I was going to mention that I thought we had a different plan, but I guess I should have confirmed it with you earlier. \nB:Why don't you try to be clearer about your intentions next time, so we don't end up in situations like this? It's really frustrating when we keep having these miscommunications about our plans.\nA: You're right, I should've been more specific. But just to clarify, did you mean we were supposed to meet at the theater right before the movie started, or did I miss something else? \nB: We were definitely supposed to meet at the theater at five to seven. But it's okay. I don't want to go now. We've already missed ten minutes of the movie. I don't want to see a movie without watching the beginning.", + "total_duration": 55.62662131519274, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Come in, come in!", + "original_text": "Come in, come in!", + "start_time": 0, + "end_time": 1.1377777777777778, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hi, Gary, what happened? I was waiting for you at the theater. Why didn't you meet me", + "original_text": "Hi, Gary, what happened? I was waiting for you at the theater. Why didn't you meet me [interrupt] I was getting worried when you didn't show up and started thinking something might have happened to you on the way here.", + "start_time": 1.5333652685513572, + "end_time": 10.68202740007063, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_1_B.wav", + "silence_duration": 0.3955874907735795, + "is_interrupted": true, + "text_after_interrupt": "I was getting worried when you didn't show up and started thinking something might have happened to you on the way here." + }, + { + "speaker": "A", + "text": "I thought we were supposed to meet here.", + "original_text": "I thought we were supposed to meet here.", + "start_time": 6.026426493041153, + "end_time": 8.058172524787185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_2_A.wav", + "silence_duration": 0.5173835855441744, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't you know our movie starts at seven? And we were going to meet at the theater at five to seven. Then it doesn't make sense to meet at the apartment.", + "original_text": "Don't you know our movie starts at seven? And we were going to meet at the theater at five to seven. Then it doesn't make sense to meet at the apartment.", + "start_time": 11.168013000733742, + "end_time": 18.296539077831248, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_3_B.wav", + "silence_duration": 0.48598560066311147, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm sorry. We must have misunderstood each other. I was going to mention that I thought we had a different plan, but I guess I should have confirmed it with you earlier.", + "original_text": "I'm sorry. We must have misunderstood each other. I was going to mention that I thought we had a different plan, but I guess I should have confirmed it with you earlier.", + "start_time": 18.64525496352827, + "end_time": 28.978134782122375, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_4_A.wav", + "silence_duration": 0.3487158856970229, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why don't you try to be clearer about your intentions", + "original_text": "Why don't you try to be clearer about your intentions [interrupt] next time, so we don't end up in situations like this? It's really frustrating when we keep having these miscommunications about our plans.", + "start_time": 29.530363849672966, + "end_time": 39.39884457529655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_5_B.wav", + "silence_duration": 0.5522290675505921, + "is_interrupted": true, + "text_after_interrupt": "next time, so we don't end up in situations like this? It's really frustrating when we keep having these miscommunications about our plans." + }, + { + "speaker": "A", + "text": "You're right, I should've been more specific. But just to clarify, did you mean we were supposed to meet at the theater right before the movie started, or did I miss something else?", + "original_text": "You're right, I should've been more specific. But just to clarify, did you mean we were supposed to meet at the theater right before the movie started, or did I miss something else?", + "start_time": 34.563546171886806, + "end_time": 44.722276330616964, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_6_A.wav", + "silence_duration": 0.5036215033110275, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We were definitely supposed to meet at the theater at five to seven. But it's okay. I don't want to go now. We've already missed ten minutes of the movie. I don't want to see a movie without watching the beginning.", + "original_text": "We were definitely supposed to meet at the theater at five to seven. But it's okay. I don't want to go now. We've already missed ten minutes of the movie. I don't want to see a movie without watching the beginning.", + "start_time": 45.21247994119258, + "end_time": 55.62662960105653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--45/temp/line_7_B.wav", + "silence_duration": 0.49020361057561646, + "is_interrupted": false + } + ] + }, + "DialogSum--val--47": { + "original_text": "A: What's wrong with you, Lucy? \nB: Our dog Rusty is lost. Someone left the backyard gate open and he got out. My daughter is so upset [interrupt] that she hasn't stopped crying since we realized he was missing and she keeps asking when he's coming home every five minutes. \nA: Have you called the local dog shelters? \nB: Well, they haven't seen him. They said they would call me if they find our dog, but I don't expect miracles. It's 2 days and... \nA: We can always look for miracles. Does he have any identification on him? \nB: He's wearing his sweater. He's brown with white spots and... Sorry, I'm not thinking straight. You know, he's a big part of our family. We got him when he was a little [interrupt] puppy, and he's been with us through so many important moments including my daughter's first steps and her first day of school. \nA: Wait, did you say he's wearing a sweater? That might help people recognize him faster. \nB: Yes, he's wearing a sweater. But as I was saying, we got him when he was a little puppy. I'm just worried he was stolen or is injured somewhere. \nA: I understand. I used to pet dogs, too. Let's walk around the neighborhood. Hey, look! There he is. \nB: Rusty! Come here boy! Oh, Glenn, I can't thank you enough. I owe you a big favor.", + "cleaned_text": "A: What's wrong with you, Lucy? \nB:Our dog Rusty is lost. Someone left the backyard gate open and he got out. My daughter is so upset that she hasn't stopped crying since we realized he was missing and she keeps asking when he's coming home every five minutes.\nA: Have you called the local dog shelters? \nB: Well, they haven't seen him. They said they would call me if they find our dog, but I don't expect miracles. It's 2 days and... \nA: We can always look for miracles. Does he have any identification on him? \nB:He's wearing his sweater. He's brown with white spots and... Sorry, I'm not thinking straight. You know, he's a big part of our family. We got him when he was a little puppy, and he's been with us through so many important moments including my daughter's first steps and her first day of school.\nA: Wait, did you say he's wearing a sweater? That might help people recognize him faster. \nB: Yes, he's wearing a sweater. But as I was saying, we got him when he was a little puppy. I'm just worried he was stolen or is injured somewhere. \nA: I understand. I used to pet dogs, too. Let's walk around the neighborhood. Hey, look! There he is. \nB: Rusty! Come here boy! Oh, Glenn, I can't thank you enough. I owe you a big favor.", + "total_duration": 61.44439909297052, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What's wrong with you, Lucy?", + "original_text": "What's wrong with you, Lucy?", + "start_time": 0, + "end_time": 1.555736961451247, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Our dog Rusty is lost. Someone left the backyard gate open and he got out. My daughter is so upset", + "original_text": "Our dog Rusty is lost. Someone left the backyard gate open and he got out. My daughter is so upset [interrupt] that she hasn't stopped crying since we realized he was missing and she keeps asking when he's coming home every five minutes.", + "start_time": 1.8737574589898556, + "end_time": 13.263145214091896, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_1_B.wav", + "silence_duration": 0.31802049753860856, + "is_interrupted": true, + "text_after_interrupt": "that she hasn't stopped crying since we realized he was missing and she keeps asking when he's coming home every five minutes." + }, + { + "speaker": "A", + "text": "Have you called the local dog shelters?", + "original_text": "Have you called the local dog shelters?", + "start_time": 7.945775599579425, + "end_time": 10.03557151794677, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_2_A.wav", + "silence_duration": 0.56299363355346, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, they haven't seen him. They said they would call me if they find our dog, but I don't expect miracles. It's 2 days and...", + "original_text": "Well, they haven't seen him. They said they would call me if they find our dog, but I don't expect miracles. It's 2 days and...", + "start_time": 13.636402002728921, + "end_time": 19.731640097967016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_3_B.wav", + "silence_duration": 0.3732567886370249, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We can always look for miracles. Does he have any identification on him?", + "original_text": "We can always look for miracles. Does he have any identification on him?", + "start_time": 20.212250147519153, + "end_time": 24.728531326657475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_4_A.wav", + "silence_duration": 0.48061004955213726, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "He's wearing his sweater. He's brown with white spots and... Sorry, I'm not thinking straight. You know, he's a big part of our family. We got him when he was a little", + "original_text": "He's wearing his sweater. He's brown with white spots and... Sorry, I'm not thinking straight. You know, he's a big part of our family. We got him when he was a little [interrupt] puppy, and he's been with us through so many important moments including my daughter's first steps and her first day of school.", + "start_time": 25.14221910058607, + "end_time": 39.25995152688992, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_5_B.wav", + "silence_duration": 0.4136877739285948, + "is_interrupted": true, + "text_after_interrupt": "puppy, and he's been with us through so many important moments including my daughter's first steps and her first day of school." + }, + { + "speaker": "A", + "text": "Wait, did you say he's wearing a sweater? That might help people recognize him faster.", + "original_text": "Wait, did you say he's wearing a sweater? That might help people recognize him faster.", + "start_time": 36.157403988429024, + "end_time": 41.17291419251066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_6_A.wav", + "silence_duration": 0.391926693330291, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, he's wearing a sweater. But as I was saying, we got him when he was a little puppy. I'm just worried he was stolen or is injured somewhere.", + "original_text": "Yes, he's wearing a sweater. But as I was saying, we got him when he was a little puppy. I'm just worried he was stolen or is injured somewhere.", + "start_time": 41.64606548069918, + "end_time": 48.43790221539305, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_7_B.wav", + "silence_duration": 0.4731512881885179, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I understand. I used to pet dogs, too. Let's walk around the neighborhood. Hey, look! There he is.", + "original_text": "I understand. I used to pet dogs, too. Let's walk around the neighborhood. Hey, look! There he is.", + "start_time": 48.88561644438977, + "end_time": 56.06058243078432, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_8_A.wav", + "silence_duration": 0.4477142289967163, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Rusty! Come here boy! Oh, Glenn, I can't thank you enough. I owe you a big favor.", + "original_text": "Rusty! Come here boy! Oh, Glenn, I can't thank you enough. I owe you a big favor.", + "start_time": 56.64947959419089, + "end_time": 61.44440022911153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--47/temp/line_9_B.wav", + "silence_duration": 0.5888971634065695, + "is_interrupted": false + } + ] + }, + "DialogSum--val--48": { + "original_text": "A: Oh, Patrick. I can't get this phone to work. Can you help me? \nB: Are you trying to make a [interrupt] call or just trying to set it up? I can walk you through either process step by step if you'd like, starting with the basics of how to navigate the menu system. \nA: Yes, I just got it and I can't get the thing to work. \nB: Let me see. OK, you turn it on. \nA: I didn't turn it [interrupt] on because I thought it was already on out of the box, but now I realize most electronics need to be manually powered on for the first time after unboxing them. \nB: Wait, you didn't turn it on? That's the first step. See, you wait for the screen to light up. Then you enter the phone number and press the C button, right here. Got it?", + "cleaned_text": "A: Oh, Patrick. I can't get this phone to work. Can you help me? \nB:Are you trying to make a call or just trying to set it up? I can walk you through either process step by step if you'd like, starting with the basics of how to navigate the menu system.\nA: Yes, I just got it and I can't get the thing to work. \nB: Let me see. OK, you turn it on. \nA:I didn't turn it on because I thought it was already on out of the box, but now I realize most electronics need to be manually powered on for the first time after unboxing them.\nB: Wait, you didn't turn it on? That's the first step. See, you wait for the screen to light up. Then you enter the phone number and press the C button, right here. Got it?", + "total_duration": 28.40222222222222, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Oh, Patrick. I can't get this phone to work. Can you help me?", + "original_text": "Oh, Patrick. I can't get this phone to work. Can you help me?", + "start_time": 0, + "end_time": 3.7384126984126986, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Are you trying to make a", + "original_text": "Are you trying to make a [interrupt] call or just trying to set it up? I can walk you through either process step by step if you'd like, starting with the basics of how to navigate the menu system.", + "start_time": 4.242159474654863, + "end_time": 12.694222966718357, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/temp/line_1_B.wav", + "silence_duration": 0.5037467762421646, + "is_interrupted": true, + "text_after_interrupt": "call or just trying to set it up? I can walk you through either process step by step if you'd like, starting with the basics of how to navigate the menu system." + }, + { + "speaker": "A", + "text": "Yes, I just got it and I can't get the thing to work.", + "original_text": "Yes, I just got it and I can't get the thing to work.", + "start_time": 5.7398465494847954, + "end_time": 8.874540427035816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/temp/line_2_A.wav", + "silence_duration": 0.35415939575977495, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let me see. OK, you turn it on.", + "original_text": "Let me see. OK, you turn it on.", + "start_time": 13.279082554975457, + "end_time": 15.217948768127384, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/temp/line_3_B.wav", + "silence_duration": 0.5848595882570995, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I didn't turn it", + "original_text": "I didn't turn it [interrupt] on because I thought it was already on out of the box, but now I realize most electronics need to be manually powered on for the first time after unboxing them.", + "start_time": 15.78301410903749, + "end_time": 25.72115469860665, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/temp/line_4_A.wav", + "silence_duration": 0.5650653409101054, + "is_interrupted": true, + "text_after_interrupt": "on because I thought it was already on out of the box, but now I realize most electronics need to be manually powered on for the first time after unboxing them." + }, + { + "speaker": "B", + "text": "Wait, you didn't turn it on? That's the first step. See, you wait for the screen to light up. Then you enter the phone number and press the C button, right here. Got it?", + "original_text": "Wait, you didn't turn it on? That's the first step. See, you wait for the screen to light up. Then you enter the phone number and press the C button, right here. Got it?", + "start_time": 19.9037280603303, + "end_time": 28.402231461690846, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--48/temp/line_5_B.wav", + "silence_duration": 0.3554124548739502, + "is_interrupted": false + } + ] + }, + "DialogSum--val--49": { + "original_text": "A: May I help you? \nB: Yes, I'd like to book 3 seats to Calgary, Canada on a flight, leaving sometime before next [interrupt] week, preferably before Sunday, as we have an important family reunion that we absolutely can't miss. \nA: Sorry to jump in, but do you have any specific time in mind for departure? It might help narrow down the options. \nB: Oh, no specific time, just before next Sunday. \nA: Got it. Economy class? \nB: Yes. \nA: One way or round trip? \nB: One way. \nA: There aren't any direct flights, sir. You will have to change in Vancouver. \nB: That's alright. \nA: There is a Canadian Airlines flight 30 leaving Beijing next Friday at 10 o'clock am. It has 3 seats available. Will that be alright? \nB: That's fine. \nA: Your name, please. \nB: BASIL, Basil. How much is the [interrupt] ticket including all taxes and fees? I'd also like to know if there are any baggage restrictions we should be aware of before booking. \nA: Sorry, I missed that—was it B-A-S-I-L? \nB: Yes, that's correct. How much is the ticket?", + "cleaned_text": "A: May I help you? \nB:Yes, I'd like to book 3 seats to Calgary, Canada on a flight, leaving sometime before next week, preferably before Sunday, as we have an important family reunion that we absolutely can't miss.\nA: Sorry to jump in, but do you have any specific time in mind for departure? It might help narrow down the options. \nB: Oh, no specific time, just before next Sunday. \nA: Got it. Economy class? \nB: Yes. \nA: One way or round trip? \nB: One way. \nA: There aren't any direct flights, sir. You will have to change in Vancouver. \nB: That's alright. \nA: There is a Canadian Airlines flight 30 leaving Beijing next Friday at 10 o'clock am. It has 3 seats available. Will that be alright? \nB: That's fine. \nA: Your name, please. \nB:BASIL, Basil. How much is the ticket including all taxes and fees? I'd also like to know if there are any baggage restrictions we should be aware of before booking.\nA: Sorry, I missed that—was it B-A-S-I-L? \nB: Yes, that's correct. How much is the ticket?", + "total_duration": 56.907165532879816, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I help you?", + "original_text": "May I help you?", + "start_time": 0, + "end_time": 0.9984580498866213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'd like to book 3 seats to Calgary, Canada on a flight, leaving sometime before next", + "original_text": "Yes, I'd like to book 3 seats to Calgary, Canada on a flight, leaving sometime before next [interrupt] week, preferably before Sunday, as we have an important family reunion that we absolutely can't miss.", + "start_time": 1.403706859719134, + "end_time": 11.562437018449293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_1_B.wav", + "silence_duration": 0.4052488098325127, + "is_interrupted": true, + "text_after_interrupt": "week, preferably before Sunday, as we have an important family reunion that we absolutely can't miss." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but do you have any specific time in mind for departure? It might help narrow down the options.", + "original_text": "Sorry to jump in, but do you have any specific time in mind for departure? It might help narrow down the options.", + "start_time": 6.802346315501446, + "end_time": 14.035362188517318, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_2_A.wav", + "silence_duration": 0.5703451522444136, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, no specific time, just before next Sunday.", + "original_text": "Oh, no specific time, just before next Sunday.", + "start_time": 14.597921782730914, + "end_time": 17.488806136472412, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_3_B.wav", + "silence_duration": 0.5625595942135951, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. Economy class?", + "original_text": "Got it. Economy class?", + "start_time": 18.00185287698193, + "end_time": 20.393508205780115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_4_A.wav", + "silence_duration": 0.5130467405095174, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes.", + "original_text": "Yes.", + "start_time": 20.787702713587656, + "end_time": 21.356591602476545, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_5_B.wav", + "silence_duration": 0.3941945078075417, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "One way or round trip?", + "original_text": "One way or round trip?", + "start_time": 21.788125853091145, + "end_time": 23.123273245381395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_6_A.wav", + "silence_duration": 0.4315342506146004, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "One way.", + "original_text": "One way.", + "start_time": 23.598928726562306, + "end_time": 24.249087456721035, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_7_B.wav", + "silence_duration": 0.47565548118091117, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There aren't any direct flights, sir. You will have to change in Vancouver.", + "original_text": "There aren't any direct flights, sir. You will have to change in Vancouver.", + "start_time": 24.6480296559627, + "end_time": 28.839231470021655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_8_A.wav", + "silence_duration": 0.39894219924166135, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's alright.", + "original_text": "That's alright.", + "start_time": 29.206592062468836, + "end_time": 30.042510429815774, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_9_B.wav", + "silence_duration": 0.3673605924471804, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There is a Canadian Airlines flight 30 leaving Beijing next Friday at 10 o'clock am. It has 3 seats available. Will that be alright?", + "original_text": "There is a Canadian Airlines flight 30 leaving Beijing next Friday at 10 o'clock am. It has 3 seats available. Will that be alright?", + "start_time": 30.640298929080476, + "end_time": 39.09236242114397, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_10_A.wav", + "silence_duration": 0.5977884992647009, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's fine.", + "original_text": "That's fine.", + "start_time": 39.413689513238914, + "end_time": 40.249607880585856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_11_B.wav", + "silence_duration": 0.32132709209494686, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Your name, please.", + "original_text": "Your name, please.", + "start_time": 40.68113606512379, + "end_time": 41.85374377487435, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_12_A.wav", + "silence_duration": 0.4315281845379347, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "BASIL, Basil. How much is the", + "original_text": "BASIL, Basil. How much is the [interrupt] ticket including all taxes and fees? I'd also like to know if there are any baggage restrictions we should be aware of before booking.", + "start_time": 42.39965617065533, + "end_time": 51.59475821147166, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_13_B.wav", + "silence_duration": 0.5459123957809766, + "is_interrupted": true, + "text_after_interrupt": "ticket including all taxes and fees? I'd also like to know if there are any baggage restrictions we should be aware of before booking." + }, + { + "speaker": "A", + "text": "Sorry, I missed that—was it B-A-S-I-L?", + "original_text": "Sorry, I missed that—was it B-A-S-I-L?", + "start_time": 50.13083505648509, + "end_time": 53.64865818573679, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_14_A.wav", + "silence_duration": 0.4295904033651031, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that's correct. How much is the ticket?", + "original_text": "Yes, that's correct. How much is the ticket?", + "start_time": 53.95824836573616, + "end_time": 56.90718260609897, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--49/temp/line_15_B.wav", + "silence_duration": 0.30959017999937155, + "is_interrupted": false + } + ] + }, + "DialogSum--val--50": { + "original_text": "A: Hong, it seems like you really struggle to learn English, is this level too hard for [interrupt] you, or is it something else that's making it difficult? Maybe we should discuss specific areas where you feel particularly challenged so we can tailor the lessons better to your needs.\nB: I don't know. I think it's just boring. I don't like the workbooks because the lessons talk about baby things. I'm not a little child. I want to learn something more exciting. \nA: Hmm, I have an idea that you'll like. This week, you can do a special project for your English class that will be more engaging and fun for you. \nB: Oh, what's that? \nA: I want you to watch some YouTube videos of people speaking in different English accents. I'll send you the links for the ones you should watch, they're very funny. One person does about 30 different accents in 10 minutes. \nB: Wow, that's great, but, won't it be harder for me to learn English if I'm listening to so many different ways of speaking the language? \nA: It shouldn't, this is just a fun project to help you get more interested in the lessons. There is a more serious side to it, though. I want you to write a one page essay about the videos and tell the class about your project on Friday. You can show some of the videos during your presentation too if you like. I think the whole class will benefit from this. \nB: I can't wait to get started. Thank you, Miss Winters. By the way, what was the special project you mentioned earlier before I interrupted? \nA: Oh, that was the project I just explained—watching the videos and preparing the essay and presentation. I'm glad you're excited about it!", + "cleaned_text": "A:Hong, it seems like you really struggle to learn English, is this level too hard for you, or is it something else that's making it difficult? Maybe we should discuss specific areas where you feel particularly challenged so we can tailor the lessons better to your needs.\nB: I don't know. I think it's just boring. I don't like the workbooks because the lessons talk about baby things. I'm not a little child. I want to learn something more exciting. \nA: Hmm, I have an idea that you'll like. This week, you can do a special project for your English class that will be more engaging and fun for you. \nB: Oh, what's that? \nA: I want you to watch some YouTube videos of people speaking in different English accents. I'll send you the links for the ones you should watch, they're very funny. One person does about 30 different accents in 10 minutes. \nB: Wow, that's great, but, won't it be harder for me to learn English if I'm listening to so many different ways of speaking the language? \nA: It shouldn't, this is just a fun project to help you get more interested in the lessons. There is a more serious side to it, though. I want you to write a one page essay about the videos and tell the class about your project on Friday. You can show some of the videos during your presentation too if you like. I think the whole class will benefit from this. \nB: I can't wait to get started. Thank you, Miss Winters. By the way, what was the special project you mentioned earlier before I interrupted? \nA: Oh, that was the project I just explained—watching the videos and preparing the essay and presentation. I'm glad you're excited about it!", + "total_duration": 83.02598639455782, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hong, it seems like you really struggle to learn English, is this level too hard for", + "original_text": "Hong, it seems like you really struggle to learn English, is this level too hard for [interrupt] you, or is it something else that's making it difficult? Maybe we should discuss specific areas where you feel particularly challenged so we can tailor the lessons better to your needs.", + "start_time": 0, + "end_time": 15.696689342403628, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "you, or is it something else that's making it difficult? Maybe we should discuss specific areas where you feel particularly challenged so we can tailor the lessons better to your needs." + }, + { + "speaker": "B", + "text": "I don't know. I think it's just boring. I don't like the workbooks because the lessons talk about baby things. I'm not a little child. I want to learn something more exciting.", + "original_text": "I don't know. I think it's just boring. I don't like the workbooks because the lessons talk about baby things. I'm not a little child. I want to learn something more exciting.", + "start_time": 6.095238095238095, + "end_time": 15.034920634920635, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_1_B.wav", + "silence_duration": 0.47931796006555816, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hmm, I have an idea that you'll like. This week, you can do a special project for your English class that will be more engaging and fun for you.", + "original_text": "Hmm, I have an idea that you'll like. This week, you can do a special project for your English class that will be more engaging and fun for you.", + "start_time": 16.27512188210536, + "end_time": 23.84482709752486, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_2_A.wav", + "silence_duration": 0.5784325397017325, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, what's that?", + "original_text": "Oh, what's that?", + "start_time": 24.151472985637316, + "end_time": 24.9409514436872, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_3_B.wav", + "silence_duration": 0.30664588811245613, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I want you to watch some YouTube videos of people speaking in different English accents. I'll send you the links for the ones you should watch, they're very funny. One person does about 30 different accents in 10 minutes.", + "original_text": "I want you to watch some YouTube videos of people speaking in different English accents. I'll send you the links for the ones you should watch, they're very funny. One person does about 30 different accents in 10 minutes.", + "start_time": 25.41830077406898, + "end_time": 38.13122594413701, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_4_A.wav", + "silence_duration": 0.4773493303817806, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wow, that's great, but, won't it be harder for me to learn English if I'm listening to so many different ways of speaking the language?", + "original_text": "Wow, that's great, but, won't it be harder for me to learn English if I'm listening to so many different ways of speaking the language?", + "start_time": 38.657931774697445, + "end_time": 45.333668736148695, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_5_B.wav", + "silence_duration": 0.5267058305604386, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It shouldn't, this is just a fun project to help you get more interested in the lessons. There is a more serious side to it, though. I want you to write a one page essay about the videos and tell the class about your project on Friday. You can show some of the videos during your presentation too if you like. I think the whole class will benefit from this.", + "original_text": "It shouldn't, this is just a fun project to help you get more interested in the lessons. There is a more serious side to it, though. I want you to write a one page essay about the videos and tell the class about your project on Friday. You can show some of the videos during your presentation too if you like. I think the whole class will benefit from this.", + "start_time": 45.92929484127387, + "end_time": 66.78081411565029, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_6_A.wav", + "silence_duration": 0.5956261051251739, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I can't wait to get started. Thank you, Miss Winters. By the way, what was the special project you mentioned earlier before I interrupted?", + "original_text": "I can't wait to get started. Thank you, Miss Winters. By the way, what was the special project you mentioned earlier before I interrupted?", + "start_time": 67.15814629282762, + "end_time": 73.81066329963035, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_7_B.wav", + "silence_duration": 0.37733217717733625, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that was the project I just explained—watching the videos and preparing the essay and presentation. I'm glad you're excited about it!", + "original_text": "Oh, that was the project I just explained—watching the videos and preparing the essay and presentation. I'm glad you're excited about it!", + "start_time": 74.27207021795644, + "end_time": 83.02599312045078, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--50/temp/line_8_A.wav", + "silence_duration": 0.4614069183260868, + "is_interrupted": false + } + ] + }, + "DialogSum--val--51": { + "original_text": "A: Have any plans for the weekend, Tom? \nB: Yeah, I'm going for a hike in the southern Rocky [interrupt] Mountains near the Maroon Bells area, which is known for its stunning alpine scenery and crystal-clear lakes that reflect the surrounding peaks perfectly. I've been looking forward to it for weeks. \nA: Oh, do you go hiking often? \nB: I go as much as I can. I love hiking because you can really get in touch with nature. \nA: It would be nice to get out of the city. Do you want some company? \nB: Sure. But, it will be a long hike, 30 miles in three days. Have you been hiking [interrupt] that distance before through challenging terrain with significant elevation changes? It's quite a challenge, but definitely worth it for the breathtaking views and sense of accomplishment. \nA: Before? Yeah, I go a lot too. I saw a bear and a mountain lion on my last hike. \nB: Wow! You must have been pretty far away from the city. \nA: Yeah, my friend and I hiked in a very wild part of the national forest. By the way, you mentioned the southern Rocky—where exactly are you planning to hike? \nB: Oh, right! I was going to say, we're heading to the Maroon Bells area. It's supposed to be beautiful this time of year. \nA: That sounds amazing. Well, bring your friend along too. We'll have a great time this weekend.", + "cleaned_text": "A: Have any plans for the weekend, Tom? \nB:Yeah, I'm going for a hike in the southern Rocky Mountains near the Maroon Bells area, which is known for its stunning alpine scenery and crystal-clear lakes that reflect the surrounding peaks perfectly. I've been looking forward to it for weeks.\nA: Oh, do you go hiking often? \nB: I go as much as I can. I love hiking because you can really get in touch with nature. \nA: It would be nice to get out of the city. Do you want some company? \nB:Sure. But, it will be a long hike, 30 miles in three days. Have you been hiking that distance before through challenging terrain with significant elevation changes? It's quite a challenge, but definitely worth it for the breathtaking views and sense of accomplishment.\nA: Before? Yeah, I go a lot too. I saw a bear and a mountain lion on my last hike. \nB: Wow! You must have been pretty far away from the city. \nA: Yeah, my friend and I hiked in a very wild part of the national forest. By the way, you mentioned the southern Rocky—where exactly are you planning to hike? \nB: Oh, right! I was going to say, we're heading to the Maroon Bells area. It's supposed to be beautiful this time of year. \nA: That sounds amazing. Well, bring your friend along too. We'll have a great time this weekend.", + "total_duration": 63.990975056689344, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have any plans for the weekend, Tom?", + "original_text": "Have any plans for the weekend, Tom?", + "start_time": 0, + "end_time": 2.2291156462585033, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I'm going for a hike in the southern Rocky", + "original_text": "Yeah, I'm going for a hike in the southern Rocky [interrupt] Mountains near the Maroon Bells area, which is known for its stunning alpine scenery and crystal-clear lakes that reflect the surrounding peaks perfectly. I've been looking forward to it for weeks.", + "start_time": 2.6132211271668746, + "end_time": 15.105556728073903, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_1_B.wav", + "silence_duration": 0.3841054809083714, + "is_interrupted": true, + "text_after_interrupt": "Mountains near the Maroon Bells area, which is known for its stunning alpine scenery and crystal-clear lakes that reflect the surrounding peaks perfectly. I've been looking forward to it for weeks." + }, + { + "speaker": "A", + "text": "Oh, do you go hiking often?", + "original_text": "Oh, do you go hiking often?", + "start_time": 5.086146297234902, + "end_time": 7.303651966169142, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_2_A.wav", + "silence_duration": 0.5741264921513703, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I go as much as I can. I love hiking because you can really get in touch with nature.", + "original_text": "I go as much as I can. I love hiking because you can really get in touch with nature.", + "start_time": 15.574968703914827, + "end_time": 19.870660313892152, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_3_B.wav", + "silence_duration": 0.46941197584092414, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It would be nice to get out of the city. Do you want some company?", + "original_text": "It would be nice to get out of the city. Do you want some company?", + "start_time": 20.446869664095818, + "end_time": 24.022742679968832, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_4_A.wav", + "silence_duration": 0.5762093502036648, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. But, it will be a long hike, 30 miles in three days. Have you been hiking", + "original_text": "Sure. But, it will be a long hike, 30 miles in three days. Have you been hiking [interrupt] that distance before through challenging terrain with significant elevation changes? It's quite a challenge, but definitely worth it for the breathtaking views and sense of accomplishment.", + "start_time": 24.575293989543717, + "end_time": 38.70463639317184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_5_B.wav", + "silence_duration": 0.5525513095748845, + "is_interrupted": true, + "text_after_interrupt": "that distance before through challenging terrain with significant elevation changes? It's quite a challenge, but definitely worth it for the breathtaking views and sense of accomplishment." + }, + { + "speaker": "A", + "text": "Before? Yeah, I go a lot too. I saw a bear and a mountain lion on my last hike.", + "original_text": "Before? Yeah, I go a lot too. I saw a bear and a mountain lion on my last hike.", + "start_time": 31.81753892865165, + "end_time": 37.309058203028066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_6_A.wav", + "silence_duration": 0.3239279205937702, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wow! You must have been pretty far away from the city.", + "original_text": "Wow! You must have been pretty far away from the city.", + "start_time": 39.06459085499585, + "end_time": 42.036745050007184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_7_B.wav", + "silence_duration": 0.3599544618240123, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, my friend and I hiked in a very wild part of the national forest. By the way, you mentioned the southern Rocky—where exactly are you planning to hike?", + "original_text": "Yeah, my friend and I hiked in a very wild part of the national forest. By the way, you mentioned the southern Rocky—where exactly are you planning to hike?", + "start_time": 42.37353910564037, + "end_time": 51.45254137321406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_8_A.wav", + "silence_duration": 0.3367940556331843, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! I was going to say, we're heading to the Maroon Bells area. It's supposed to be beautiful this time of year.", + "original_text": "Oh, right! I was going to say, we're heading to the Maroon Bells area. It's supposed to be beautiful this time of year.", + "start_time": 52.005674725743575, + "end_time": 58.15896270760298, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_9_B.wav", + "silence_duration": 0.5531333525295141, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds amazing. Well, bring your friend along too. We'll have a great time this weekend.", + "original_text": "That sounds amazing. Well, bring your friend along too. We'll have a great time this weekend.", + "start_time": 58.754910166849164, + "end_time": 63.99100994009179, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--51/temp/line_10_A.wav", + "silence_duration": 0.5959474592461822, + "is_interrupted": false + } + ] + }, + "DialogSum--val--52": { + "original_text": "A: I've got an idea. Let's make this game even more [interrupt] challenging by adding some unexpected twists to the rules that will really test our knowledge and creativity under pressure. \nB: How? Do you want to play strip-trivia or something? \nA: Well, if you want to! Seriously, though, let's make a bet. \nB: A bet? Why don't we just make it a friendly competition without any pressure, just for fun and see who comes out on top after several rounds of increasingly difficult questions? \nA: Wait, hear me out. The bet could make it more exciting! Maybe something small, like the loser buys dinner? \nB: Alright, that sounds fair. But I was going to say, why not just keep it light-hearted? No need for high stakes.", + "cleaned_text": "A:I've got an idea. Let's make this game even more challenging by adding some unexpected twists to the rules that will really test our knowledge and creativity under pressure.\nB: How? Do you want to play strip-trivia or something? \nA: Well, if you want to! Seriously, though, let's make a bet. \nB: A bet? Why don't we just make it a friendly competition without any pressure, just for fun and see who comes out on top after several rounds of increasingly difficult questions? \nA: Wait, hear me out. The bet could make it more exciting! Maybe something small, like the loser buys dinner? \nB: Alright, that sounds fair. But I was going to say, why not just keep it light-hearted? No need for high stakes.", + "total_duration": 38.07310657596372, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I've got an idea. Let's make this game even more", + "original_text": "I've got an idea. Let's make this game even more [interrupt] challenging by adding some unexpected twists to the rules that will really test our knowledge and creativity under pressure.", + "start_time": 0, + "end_time": 10.170340136054422, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "challenging by adding some unexpected twists to the rules that will really test our knowledge and creativity under pressure." + }, + { + "speaker": "B", + "text": "How? Do you want to play strip-trivia or something?", + "original_text": "How? Do you want to play strip-trivia or something?", + "start_time": 3.308843537414966, + "end_time": 6.025578231292517, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/temp/line_1_B.wav", + "silence_duration": 0.36924909020389574, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, if you want to! Seriously, though, let's make a bet.", + "original_text": "Well, if you want to! Seriously, though, let's make a bet.", + "start_time": 10.638276306763013, + "end_time": 14.272199209257344, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/temp/line_2_A.wav", + "silence_duration": 0.46793617070859, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "A bet? Why don't we just make it a friendly competition without any pressure, just for fun and see who comes out on top after several rounds of increasingly difficult questions?", + "original_text": "A bet? Why don't we just make it a friendly competition without any pressure, just for fun and see who comes out on top after several rounds of increasingly difficult questions?", + "start_time": 14.799751668734428, + "end_time": 23.658164367147126, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/temp/line_3_B.wav", + "silence_duration": 0.5275524594770846, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, hear me out. The bet could make it more exciting! Maybe something small, like the loser buys dinner?", + "original_text": "Wait, hear me out. The bet could make it more exciting! Maybe something small, like the loser buys dinner?", + "start_time": 24.11103095580573, + "end_time": 31.36726678347013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/temp/line_4_A.wav", + "silence_duration": 0.45286658865860524, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Alright, that sounds fair. But I was going to say, why not just keep it light-hearted? No need for high stakes.", + "original_text": "Alright, that sounds fair. But I was going to say, why not just keep it light-hearted? No need for high stakes.", + "start_time": 31.780534142578485, + "end_time": 38.07314185232905, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--52/temp/line_5_B.wav", + "silence_duration": 0.41326735910835627, + "is_interrupted": false + } + ] + }, + "DialogSum--val--53": { + "original_text": "A: Here is your spicy diced chicken with peanuts, sir. \nB: Thank you. It looks very appetizing. I can't wait to dig in. \nA: I would advise you to enjoy the dish while it is hot. \nB: Tasty and tender! It must be one of the famous local dishes. \nA: Yes. It's a traditional dish. \nB: And it must be very particular in cooking. \nA: You are right, sir. To prepare it, a Sichuan food chef first fries some chilli until they turn reddish [interrupt] brown, which gives the dish its distinctive aroma and heat, then carefully balances the flavors with Sichuan peppercorns and other secret spices that create that signature numbing sensation. \nB: Oh, I was just wondering, is this dish typically very spicy? I'm curious about the level of heat. \nA: Yes, it can be quite spicy, but the spiciness can be adjusted to taste. By the way, I was mentioning that the chilli is fried until it turns reddish brown, and then the diced chicken breast meat is added to the pot with other condiments and peanuts. That's why the dish has a bright colour. \nB: I see.", + "cleaned_text": "A: Here is your spicy diced chicken with peanuts, sir. \nB: Thank you. It looks very appetizing. I can't wait to dig in. \nA: I would advise you to enjoy the dish while it is hot. \nB: Tasty and tender! It must be one of the famous local dishes. \nA: Yes. It's a traditional dish. \nB: And it must be very particular in cooking. \nA:You are right, sir. To prepare it, a Sichuan food chef first fries some chilli until they turn reddish brown, which gives the dish its distinctive aroma and heat, then carefully balances the flavors with Sichuan peppercorns and other secret spices that create that signature numbing sensation.\nB: Oh, I was just wondering, is this dish typically very spicy? I'm curious about the level of heat. \nA: Yes, it can be quite spicy, but the spiciness can be adjusted to taste. By the way, I was mentioning that the chilli is fried until it turns reddish brown, and then the diced chicken breast meat is added to the pot with other condiments and peanuts. That's why the dish has a bright colour. \nB: I see.", + "total_duration": 57.85886621315193, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Here is your spicy diced chicken with peanuts, sir.", + "original_text": "Here is your spicy diced chicken with peanuts, sir.", + "start_time": 0, + "end_time": 2.972154195011338, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you. It looks very appetizing. I can't wait to dig in.", + "original_text": "Thank you. It looks very appetizing. I can't wait to dig in.", + "start_time": 3.541131110477001, + "end_time": 6.7106549200008105, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_1_B.wav", + "silence_duration": 0.5689769154656628, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I would advise you to enjoy the dish while it is hot.", + "original_text": "I would advise you to enjoy the dish while it is hot.", + "start_time": 7.298441783023925, + "end_time": 10.456355615223472, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_2_A.wav", + "silence_duration": 0.5877868630231142, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Tasty and tender! It must be one of the famous local dishes.", + "original_text": "Tasty and tender! It must be one of the famous local dishes.", + "start_time": 11.026839996758014, + "end_time": 14.544663126009715, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_3_B.wav", + "silence_duration": 0.5704843815345418, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes. It's a traditional dish.", + "original_text": "Yes. It's a traditional dish.", + "start_time": 15.096658395598572, + "end_time": 17.708903293557757, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_4_A.wav", + "silence_duration": 0.5519952695888574, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "And it must be very particular in cooking.", + "original_text": "And it must be very particular in cooking.", + "start_time": 18.230185668046992, + "end_time": 20.180661858523184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_5_B.wav", + "silence_duration": 0.5212823744892369, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You are right, sir. To prepare it, a Sichuan food chef first fries some chilli until they turn reddish", + "original_text": "You are right, sir. To prepare it, a Sichuan food chef first fries some chilli until they turn reddish [interrupt] brown, which gives the dish its distinctive aroma and heat, then carefully balances the flavors with Sichuan peppercorns and other secret spices that create that signature numbing sensation.", + "start_time": 20.66922214731486, + "end_time": 39.28001579810851, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_6_A.wav", + "silence_duration": 0.48856028879167546, + "is_interrupted": true, + "text_after_interrupt": "brown, which gives the dish its distinctive aroma and heat, then carefully balances the flavors with Sichuan peppercorns and other secret spices that create that signature numbing sensation." + }, + { + "speaker": "B", + "text": "Oh, I was just wondering, is this dish typically very spicy? I'm curious about the level of heat.", + "original_text": "Oh, I was just wondering, is this dish typically very spicy? I'm curious about the level of heat.", + "start_time": 27.42622895003595, + "end_time": 33.08028790695205, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_7_B.wav", + "silence_duration": 0.46829681593202, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it can be quite spicy, but the spiciness can be adjusted to taste. By the way, I was mentioning that the chilli is fried until it turns reddish brown, and then the diced chicken breast meat is added to the pot with other condiments and peanuts. That's why the dish has a bright colour.", + "original_text": "Yes, it can be quite spicy, but the spiciness can be adjusted to taste. By the way, I was mentioning that the chilli is fried until it turns reddish brown, and then the diced chicken breast meat is added to the pot with other condiments and peanuts. That's why the dish has a bright colour.", + "start_time": 39.72198832256778, + "end_time": 56.95119467177413, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_8_A.wav", + "silence_duration": 0.4419725244592773, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see.", + "original_text": "I see.", + "start_time": 57.26678583039755, + "end_time": 57.85889467393497, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--53/temp/line_9_B.wav", + "silence_duration": 0.31559115862341613, + "is_interrupted": false + } + ] + }, + "DialogSum--val--54": { + "original_text": "A: So what's wrong with the drain? \nB: It's clogged and water won't go [interrupt] down at all despite trying multiple methods like using a plunger and pouring hot water down the pipes. I tried running the tap for a while, but nothing seems to be moving. \nA: Wait, is it completely blocked, or is the water just draining slowly? \nB: It's completely blocked. Let me take a look. You know why? It's clogged with hair. No wonder water won't go down. \nA: Well, I guess people who lived here before didn't clean the drain regularly, which probably caused a buildup over time. \nB: Oh, speaking of the previous tenants, do you know how long they lived here? Maybe they neglected maintenance for a while. \nA: I'm not sure, but considering this mess, it seems likely. Anyway, what should I do now? \nB: Don't worry. I've got some acid here. It will help dissolve the hair down there. \nA: Ur, it stinks!", + "cleaned_text": "A: So what's wrong with the drain? \nB:It's clogged and water won't go down at all despite trying multiple methods like using a plunger and pouring hot water down the pipes. I tried running the tap for a while, but nothing seems to be moving.\nA: Wait, is it completely blocked, or is the water just draining slowly? \nB: It's completely blocked. Let me take a look. You know why? It's clogged with hair. No wonder water won't go down. \nA: Well, I guess people who lived here before didn't clean the drain regularly, which probably caused a buildup over time. \nB: Oh, speaking of the previous tenants, do you know how long they lived here? Maybe they neglected maintenance for a while. \nA: I'm not sure, but considering this mess, it seems likely. Anyway, what should I do now? \nB: Don't worry. I've got some acid here. It will help dissolve the hair down there. \nA: Ur, it stinks!", + "total_duration": 45.37655328798186, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So what's wrong with the drain?", + "original_text": "So what's wrong with the drain?", + "start_time": 0, + "end_time": 1.6950566893424037, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's clogged and water won't go", + "original_text": "It's clogged and water won't go [interrupt] down at all despite trying multiple methods like using a plunger and pouring hot water down the pipes. I tried running the tap for a while, but nothing seems to be moving.", + "start_time": 2.025498933427085, + "end_time": 12.416428638642506, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_1_B.wav", + "silence_duration": 0.3304422440846815, + "is_interrupted": true, + "text_after_interrupt": "down at all despite trying multiple methods like using a plunger and pouring hot water down the pipes. I tried running the tap for a while, but nothing seems to be moving." + }, + { + "speaker": "A", + "text": "Wait, is it completely blocked, or is the water just draining slowly?", + "original_text": "Wait, is it completely blocked, or is the water just draining slowly?", + "start_time": 3.6741157134724367, + "end_time": 8.35293657515044, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_2_A.wav", + "silence_duration": 0.49990833695715586, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's completely blocked. Let me take a look. You know why? It's clogged with hair. No wonder water won't go down.", + "original_text": "It's completely blocked. Let me take a look. You know why? It's clogged with hair. No wonder water won't go down.", + "start_time": 12.726875819595758, + "end_time": 18.520254504403013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_3_B.wav", + "silence_duration": 0.310447180953253, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I guess people who lived here before didn't clean the drain regularly, which probably caused a buildup over time.", + "original_text": "Well, I guess people who lived here before didn't clean the drain regularly, which probably caused a buildup over time.", + "start_time": 18.845643901661578, + "end_time": 25.60265070438267, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_4_A.wav", + "silence_duration": 0.3253893972585634, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, speaking of the previous tenants, do you know how long they lived here? Maybe they neglected maintenance for a while.", + "original_text": "Oh, speaking of the previous tenants, do you know how long they lived here? Maybe they neglected maintenance for a while.", + "start_time": 26.1090116513151, + "end_time": 32.587378998253875, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_5_B.wav", + "silence_duration": 0.5063609469324324, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm not sure, but considering this mess, it seems likely. Anyway, what should I do now?", + "original_text": "I'm not sure, but considering this mess, it seems likely. Anyway, what should I do now?", + "start_time": 33.09236625900214, + "end_time": 38.63032544267561, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_6_A.wav", + "silence_duration": 0.5049872607482656, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't worry. I've got some acid here. It will help dissolve the hair down there.", + "original_text": "Don't worry. I've got some acid here. It will help dissolve the hair down there.", + "start_time": 39.11625259200401, + "end_time": 43.075254859577704, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_7_B.wav", + "silence_duration": 0.48592714932839653, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ur, it stinks!", + "original_text": "Ur, it stinks!", + "start_time": 43.437713658709086, + "end_time": 45.37657987186101, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--54/temp/line_8_A.wav", + "silence_duration": 0.3624587991313803, + "is_interrupted": false + } + ] + }, + "DialogSum--val--55": { + "original_text": "A: Then when at the earliest can we expect the [interrupt] shipment to be ready so that we can meet our deadlines? We've been receiving numerous inquiries from our clients and they're getting increasingly anxious about potential delays in their supply chains.\nB: Sorry to jump in, but I really need to know—what's causing the delay? Is it a production issue or something else?\nA: It's mainly a production issue. Our manufacturers are currently at full capacity. But I was going to say, the earliest we can manage is by the middle of October.\nB: It's too late. You see, in our market, October is the season for this kind of commodity. So the goods must be shipped before October, or we won't be ready for the season.\nA: Well, considering our long-standing good business relationship, we'll try hard to negotiate with our manufacturers for an earlier delivery.\nB: Thanks. Then may I suggest that you put down in the contract 'shipment on September 15 or earlier'?\nA: Let me see. Now the workers will have to work on three shifts for it. Well, we can manage it on the 20th of September. That's the best we can do.", + "cleaned_text": "A:Then when at the earliest can we expect the shipment to be ready so that we can meet our deadlines? We've been receiving numerous inquiries from our clients and they're getting increasingly anxious about potential delays in their supply chains.\nB: Sorry to jump in, but I really need to know—what's causing the delay? Is it a production issue or something else?\nA: It's mainly a production issue. Our manufacturers are currently at full capacity. But I was going to say, the earliest we can manage is by the middle of October.\nB: It's too late. You see, in our market, October is the season for this kind of commodity. So the goods must be shipped before October, or we won't be ready for the season.\nA: Well, considering our long-standing good business relationship, we'll try hard to negotiate with our manufacturers for an earlier delivery.\nB: Thanks. Then may I suggest that you put down in the contract 'shipment on September 15 or earlier'?\nA: Let me see. Now the workers will have to work on three shifts for it. Well, we can manage it on the 20th of September. That's the best we can do.", + "total_duration": 56.46503401360544, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Then when at the earliest can we expect the", + "original_text": "Then when at the earliest can we expect the [interrupt] shipment to be ready so that we can meet our deadlines? We've been receiving numerous inquiries from our clients and they're getting increasingly anxious about potential delays in their supply chains.", + "start_time": 0, + "end_time": 13.548843537414966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "shipment to be ready so that we can meet our deadlines? We've been receiving numerous inquiries from our clients and they're getting increasingly anxious about potential delays in their supply chains." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but I really need to know—what's causing the delay? Is it a production issue or something else?", + "original_text": "Sorry to jump in, but I really need to know—what's causing the delay? Is it a production issue or something else?", + "start_time": 2.36843537414966, + "end_time": 7.662585034013606, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/temp/line_1_B.wav", + "silence_duration": 0.5321966404448916, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's mainly a production issue. Our manufacturers are currently at full capacity. But I was going to say, the earliest we can manage is by the middle of October.", + "original_text": "It's mainly a production issue. Our manufacturers are currently at full capacity. But I was going to say, the earliest we can manage is by the middle of October.", + "start_time": 13.912534955657158, + "end_time": 24.001605250441738, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/temp/line_2_A.wav", + "silence_duration": 0.36369141824219153, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's too late. You see, in our market, October is the season for this kind of commodity. So the goods must be shipped before October, or we won't be ready for the season.", + "original_text": "It's too late. You see, in our market, October is the season for this kind of commodity. So the goods must be shipped before October, or we won't be ready for the season.", + "start_time": 24.345414717590003, + "end_time": 33.13416755205712, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/temp/line_3_B.wav", + "silence_duration": 0.34380946714826643, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, considering our long-standing good business relationship, we'll try hard to negotiate with our manufacturers for an earlier delivery.", + "original_text": "Well, considering our long-standing good business relationship, we'll try hard to negotiate with our manufacturers for an earlier delivery.", + "start_time": 33.542193578446984, + "end_time": 41.32087838570322, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/temp/line_4_A.wav", + "silence_duration": 0.4080260263898594, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks. Then may I suggest that you put down in the contract 'shipment on September 15 or earlier'?", + "original_text": "Thanks. Then may I suggest that you put down in the contract 'shipment on September 15 or earlier'?", + "start_time": 41.89214408514111, + "end_time": 47.66230281529984, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/temp/line_5_B.wav", + "silence_duration": 0.5712656994378922, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let me see. Now the workers will have to work on three shifts for it. Well, we can manage it on the 20th of September. That's the best we can do.", + "original_text": "Let me see. Now the workers will have to work on three shifts for it. Well, we can manage it on the 20th of September. That's the best we can do.", + "start_time": 48.18714737882304, + "end_time": 56.46506121102259, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--55/temp/line_6_A.wav", + "silence_duration": 0.5248445635232057, + "is_interrupted": false + } + ] + }, + "DialogSum--val--56": { + "original_text": "A: Mr. Brown, are your children always kicking up a row like this? I cannot concentrate on my [interrupt] work with all this noise, and it's becoming quite a challenge to stay focused especially when I have important deadlines approaching and need complete silence to think clearly. \nB: Sorry to interrupt, Mr. Black, but I'm already trying to make them quiet. They should calm down soon. \nA: I appreciate that, but I'm afraid if the noise goes on, I shall have no alternative but to speak to the building management about this issue, as it's affecting my productivity. \nB: Please, sir, just give me a moment. Believe me, everything will be all right.", + "cleaned_text": "A:Mr. Brown, are your children always kicking up a row like this? I cannot concentrate on my work with all this noise, and it's becoming quite a challenge to stay focused especially when I have important deadlines approaching and need complete silence to think clearly.\nB: Sorry to interrupt, Mr. Black, but I'm already trying to make them quiet. They should calm down soon. \nA: I appreciate that, but I'm afraid if the noise goes on, I shall have no alternative but to speak to the building management about this issue, as it's affecting my productivity. \nB: Please, sir, just give me a moment. Believe me, everything will be all right.", + "total_duration": 29.797414965986395, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--56/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--56/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--56/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Mr. Brown, are your children always kicking up a row like this? I cannot concentrate on my", + "original_text": "Mr. Brown, are your children always kicking up a row like this? I cannot concentrate on my [interrupt] work with all this noise, and it's becoming quite a challenge to stay focused especially when I have important deadlines approaching and need complete silence to think clearly.", + "start_time": 0, + "end_time": 15.09297052154195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--56/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "work with all this noise, and it's becoming quite a challenge to stay focused especially when I have important deadlines approaching and need complete silence to think clearly." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, Mr. Black, but I'm already trying to make them quiet. They should calm down soon.", + "original_text": "Sorry to interrupt, Mr. Black, but I'm already trying to make them quiet. They should calm down soon.", + "start_time": 6.292607709750567, + "end_time": 11.470657596371883, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--56/temp/line_1_B.wav", + "silence_duration": 0.35579376064291285, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I appreciate that, but I'm afraid if the noise goes on, I shall have no alternative but to speak to the building management about this issue, as it's affecting my productivity.", + "original_text": "I appreciate that, but I'm afraid if the noise goes on, I shall have no alternative but to speak to the building management about this issue, as it's affecting my productivity.", + "start_time": 15.4155378733413, + "end_time": 26.154766898284613, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--56/temp/line_2_A.wav", + "silence_duration": 0.3225673517993499, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Please, sir, just give me a moment. Believe me, everything will be all right.", + "original_text": "Please, sir, just give me a moment. Believe me, everything will be all right.", + "start_time": 26.500222186005796, + "end_time": 29.7974557460965, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--56/temp/line_3_B.wav", + "silence_duration": 0.34545528772118467, + "is_interrupted": false + } + ] + }, + "DialogSum--val--57": { + "original_text": "A: I don't understand why some parents keep beefing and complaining about their daughters not being able to follow [interrupt] their own expectations or societal norms without considering how much pressure this puts on young women who are just trying to find their own way in life.\nB: Sorry to cut in, but speaking of complaints, do you know if Li Na's mother has always been so harsh on her, or did it start after her neighbor's daughter got married to that Canadian?\nA: It's definitely gotten worse since the neighbor's daughter got married. Li Na's mother has been building a fire under her ever since. She's almost driving Li Na crazy. But you mentioned something earlier—what do you think Li Na would do in this situation?\nB: If I were Li Na, I would ask her if she had done that.\nA: Well, Li Na is as meek as a lamb. She never goes against anyone or anything. She's as good as gold, you know?", + "cleaned_text": "A:I don't understand why some parents keep beefing and complaining about their daughters not being able to follow their own expectations or societal norms without considering how much pressure this puts on young women who are just trying to find their own way in life.\nB: Sorry to cut in, but speaking of complaints, do you know if Li Na's mother has always been so harsh on her, or did it start after her neighbor's daughter got married to that Canadian?\nA: It's definitely gotten worse since the neighbor's daughter got married. Li Na's mother has been building a fire under her ever since. She's almost driving Li Na crazy. But you mentioned something earlier—what do you think Li Na would do in this situation?\nB: If I were Li Na, I would ask her if she had done that.\nA: Well, Li Na is as meek as a lamb. She never goes against anyone or anything. She's as good as gold, you know?", + "total_duration": 41.68512471655329, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I don't understand why some parents keep beefing and complaining about their daughters not being able to follow", + "original_text": "I don't understand why some parents keep beefing and complaining about their daughters not being able to follow [interrupt] their own expectations or societal norms without considering how much pressure this puts on young women who are just trying to find their own way in life.", + "start_time": 0, + "end_time": 14.895600907029479, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "their own expectations or societal norms without considering how much pressure this puts on young women who are just trying to find their own way in life." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but speaking of complaints, do you know if Li Na's mother has always been so harsh on her, or did it start after her neighbor's daughter got married to that Canadian?", + "original_text": "Sorry to cut in, but speaking of complaints, do you know if Li Na's mother has always been so harsh on her, or did it start after her neighbor's daughter got married to that Canadian?", + "start_time": 6.048798185941043, + "end_time": 15.243900226757368, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/temp/line_1_B.wav", + "silence_duration": 0.41373862336673844, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's definitely gotten worse since the neighbor's daughter got married. Li Na's mother has been building a fire under her ever since. She's almost driving Li Na crazy. But you mentioned something earlier—what do you think Li Na would do in this situation?", + "original_text": "It's definitely gotten worse since the neighbor's daughter got married. Li Na's mother has been building a fire under her ever since. She's almost driving Li Na crazy. But you mentioned something earlier—what do you think Li Na would do in this situation?", + "start_time": 15.707215772556575, + "end_time": 31.136875636502154, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/temp/line_2_A.wav", + "silence_duration": 0.46331554579920686, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If I were Li Na, I would ask her if she had done that.", + "original_text": "If I were Li Na, I would ask her if she had done that.", + "start_time": 31.43707664974463, + "end_time": 33.7706820919215, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/temp/line_3_B.wav", + "silence_duration": 0.3002010132424738, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, Li Na is as meek as a lamb. She never goes against anyone or anything. She's as good as gold, you know?", + "original_text": "Well, Li Na is as meek as a lamb. She never goes against anyone or anything. She's as good as gold, you know?", + "start_time": 34.17350341385876, + "end_time": 41.685158742656945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--57/temp/line_4_A.wav", + "silence_duration": 0.4028213219372632, + "is_interrupted": false + } + ] + }, + "DialogSum--val--58": { + "original_text": "A: How do you like these dishes? \nB: Fine, they are colorful and [interrupt] full of vibrant flavors that I really appreciate, especially the way the spices complement each other without overpowering the natural taste of the ingredients. \nA: Sorry to jump in, but I'm curious—did you find the flavors balanced? \nB: Yes, they are tasty. I really enjoyed the dinner. I have never tasted anything like this. \nA: I'm glad to hear that! Would you like some more rice? \nB: No, thanks. I'm full. \nA: Another piece of meat pie? \nB: No, thanks. I'm on a diet. But I was wondering, what dessert options do you have? \nA: How about some ice cream? \nB: Ice cream, please.", + "cleaned_text": "A: How do you like these dishes? \nB:Fine, they are colorful and full of vibrant flavors that I really appreciate, especially the way the spices complement each other without overpowering the natural taste of the ingredients.\nA: Sorry to jump in, but I'm curious—did you find the flavors balanced? \nB: Yes, they are tasty. I really enjoyed the dinner. I have never tasted anything like this. \nA: I'm glad to hear that! Would you like some more rice? \nB: No, thanks. I'm full. \nA: Another piece of meat pie? \nB: No, thanks. I'm on a diet. But I was wondering, what dessert options do you have? \nA: How about some ice cream? \nB: Ice cream, please.", + "total_duration": 33.0356462585034, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How do you like these dishes?", + "original_text": "How do you like these dishes?", + "start_time": 0, + "end_time": 1.6718367346938776, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fine, they are colorful and", + "original_text": "Fine, they are colorful and [interrupt] full of vibrant flavors that I really appreciate, especially the way the spices complement each other without overpowering the natural taste of the ingredients.", + "start_time": 2.017990032107036, + "end_time": 11.735541052515199, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_1_B.wav", + "silence_duration": 0.34615329741315826, + "is_interrupted": true, + "text_after_interrupt": "full of vibrant flavors that I really appreciate, especially the way the spices complement each other without overpowering the natural taste of the ingredients." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I'm curious—did you find the flavors balanced?", + "original_text": "Sorry to jump in, but I'm curious—did you find the flavors balanced?", + "start_time": 4.154225859771435, + "end_time": 8.867876653422229, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_2_A.wav", + "silence_duration": 0.3349252699923774, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, they are tasty. I really enjoyed the dinner. I have never tasted anything like this.", + "original_text": "Yes, they are tasty. I really enjoyed the dinner. I have never tasted anything like this.", + "start_time": 12.118536287413932, + "end_time": 17.435905901926404, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_3_B.wav", + "silence_duration": 0.3829952348987325, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm glad to hear that! Would you like some more rice?", + "original_text": "I'm glad to hear that! Would you like some more rice?", + "start_time": 17.9163086808865, + "end_time": 21.15549235435589, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_4_A.wav", + "silence_duration": 0.48040277896009753, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, thanks. I'm full.", + "original_text": "No, thanks. I'm full.", + "start_time": 21.48276731083226, + "end_time": 22.899184544392348, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_5_B.wav", + "silence_duration": 0.3272749564763699, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Another piece of meat pie?", + "original_text": "Another piece of meat pie?", + "start_time": 23.396811073562965, + "end_time": 25.09186776290537, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_6_A.wav", + "silence_duration": 0.4976265291706172, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, thanks. I'm on a diet. But I was wondering, what dessert options do you have?", + "original_text": "No, thanks. I'm on a diet. But I was wondering, what dessert options do you have?", + "start_time": 25.534425792712614, + "end_time": 29.60952783352894, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_7_B.wav", + "silence_duration": 0.4425580298072439, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about some ice cream?", + "original_text": "How about some ice cream?", + "start_time": 29.988444464919333, + "end_time": 31.439691630452213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_8_A.wav", + "silence_duration": 0.3789166313903935, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ice cream, please.", + "original_text": "Ice cream, please.", + "start_time": 31.816609214444558, + "end_time": 33.035656833492176, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--58/temp/line_9_B.wav", + "silence_duration": 0.3769175839923449, + "is_interrupted": false + } + ] + }, + "DialogSum--val--59": { + "original_text": "A: This place serves good breakfasts, don't you think? \nB: Yes. But I'm not used to eating American-style breakfast. \nA: What are you planning to do today? \nB: I saw yesterday that they rent windsurfers at the beach. I want to rent one. \nA: Have you done windsurfing before? \nB: No, but it looks fun. I always wanted to [interrupt] try something adventurous like this, especially since we're on vacation and this seems like the perfect opportunity to step out of my comfort zone.\nA: Sorry to jump in, but do you know how challenging windsurfing can be, especially if it's windy today? \nB: I've heard it's tough, but I still want to try it. \nA: Can you take a little advice from a friend? \nB: Sure. What? \nA: Don't waste your money. Windsurfing is very hard. And it will be windy today. They will charge you fifty dollars for a half-hour, and you won't be able to windsurf. You will fall and fall and [interrupt] probably get frustrated before you even get the hang of it, especially since the waves are particularly strong this time of year and the equipment can be quite heavy to maneuver for beginners.\nB: I get that it's difficult, but I'm really curious. Is it really that impossible for a beginner? \nA: It's not impossible, but it takes a long time to learn. You would spend a thousand dollars to learn it on a rental windsurfer. \nB: Well, I will see. How was your day at the office?", + "cleaned_text": "A: This place serves good breakfasts, don't you think? \nB: Yes. But I'm not used to eating American-style breakfast. \nA: What are you planning to do today? \nB: I saw yesterday that they rent windsurfers at the beach. I want to rent one. \nA: Have you done windsurfing before? \nB:No, but it looks fun. I always wanted to try something adventurous like this, especially since we're on vacation and this seems like the perfect opportunity to step out of my comfort zone.\nA: Sorry to jump in, but do you know how challenging windsurfing can be, especially if it's windy today? \nB: I've heard it's tough, but I still want to try it. \nA: Can you take a little advice from a friend? \nB: Sure. What? \nA:Don't waste your money. Windsurfing is very hard. And it will be windy today. They will charge you fifty dollars for a half-hour, and you won't be able to windsurf. You will fall and fall and probably get frustrated before you even get the hang of it, especially since the waves are particularly strong this time of year and the equipment can be quite heavy to maneuver for beginners.\nB: I get that it's difficult, but I'm really curious. Is it really that impossible for a beginner? \nA: It's not impossible, but it takes a long time to learn. You would spend a thousand dollars to learn it on a rental windsurfer. \nB: Well, I will see. How was your day at the office?", + "total_duration": 68.37401360544217, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "This place serves good breakfasts, don't you think?", + "original_text": "This place serves good breakfasts, don't you think?", + "start_time": 0, + "end_time": 2.75156462585034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. But I'm not used to eating American-style breakfast.", + "original_text": "Yes. But I'm not used to eating American-style breakfast.", + "start_time": 3.23789610058021, + "end_time": 6.616399501940754, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_1_B.wav", + "silence_duration": 0.48633147472987015, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What are you planning to do today?", + "original_text": "What are you planning to do today?", + "start_time": 7.022767846828697, + "end_time": 8.880364218710783, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_2_A.wav", + "silence_duration": 0.4063683448879426, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I saw yesterday that they rent windsurfers at the beach. I want to rent one.", + "original_text": "I saw yesterday that they rent windsurfers at the beach. I want to rent one.", + "start_time": 9.331121950013749, + "end_time": 13.359784081533023, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_3_B.wav", + "silence_duration": 0.45075773130296526, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Have you done windsurfing before?", + "original_text": "Have you done windsurfing before?", + "start_time": 13.693231251456544, + "end_time": 15.55082762333863, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_4_A.wav", + "silence_duration": 0.3334471699235195, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, but it looks fun. I always wanted to", + "original_text": "No, but it looks fun. I always wanted to [interrupt] try something adventurous like this, especially since we're on vacation and this seems like the perfect opportunity to step out of my comfort zone.", + "start_time": 15.884206907183428, + "end_time": 25.218628675890912, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_5_B.wav", + "silence_duration": 0.3333792838447978, + "is_interrupted": true, + "text_after_interrupt": "try something adventurous like this, especially since we're on vacation and this seems like the perfect opportunity to step out of my comfort zone." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but do you know how challenging windsurfing can be, especially if it's windy today?", + "original_text": "Sorry to jump in, but do you know how challenging windsurfing can be, especially if it's windy today?", + "start_time": 18.29908219063014, + "end_time": 24.649739787002023, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_6_A.wav", + "silence_duration": 0.5869433687234278, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've heard it's tough, but I still want to try it.", + "original_text": "I've heard it's tough, but I still want to try it.", + "start_time": 25.70537339482274, + "end_time": 28.375668179403238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_7_B.wav", + "silence_duration": 0.48674471893182825, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can you take a little advice from a friend?", + "original_text": "Can you take a little advice from a friend?", + "start_time": 28.84229731570582, + "end_time": 31.036583029991537, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_8_A.wav", + "silence_duration": 0.4666291363025833, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. What?", + "original_text": "Sure. What?", + "start_time": 31.38469332092052, + "end_time": 32.58052098531961, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_9_B.wav", + "silence_duration": 0.34811029092898177, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Don't waste your money. Windsurfing is very hard. And it will be windy today. They will charge you fifty dollars for a half-hour, and you won't be able to windsurf. You will fall and fall and", + "original_text": "Don't waste your money. Windsurfing is very hard. And it will be windy today. They will charge you fifty dollars for a half-hour, and you won't be able to windsurf. You will fall and fall and [interrupt] probably get frustrated before you even get the hang of it, especially since the waves are particularly strong this time of year and the equipment can be quite heavy to maneuver for beginners.", + "start_time": 33.10178663274907, + "end_time": 54.80083425179669, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_10_A.wav", + "silence_duration": 0.5212656474294609, + "is_interrupted": true, + "text_after_interrupt": "probably get frustrated before you even get the hang of it, especially since the waves are particularly strong this time of year and the equipment can be quite heavy to maneuver for beginners." + }, + { + "speaker": "B", + "text": "I get that it's difficult, but I'm really curious. Is it really that impossible for a beginner?", + "original_text": "I get that it's difficult, but I'm really curious. Is it really that impossible for a beginner?", + "start_time": 52.05328463210438, + "end_time": 57.17328463210438, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_11_B.wav", + "silence_duration": 0.3003826373384236, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's not impossible, but it takes a long time to learn. You would spend a thousand dollars to learn it on a rental windsurfer.", + "original_text": "It's not impossible, but it takes a long time to learn. You would spend a thousand dollars to learn it on a rental windsurfer.", + "start_time": 57.748922590487275, + "end_time": 65.06320830477299, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_12_A.wav", + "silence_duration": 0.5756379583829014, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I will see. How was your day at the office?", + "original_text": "Well, I will see. How was your day at the office?", + "start_time": 65.57601009236626, + "end_time": 68.37401462751366, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--59/temp/line_13_B.wav", + "silence_duration": 0.5128017875932772, + "is_interrupted": false + } + ] + }, + "DialogSum--val--60": { + "original_text": "A: Ben, what are you doing? \nB: Well, I would say that I'm just drifting - - here, in the [interrupt] space between what I want to do and what I feel I should do, navigating through this strange limbo where my passions and responsibilities seem to constantly pull me in opposite directions. \nA: Sorry to interrupt, but what do you mean by drifting? Are you feeling lost or just taking a break? \nB: It's more like taking a break. It's very comfortable just to drift here. \nA: Have you thought about graduate school? \nB: No. \nA: Would you mind telling me then, what were those four years of college for? What was the point of all that hard [interrupt] work and dedication if you're not planning to use your degree immediately, especially considering how much time and effort you invested in your education and personal growth during those formative years? \nB: Wait, before you go on, are you asking if I regret going to college? \nA: Not exactly, but I'm curious about what you think all that hard work was for. \nB: You got me.", + "cleaned_text": "A: Ben, what are you doing? \nB:Well, I would say that I'm just drifting - - here, in the space between what I want to do and what I feel I should do, navigating through this strange limbo where my passions and responsibilities seem to constantly pull me in opposite directions.\nA: Sorry to interrupt, but what do you mean by drifting? Are you feeling lost or just taking a break? \nB: It's more like taking a break. It's very comfortable just to drift here. \nA: Have you thought about graduate school? \nB: No. \nA:Would you mind telling me then, what were those four years of college for? What was the point of all that hard work and dedication if you're not planning to use your degree immediately, especially considering how much time and effort you invested in your education and personal growth during those formative years?\nB: Wait, before you go on, are you asking if I regret going to college? \nA: Not exactly, but I'm curious about what you think all that hard work was for. \nB: You got me.", + "total_duration": 46.884126984126986, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Ben, what are you doing?", + "original_text": "Ben, what are you doing?", + "start_time": 0, + "end_time": 1.6137868480725623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I would say that I'm just drifting - - here, in the", + "original_text": "Well, I would say that I'm just drifting - - here, in the [interrupt] space between what I want to do and what I feel I should do, navigating through this strange limbo where my passions and responsibilities seem to constantly pull me in opposite directions.", + "start_time": 1.9526145669113253, + "end_time": 14.642319782330826, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_1_B.wav", + "silence_duration": 0.338827718838763, + "is_interrupted": true, + "text_after_interrupt": "space between what I want to do and what I feel I should do, navigating through this strange limbo where my passions and responsibilities seem to constantly pull me in opposite directions." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but what do you mean by drifting? Are you feeling lost or just taking a break?", + "original_text": "Sorry to interrupt, but what do you mean by drifting? Are you feeling lost or just taking a break?", + "start_time": 5.06408848981382, + "end_time": 11.263816380970283, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_2_A.wav", + "silence_duration": 0.4901207484169546, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's more like taking a break. It's very comfortable just to drift here.", + "original_text": "It's more like taking a break. It's very comfortable just to drift here.", + "start_time": 15.07118979879979, + "end_time": 18.403253290863283, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_3_B.wav", + "silence_duration": 0.42887001646896244, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Have you thought about graduate school?", + "original_text": "Have you thought about graduate school?", + "start_time": 18.76147900117668, + "end_time": 20.595855418410242, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_4_A.wav", + "silence_duration": 0.3582257103133967, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No.", + "original_text": "No.", + "start_time": 21.14337807566134, + "end_time": 21.735486919198753, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_5_B.wav", + "silence_duration": 0.5475226572510971, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Would you mind telling me then, what were those four years of college for? What was the point of all that hard", + "original_text": "Would you mind telling me then, what were those four years of college for? What was the point of all that hard [interrupt] work and dedication if you're not planning to use your degree immediately, especially considering how much time and effort you invested in your education and personal growth during those formative years?", + "start_time": 22.170058100824665, + "end_time": 40.061033157514004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_6_A.wav", + "silence_duration": 0.4345711816259126, + "is_interrupted": true, + "text_after_interrupt": "work and dedication if you're not planning to use your degree immediately, especially considering how much time and effort you invested in your education and personal growth during those formative years?" + }, + { + "speaker": "B", + "text": "Wait, before you go on, are you asking if I regret going to college?", + "original_text": "Wait, before you go on, are you asking if I regret going to college?", + "start_time": 35.276123213301375, + "end_time": 38.875216183822914, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_7_B.wav", + "silence_duration": 0.5594902988314634, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not exactly, but I'm curious about what you think all that hard work was for.", + "original_text": "Not exactly, but I'm curious about what you think all that hard work was for.", + "start_time": 40.592261355036094, + "end_time": 45.630991513766254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_8_A.wav", + "silence_duration": 0.5312281975220909, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You got me.", + "original_text": "You got me.", + "start_time": 46.18756110816628, + "end_time": 46.88415974762206, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--60/temp/line_9_B.wav", + "silence_duration": 0.5565695944000246, + "is_interrupted": false + } + ] + }, + "DialogSum--val--61": { + "original_text": "A: The stepmother was very wicked. She couldn't stand a happy smile on the boy's [interrupt] face because it reminded her of everything she lacked in her own miserable life. Every time she saw it, her jealousy grew stronger and more unbearable. \nB: Wait, why was she so upset with him? Did something specific happen between them? \nA: Not really, it was just her nature to be cruel. She did her best to pull out the thorn in her flesh and the boy lost whatever made him [interrupt] smile, including his beloved toys, his friendships, and even the small joys of daily life that most children take for granted. His laughter faded away, and he became a shadow of his former self. \nB: Oh no, that's heartbreaking. What exactly did she do to make him lose his happiness? \nA: She took away everything he loved, leaving him with nothing but sadness. Poor child! \nB: Indeed, it's tragic how some people can be so heartless.", + "cleaned_text": "A:The stepmother was very wicked. She couldn't stand a happy smile on the boy's face because it reminded her of everything she lacked in her own miserable life. Every time she saw it, her jealousy grew stronger and more unbearable.\nB: Wait, why was she so upset with him? Did something specific happen between them? \nA:Not really, it was just her nature to be cruel. She did her best to pull out the thorn in her flesh and the boy lost whatever made him smile, including his beloved toys, his friendships, and even the small joys of daily life that most children take for granted. His laughter faded away, and he became a shadow of his former self.\nB: Oh no, that's heartbreaking. What exactly did she do to make him lose his happiness? \nA: She took away everything he loved, leaving him with nothing but sadness. Poor child! \nB: Indeed, it's tragic how some people can be so heartless.", + "total_duration": 43.92285714285714, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The stepmother was very wicked. She couldn't stand a happy smile on the boy's", + "original_text": "The stepmother was very wicked. She couldn't stand a happy smile on the boy's [interrupt] face because it reminded her of everything she lacked in her own miserable life. Every time she saw it, her jealousy grew stronger and more unbearable.", + "start_time": 0, + "end_time": 13.572063492063492, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "face because it reminded her of everything she lacked in her own miserable life. Every time she saw it, her jealousy grew stronger and more unbearable." + }, + { + "speaker": "B", + "text": "Wait, why was she so upset with him? Did something specific happen between them?", + "original_text": "Wait, why was she so upset with him? Did something specific happen between them?", + "start_time": 4.911020408163266, + "end_time": 9.58984126984127, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/temp/line_1_B.wav", + "silence_duration": 0.5800864958093811, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not really, it was just her nature to be cruel. She did her best to pull out the thorn in her flesh and the boy lost whatever made him", + "original_text": "Not really, it was just her nature to be cruel. She did her best to pull out the thorn in her flesh and the boy lost whatever made him [interrupt] smile, including his beloved toys, his friendships, and even the small joys of daily life that most children take for granted. His laughter faded away, and he became a shadow of his former self.", + "start_time": 13.93021515770831, + "end_time": 34.70046459081489, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/temp/line_2_A.wav", + "silence_duration": 0.35815166564481793, + "is_interrupted": true, + "text_after_interrupt": "smile, including his beloved toys, his friendships, and even the small joys of daily life that most children take for granted. His laughter faded away, and he became a shadow of his former self." + }, + { + "speaker": "B", + "text": "Oh no, that's heartbreaking. What exactly did she do to make him lose his happiness?", + "original_text": "Oh no, that's heartbreaking. What exactly did she do to make him lose his happiness?", + "start_time": 27.311456341189633, + "end_time": 31.42138831397875, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/temp/line_3_B.wav", + "silence_duration": 0.4671848831069819, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "She took away everything he loved, leaving him with nothing but sadness. Poor child!", + "original_text": "She took away everything he loved, leaving him with nothing but sadness. Poor child!", + "start_time": 35.248910024068216, + "end_time": 40.50822975195938, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/temp/line_4_A.wav", + "silence_duration": 0.5484454332533246, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Indeed, it's tragic how some people can be so heartless.", + "original_text": "Indeed, it's tragic how some people can be so heartless.", + "start_time": 40.8230223078955, + "end_time": 43.92288625347373, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--61/temp/line_5_B.wav", + "silence_duration": 0.3147925559361226, + "is_interrupted": false + } + ] + }, + "DialogSum--val--63": { + "original_text": "A: I'm not sure, is this our stop? \nB: Yeah, get off the bus. \nA: Do you have any idea where we [interrupt] were supposed to get off? I think we might've missed it because the landmarks don't match what I remember from the directions. \nB: Sorry, I just realized, do you think we got off too early? \nA: I was about to say, I'm really not sure where we are. This can't be the right stop. \nB: I don't think this is right. \nA: We got off too early, didn't we? \nB: Yeah, we did get off too early. \nA: I should've just stayed on the bus. \nB: I messed up. \nA: Great, we have to walk now. \nB: You want to wait for the next bus?", + "cleaned_text": "A: I'm not sure, is this our stop? \nB: Yeah, get off the bus. \nA:Do you have any idea where we were supposed to get off? I think we might've missed it because the landmarks don't match what I remember from the directions.\nB: Sorry, I just realized, do you think we got off too early? \nA: I was about to say, I'm really not sure where we are. This can't be the right stop. \nB: I don't think this is right. \nA: We got off too early, didn't we? \nB: Yeah, we did get off too early. \nA: I should've just stayed on the bus. \nB: I messed up. \nA: Great, we have to walk now. \nB: You want to wait for the next bus?", + "total_duration": 32.34031746031746, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm not sure, is this our stop?", + "original_text": "I'm not sure, is this our stop?", + "start_time": 0, + "end_time": 2.0317460317460316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, get off the bus.", + "original_text": "Yeah, get off the bus.", + "start_time": 2.458007035911708, + "end_time": 3.932474156093114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_1_B.wav", + "silence_duration": 0.42626100416567647, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you have any idea where we", + "original_text": "Do you have any idea where we [interrupt] were supposed to get off? I think we might've missed it because the landmarks don't match what I remember from the directions.", + "start_time": 4.237242500619633, + "end_time": 12.549986264791968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_2_A.wav", + "silence_duration": 0.30476834452651946, + "is_interrupted": true, + "text_after_interrupt": "were supposed to get off? I think we might've missed it because the landmarks don't match what I remember from the directions." + }, + { + "speaker": "B", + "text": "Sorry, I just realized, do you think we got off too early?", + "original_text": "Sorry, I just realized, do you think we got off too early?", + "start_time": 6.234158600392876, + "end_time": 8.985723226243216, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_3_B.wav", + "silence_duration": 0.4155033686189933, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was about to say, I'm really not sure where we are. This can't be the right stop.", + "original_text": "I was about to say, I'm really not sure where we are. This can't be the right stop.", + "start_time": 13.087744822823515, + "end_time": 18.38189448268746, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_4_A.wav", + "silence_duration": 0.5377585580315459, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't think this is right.", + "original_text": "I don't think this is right.", + "start_time": 18.972259955118947, + "end_time": 20.33062730205772, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_5_B.wav", + "silence_duration": 0.5903654724314856, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We got off too early, didn't we?", + "original_text": "We got off too early, didn't we?", + "start_time": 20.841880204039512, + "end_time": 22.676256621273073, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_6_A.wav", + "silence_duration": 0.5112529019817925, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, we did get off too early.", + "original_text": "Yeah, we did get off too early.", + "start_time": 22.989832331031103, + "end_time": 24.603619179103664, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_7_B.wav", + "silence_duration": 0.31357570975802945, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I should've just stayed on the bus.", + "original_text": "I should've just stayed on the bus.", + "start_time": 25.05842508866983, + "end_time": 27.00890127914602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_8_A.wav", + "silence_duration": 0.4548059095661646, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I messed up.", + "original_text": "I messed up.", + "start_time": 27.3824165551293, + "end_time": 28.195114967827713, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_9_B.wav", + "silence_duration": 0.37351527598328116, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Great, we have to walk now.", + "original_text": "Great, we have to walk now.", + "start_time": 28.743589681898296, + "end_time": 30.4386463712407, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_10_A.wav", + "silence_duration": 0.5484747140705823, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You want to wait for the next bus?", + "original_text": "You want to wait for the next bus?", + "start_time": 30.865884330614477, + "end_time": 32.340351450795886, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--63/temp/line_11_B.wav", + "silence_duration": 0.4272379593737761, + "is_interrupted": false + } + ] + }, + "DialogSum--val--64": { + "original_text": "A: You can use a Type A Agreement Savings Account the same way as a Settlement [interrupt] account, which means you have easy access to your funds and can make unlimited transactions without worrying about monthly maintenance fees or minimum balance requirements.\nB: Sorry, I just want to make sure, is there any penalty for early withdrawal?\nA: No penalty, but I haven't explained the differences between Type A and Type B Accounts yet. You asked earlier about Type B, right?\nB: Oh yes, could you clarify that for me?", + "cleaned_text": "A:You can use a Type A Agreement Savings Account the same way as a Settlement account, which means you have easy access to your funds and can make unlimited transactions without worrying about monthly maintenance fees or minimum balance requirements.\nB: Sorry, I just want to make sure, is there any penalty for early withdrawal?\nA: No penalty, but I haven't explained the differences between Type A and Type B Accounts yet. You asked earlier about Type B, right?\nB: Oh yes, could you clarify that for me?", + "total_duration": 26.51904761904762, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--64/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--64/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--64/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You can use a Type A Agreement Savings Account the same way as a Settlement", + "original_text": "You can use a Type A Agreement Savings Account the same way as a Settlement [interrupt] account, which means you have easy access to your funds and can make unlimited transactions without worrying about monthly maintenance fees or minimum balance requirements.", + "start_time": 0, + "end_time": 15.034920634920635, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--64/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "account, which means you have easy access to your funds and can make unlimited transactions without worrying about monthly maintenance fees or minimum balance requirements." + }, + { + "speaker": "B", + "text": "Sorry, I just want to make sure, is there any penalty for early withdrawal?", + "original_text": "Sorry, I just want to make sure, is there any penalty for early withdrawal?", + "start_time": 4.249251700680272, + "end_time": 8.02249433106576, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--64/temp/line_1_B.wav", + "silence_duration": 0.5491902299507203, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No penalty, but I haven't explained the differences between Type A and Type B Accounts yet. You asked earlier about Type B, right?", + "original_text": "No penalty, but I haven't explained the differences between Type A and Type B Accounts yet. You asked earlier about Type B, right?", + "start_time": 15.626148062216858, + "end_time": 23.96211178103772, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--64/temp/line_2_A.wav", + "silence_duration": 0.5912274272962235, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh yes, could you clarify that for me?", + "original_text": "Oh yes, could you clarify that for me?", + "start_time": 24.289936660540473, + "end_time": 26.519052306798976, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--64/temp/line_3_B.wav", + "silence_duration": 0.32782487950275435, + "is_interrupted": false + } + ] + }, + "DialogSum--val--65": { + "original_text": "A: To which gate do I need to go to catch connecting flight 101 to New York City? \nB: Go to gate 18. The plane is now boarding. You must hurry if you want to make it on time since they typically close the doors [interrupt] about 15 minutes before departure and this flight is known for being quite strict about their boarding procedures. \nA: Sorry to interrupt, but can you show me the fastest way to get there? \nB: Instead of walking, you can take this shuttle to get you there faster. \nA: Do you think the plane will leave without me? \nB: No, I'll call the attendants at the gate. I will tell them you're on your way, so they can be prepared. \nA: Oh, thank you so much. I would really appreciate that. By the way, you were about to say something about the attendants? \nB: Yes, I was saying I'll tell them you're on your way so they can hold the plane for a few minutes if needed. \nA: You are welcome. Have a safe trip.", + "cleaned_text": "A: To which gate do I need to go to catch connecting flight 101 to New York City? \nB:Go to gate 18. The plane is now boarding. You must hurry if you want to make it on time since they typically close the doors about 15 minutes before departure and this flight is known for being quite strict about their boarding procedures.\nA: Sorry to interrupt, but can you show me the fastest way to get there? \nB: Instead of walking, you can take this shuttle to get you there faster. \nA: Do you think the plane will leave without me? \nB: No, I'll call the attendants at the gate. I will tell them you're on your way, so they can be prepared. \nA: Oh, thank you so much. I would really appreciate that. By the way, you were about to say something about the attendants? \nB: Yes, I was saying I'll tell them you're on your way so they can hold the plane for a few minutes if needed. \nA: You are welcome. Have a safe trip.", + "total_duration": 45.55877551020408, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "To which gate do I need to go to catch connecting flight 101 to New York City?", + "original_text": "To which gate do I need to go to catch connecting flight 101 to New York City?", + "start_time": 0, + "end_time": 5.154829931972789, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Go to gate 18. The plane is now boarding. You must hurry if you want to make it on time since they typically close the doors", + "original_text": "Go to gate 18. The plane is now boarding. You must hurry if you want to make it on time since they typically close the doors [interrupt] about 15 minutes before departure and this flight is known for being quite strict about their boarding procedures.", + "start_time": 5.680140788647562, + "end_time": 17.893836933772278, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_1_B.wav", + "silence_duration": 0.5253108566747731, + "is_interrupted": true, + "text_after_interrupt": "about 15 minutes before departure and this flight is known for being quite strict about their boarding procedures." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but can you show me the fastest way to get there?", + "original_text": "Sorry to interrupt, but can you show me the fastest way to get there?", + "start_time": 11.879868679804025, + "end_time": 16.036240561890192, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_2_A.wav", + "silence_duration": 0.40704490644186797, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Instead of walking, you can take this shuttle to get you there faster.", + "original_text": "Instead of walking, you can take this shuttle to get you there faster.", + "start_time": 18.325377999372705, + "end_time": 21.460071876923724, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_3_B.wav", + "silence_duration": 0.43154106560042704, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you think the plane will leave without me?", + "original_text": "Do you think the plane will leave without me?", + "start_time": 21.87902568281416, + "end_time": 23.957211623857244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_4_A.wav", + "silence_duration": 0.4189538058904364, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, I'll call the attendants at the gate. I will tell them you're on your way, so they can be prepared.", + "original_text": "No, I'll call the attendants at the gate. I will tell them you're on your way, so they can be prepared.", + "start_time": 24.55666388500978, + "end_time": 30.17589290995309, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_5_B.wav", + "silence_duration": 0.599452261152535, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, thank you so much. I would really appreciate that. By the way, you were about to say something about the attendants?", + "original_text": "Oh, thank you so much. I would really appreciate that. By the way, you were about to say something about the attendants?", + "start_time": 30.644527465209674, + "end_time": 37.59890388244323, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_6_A.wav", + "silence_duration": 0.4686345552565802, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I was saying I'll tell them you're on your way so they can hold the plane for a few minutes if needed.", + "original_text": "Yes, I was saying I'll tell them you're on your way so they can hold the plane for a few minutes if needed.", + "start_time": 38.11409845814752, + "end_time": 43.303758322093096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_7_B.wav", + "silence_duration": 0.5151945757042824, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You are welcome. Have a safe trip.", + "original_text": "You are welcome. Have a safe trip.", + "start_time": 43.7244203648493, + "end_time": 45.55879678208286, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--65/temp/line_8_A.wav", + "silence_duration": 0.4206620427562039, + "is_interrupted": false + } + ] + }, + "DialogSum--val--66": { + "original_text": "A: Uh. . . that's Greek to me. \nB: That means they have tapered [interrupt] legs, which get narrower towards the bottom and create a more tailored silhouette compared to straight-cut pants, though the exact degree of tapering can vary between styles. \nA: Tapered? Like, skinny jeans? \nB: Well, mine are baggy. They're the kind of pants you can lounge around in. \nA: Oh, got it. But I was going to ask—what did you mean by \"tapered\"? Is it just the legs? \nB: Yeah, just the legs. Mine are, too. \nA: So maybe we should go out after all. \nB: Yeah. Let's just lounge around!", + "cleaned_text": "A: Uh. . . that's Greek to me. \nB:That means they have tapered legs, which get narrower towards the bottom and create a more tailored silhouette compared to straight-cut pants, though the exact degree of tapering can vary between styles.\nA: Tapered? Like, skinny jeans? \nB: Well, mine are baggy. They're the kind of pants you can lounge around in. \nA: Oh, got it. But I was going to ask—what did you mean by \"tapered\"? Is it just the legs? \nB: Yeah, just the legs. Mine are, too. \nA: So maybe we should go out after all. \nB: Yeah. Let's just lounge around!", + "total_duration": 32.4162358276644, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Uh. . . that's Greek to me.", + "original_text": "Uh. . . that's Greek to me.", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That means they have tapered", + "original_text": "That means they have tapered [interrupt] legs, which get narrower towards the bottom and create a more tailored silhouette compared to straight-cut pants, though the exact degree of tapering can vary between styles.", + "start_time": 2.9263774566506617, + "end_time": 13.375357048487395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_1_B.wav", + "silence_duration": 0.3373525133400037, + "is_interrupted": true, + "text_after_interrupt": "legs, which get narrower towards the bottom and create a more tailored silhouette compared to straight-cut pants, though the exact degree of tapering can vary between styles." + }, + { + "speaker": "A", + "text": "Tapered? Like, skinny jeans?", + "original_text": "Tapered? Like, skinny jeans?", + "start_time": 4.296354780913701, + "end_time": 6.212001039417102, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_2_A.wav", + "silence_duration": 0.316589523156704, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, mine are baggy. They're the kind of pants you can lounge around in.", + "original_text": "Well, mine are baggy. They're the kind of pants you can lounge around in.", + "start_time": 13.962520632447808, + "end_time": 17.57322358029361, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_3_B.wav", + "silence_duration": 0.5871635839604136, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, got it. But I was going to ask—what did you mean by \"tapered\"? Is it just the legs?", + "original_text": "Oh, got it. But I was going to ask—what did you mean by \"tapered\"? Is it just the legs?", + "start_time": 18.110727549970566, + "end_time": 24.449775169018185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_4_A.wav", + "silence_duration": 0.537503969676954, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, just the legs. Mine are, too.", + "original_text": "Yeah, just the legs. Mine are, too.", + "start_time": 24.76116187511, + "end_time": 27.292136931799345, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_5_B.wav", + "silence_duration": 0.31138670609181723, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So maybe we should go out after all.", + "original_text": "So maybe we should go out after all.", + "start_time": 27.604641889126732, + "end_time": 29.880197444682288, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_6_A.wav", + "silence_duration": 0.3125049573273885, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah. Let's just lounge around!", + "original_text": "Yeah. Let's just lounge around!", + "start_time": 30.245198512651214, + "end_time": 32.4162642722884, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--66/temp/line_7_B.wav", + "silence_duration": 0.365001067968925, + "is_interrupted": false + } + ] + }, + "DialogSum--val--67": { + "original_text": "A: Excuse me, madam. Is this seat taken? \nB: No. \nA: Do you mind my sharing the same table with [interrupt] you if it's not too much trouble? I noticed all the other tables are occupied and I'd really appreciate having somewhere to sit while I wait for my friend to arrive. \nB: Sorry to interrupt, but I was just wondering—do you know if there's a special event happening today? It's unusually crowded. \nA: Of course not. There are so many people here today. Actually, I was about to ask if you had any idea why it's so busy. I heard there might be a celebrity appearance or perhaps a big sale happening nearby that's drawing all these crowds.", + "cleaned_text": "A: Excuse me, madam. Is this seat taken? \nB: No. \nA:Do you mind my sharing the same table with you if it's not too much trouble? I noticed all the other tables are occupied and I'd really appreciate having somewhere to sit while I wait for my friend to arrive.\nB: Sorry to interrupt, but I was just wondering—do you know if there's a special event happening today? It's unusually crowded. \nA: Of course not. There are so many people here today. Actually, I was about to ask if you had any idea why it's so busy. I heard there might be a celebrity appearance or perhaps a big sale happening nearby that's drawing all these crowds.", + "total_duration": 30.60934240362812, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, madam. Is this seat taken?", + "original_text": "Excuse me, madam. Is this seat taken?", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No.", + "original_text": "No.", + "start_time": 2.997935583499741, + "end_time": 3.5552144950643667, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/temp/line_1_B.wav", + "silence_duration": 0.4089106401890831, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you mind my sharing the same table with", + "original_text": "Do you mind my sharing the same table with [interrupt] you if it's not too much trouble? I noticed all the other tables are occupied and I'd really appreciate having somewhere to sit while I wait for my friend to arrive.", + "start_time": 4.1056199007897165, + "end_time": 15.796867066322598, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/temp/line_2_A.wav", + "silence_duration": 0.55040540572535, + "is_interrupted": true, + "text_after_interrupt": "you if it's not too much trouble? I noticed all the other tables are occupied and I'd really appreciate having somewhere to sit while I wait for my friend to arrive." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I was just wondering—do you know if there's a special event happening today? It's unusually crowded.", + "original_text": "Sorry to interrupt, but I was just wondering—do you know if there's a special event happening today? It's unusually crowded.", + "start_time": 6.474055274939376, + "end_time": 13.811560943873616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/temp/line_3_B.wav", + "silence_duration": 0.4538538966962644, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Of course not. There are so many people here today. Actually, I was about to ask if you had any idea why it's so busy. I heard there might be a celebrity appearance or perhaps a big sale happening nearby that's drawing all these crowds.", + "original_text": "Of course not. There are so many people here today. Actually, I was about to ask if you had any idea why it's so busy. I heard there might be a celebrity appearance or perhaps a big sale happening nearby that's drawing all these crowds.", + "start_time": 16.18977817933533, + "end_time": 30.609370016070024, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--67/temp/line_4_A.wav", + "silence_duration": 0.3929111130127346, + "is_interrupted": false + } + ] + }, + "DialogSum--val--68": { + "original_text": "A: Wangfujing Grand Hotels. How can I help you? \nB: Do you have any rooms available next Saturday and Sunday night? \nA: Could you hold the line, please? I will check out our room availability for those days. . . Yes, we have a few vacancies next weekend. We have double rooms, suites, and deluxe suites in Japanese, Roman, French, and presidential styles, which one do you [interrupt] prefer? Our Japanese-style rooms feature traditional tatami mats and minimalist decor, while the Roman-style offers luxurious marble baths and classical European furnishings. \nB: Sorry to jump in, but could you also tell me if the double room has a good view? That's quite important to me. \nA: Absolutely, Ms. Monica. The double rooms have a great view of the city skyline. Oh, and I was about to ask which style you prefer for the room—Japanese, Roman, French, or presidential? \nB: A double room in a French style would be perfect. \nA: OK. Could I have your name, please? \nB: My name is Monica Cellar. \nA: OK, Ms. Monica. I've reserved a double room in the French style for you next Saturday and Sunday night. We will see you then! \nB: Thank you.", + "cleaned_text": "A: Wangfujing Grand Hotels. How can I help you? \nB: Do you have any rooms available next Saturday and Sunday night? \nA:Could you hold the line, please? I will check out our room availability for those days. . . Yes, we have a few vacancies next weekend. We have double rooms, suites, and deluxe suites in Japanese, Roman, French, and presidential styles, which one do you prefer? Our Japanese-style rooms feature traditional tatami mats and minimalist decor, while the Roman-style offers luxurious marble baths and classical European furnishings.\nB: Sorry to jump in, but could you also tell me if the double room has a good view? That's quite important to me. \nA: Absolutely, Ms. Monica. The double rooms have a great view of the city skyline. Oh, and I was about to ask which style you prefer for the room—Japanese, Roman, French, or presidential? \nB: A double room in a French style would be perfect. \nA: OK. Could I have your name, please? \nB: My name is Monica Cellar. \nA: OK, Ms. Monica. I've reserved a double room in the French style for you next Saturday and Sunday night. We will see you then! \nB: Thank you.", + "total_duration": 63.1421768707483, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Wangfujing Grand Hotels. How can I help you?", + "original_text": "Wangfujing Grand Hotels. How can I help you?", + "start_time": 0, + "end_time": 3.01859410430839, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you have any rooms available next Saturday and Sunday night?", + "original_text": "Do you have any rooms available next Saturday and Sunday night?", + "start_time": 3.3292407213062347, + "end_time": 6.13885523377789, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_1_B.wav", + "silence_duration": 0.3106466169978445, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Could you hold the line, please? I will check out our room availability for those days. . . Yes, we have a few vacancies next weekend. We have double rooms, suites, and deluxe suites in Japanese, Roman, French, and presidential styles, which one do you", + "original_text": "Could you hold the line, please? I will check out our room availability for those days. . . Yes, we have a few vacancies next weekend. We have double rooms, suites, and deluxe suites in Japanese, Roman, French, and presidential styles, which one do you [interrupt] prefer? Our Japanese-style rooms feature traditional tatami mats and minimalist decor, while the Roman-style offers luxurious marble baths and classical European furnishings.", + "start_time": 6.495584698224759, + "end_time": 33.535221886433376, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_2_A.wav", + "silence_duration": 0.35672946444686926, + "is_interrupted": true, + "text_after_interrupt": "prefer? Our Japanese-style rooms feature traditional tatami mats and minimalist decor, while the Roman-style offers luxurious marble baths and classical European furnishings." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but could you also tell me if the double room has a good view? That's quite important to me.", + "original_text": "Sorry to jump in, but could you also tell me if the double room has a good view? That's quite important to me.", + "start_time": 21.867194675549023, + "end_time": 27.32388401795265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_3_B.wav", + "silence_duration": 0.44020554121705524, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely, Ms. Monica. The double rooms have a great view of the city skyline. Oh, and I was about to ask which style you prefer for the room—Japanese, Roman, French, or presidential?", + "original_text": "Absolutely, Ms. Monica. The double rooms have a great view of the city skyline. Oh, and I was about to ask which style you prefer for the room—Japanese, Roman, French, or presidential?", + "start_time": 33.839483188740566, + "end_time": 46.029959379216756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_4_A.wav", + "silence_duration": 0.3042613023071889, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "A double room in a French style would be perfect.", + "original_text": "A double room in a French style would be perfect.", + "start_time": 46.52863231266029, + "end_time": 48.86223775483716, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_5_B.wav", + "silence_duration": 0.4986729334435347, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. Could I have your name, please?", + "original_text": "OK. Could I have your name, please?", + "start_time": 49.17643636737001, + "end_time": 51.92800099322035, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_6_A.wav", + "silence_duration": 0.3141986125328507, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My name is Monica Cellar.", + "original_text": "My name is Monica Cellar.", + "start_time": 52.320260956951266, + "end_time": 53.75989814515988, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_7_B.wav", + "silence_duration": 0.3922599637309142, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, Ms. Monica. I've reserved a double room in the French style for you next Saturday and Sunday night. We will see you then!", + "original_text": "OK, Ms. Monica. I've reserved a double room in the French style for you next Saturday and Sunday night. We will see you then!", + "start_time": 54.20438570354685, + "end_time": 61.994680488127344, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_8_A.wav", + "silence_duration": 0.4444875583869652, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you.", + "original_text": "Thank you.", + "start_time": 62.584910197061255, + "end_time": 63.14218910862588, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--68/temp/line_9_B.wav", + "silence_duration": 0.5902297089339121, + "is_interrupted": false + } + ] + }, + "DialogSum--val--69": { + "original_text": "A: We can offer you a 5% discount. \nB: Your price is rather out of line, much higher than we expected. We can't buy with your offer. \nA: Well, what do you suggest then? How about 8%? \nB: When we say your prices are much too high, we don't mean they are higher only by 2 or 3 percent. If we are to place an order with you, I think a discount of about 15% would be [interrupt] enough to make it a feasible option for us given the current market conditions and the volume of business we're proposing to bring to your company. \nA: 15%? What? You want to drive me bankrupt! You can't expect us to make such a large reduction. \nB: There's no point in making a counter offer because the gap is too great. \nA: How about 10%? This price is already a little tight, our profit margin is not that large. \nB: Ok. I can settle for that. But just to clarify, I was saying earlier that 15% would be sufficient if we were to place an order with you.", + "cleaned_text": "A: We can offer you a 5% discount. \nB: Your price is rather out of line, much higher than we expected. We can't buy with your offer. \nA: Well, what do you suggest then? How about 8%? \nB:When we say your prices are much too high, we don't mean they are higher only by 2 or 3 percent. If we are to place an order with you, I think a discount of about 15% would be enough to make it a feasible option for us given the current market conditions and the volume of business we're proposing to bring to your company.\nA: 15%? What? You want to drive me bankrupt! You can't expect us to make such a large reduction. \nB: There's no point in making a counter offer because the gap is too great. \nA: How about 10%? This price is already a little tight, our profit margin is not that large. \nB: Ok. I can settle for that. But just to clarify, I was saying earlier that 15% would be sufficient if we were to place an order with you.", + "total_duration": 49.83283446712018, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "We can offer you a 5% discount.", + "original_text": "We can offer you a 5% discount.", + "start_time": 0, + "end_time": 2.6586848072562357, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Your price is rather out of line, much higher than we expected. We can't buy with your offer.", + "original_text": "Your price is rather out of line, much higher than we expected. We can't buy with your offer.", + "start_time": 2.9860187764840607, + "end_time": 7.421030114352542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_1_B.wav", + "silence_duration": 0.32733396922782476, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, what do you suggest then? How about 8%?", + "original_text": "Well, what do you suggest then? How about 8%?", + "start_time": 7.7968134821234525, + "end_time": 11.825475613642727, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_2_A.wav", + "silence_duration": 0.37578336777091115, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "When we say your prices are much too high, we don't mean they are higher only by 2 or 3 percent. If we are to place an order with you, I think a discount of about 15% would be", + "original_text": "When we say your prices are much too high, we don't mean they are higher only by 2 or 3 percent. If we are to place an order with you, I think a discount of about 15% would be [interrupt] enough to make it a feasible option for us given the current market conditions and the volume of business we're proposing to bring to your company.", + "start_time": 12.3285162409497, + "end_time": 29.000443678591424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_3_B.wav", + "silence_duration": 0.5030406273069721, + "is_interrupted": true, + "text_after_interrupt": "enough to make it a feasible option for us given the current market conditions and the volume of business we're proposing to bring to your company." + }, + { + "speaker": "A", + "text": "15%? What? You want to drive me bankrupt! You can't expect us to make such a large reduction.", + "original_text": "15%? What? You want to drive me bankrupt! You can't expect us to make such a large reduction.", + "start_time": 22.68461601419233, + "end_time": 29.75509220466852, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_4_A.wav", + "silence_duration": 0.5712102678983186, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There's no point in making a counter offer because the gap is too great.", + "original_text": "There's no point in making a counter offer because the gap is too great.", + "start_time": 30.26315045080903, + "end_time": 34.09444296781583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_5_B.wav", + "silence_duration": 0.5080582461405079, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about 10%? This price is already a little tight, our profit margin is not that large.", + "original_text": "How about 10%? This price is already a little tight, our profit margin is not that large.", + "start_time": 34.68645644084727, + "end_time": 41.39702333427131, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_6_A.wav", + "silence_duration": 0.5920134730314435, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ok. I can settle for that. But just to clarify, I was saying earlier that 15% would be sufficient if we were to place an order with you.", + "original_text": "Ok. I can settle for that. But just to clarify, I was saying earlier that 15% would be sufficient if we were to place an order with you.", + "start_time": 41.91486282078602, + "end_time": 49.83286735593341, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--69/temp/line_7_B.wav", + "silence_duration": 0.5178394865147101, + "is_interrupted": false + } + ] + }, + "DialogSum--val--70": { + "original_text": "A: You are seemingly upset. What's behind you?\nB: Arden wants to have a trademark for our new series of products registered. But I have no idea on the registering [interrupt] process, and I'm worried about making mistakes that could delay everything, especially since we're on a tight deadline to launch these products in the market.\nA: Sorry to jump in, but are you worried about the legal aspects or just the process itself?\nB: Mostly the process itself. I've never experienced this. Can you tell me something about it?\nA: It is known that there is a time limit for trademarks. And we should not have a similar trademark with the one in the same field [interrupt] to avoid any potential legal conflicts or rejections, which could significantly impact our brand reputation and marketing timeline for these new products.\nB: Based on what you said, does it mean that we can not have a trademark like 'genova', right?\nA: Correct. And our country follows the priority of use principle.\nB: That makes sense. By the way, earlier you mentioned the registering process but didn't finish. Could you tell me more about the preparation for the register?", + "cleaned_text": "A: You are seemingly upset. What's behind you?\nB:Arden wants to have a trademark for our new series of products registered. But I have no idea on the registering process, and I'm worried about making mistakes that could delay everything, especially since we're on a tight deadline to launch these products in the market.\nA: Sorry to jump in, but are you worried about the legal aspects or just the process itself?\nB: Mostly the process itself. I've never experienced this. Can you tell me something about it?\nA:It is known that there is a time limit for trademarks. And we should not have a similar trademark with the one in the same field to avoid any potential legal conflicts or rejections, which could significantly impact our brand reputation and marketing timeline for these new products.\nB: Based on what you said, does it mean that we can not have a trademark like 'genova', right?\nA: Correct. And our country follows the priority of use principle.\nB: That makes sense. By the way, earlier you mentioned the registering process but didn't finish. Could you tell me more about the preparation for the register?", + "total_duration": 52.91519274376417, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You are seemingly upset. What's behind you?", + "original_text": "You are seemingly upset. What's behind you?", + "start_time": 0, + "end_time": 3.378503401360544, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Arden wants to have a trademark for our new series of products registered. But I have no idea on the registering", + "original_text": "Arden wants to have a trademark for our new series of products registered. But I have no idea on the registering [interrupt] process, and I'm worried about making mistakes that could delay everything, especially since we're on a tight deadline to launch these products in the market.", + "start_time": 3.7248107461938664, + "end_time": 16.87891505458389, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_1_B.wav", + "silence_duration": 0.3463073448333221, + "is_interrupted": true, + "text_after_interrupt": "process, and I'm worried about making mistakes that could delay everything, especially since we're on a tight deadline to launch these products in the market." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but are you worried about the legal aspects or just the process itself?", + "original_text": "Sorry to jump in, but are you worried about the legal aspects or just the process itself?", + "start_time": 9.483359499028333, + "end_time": 15.079368569323119, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_2_A.wav", + "silence_duration": 0.5553010313508651, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Mostly the process itself. I've never experienced this. Can you tell me something about it?", + "original_text": "Mostly the process itself. I've never experienced this. Can you tell me something about it?", + "start_time": 17.39298439146802, + "end_time": 22.12985513976734, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_3_B.wav", + "silence_duration": 0.5140693368841323, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It is known that there is a time limit for trademarks. And we should not have a similar trademark with the one in the same field", + "original_text": "It is known that there is a time limit for trademarks. And we should not have a similar trademark with the one in the same field [interrupt] to avoid any potential legal conflicts or rejections, which could significantly impact our brand reputation and marketing timeline for these new products.", + "start_time": 22.597281646261614, + "end_time": 39.071839469390866, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_4_A.wav", + "silence_duration": 0.46742650649427275, + "is_interrupted": true, + "text_after_interrupt": "to avoid any potential legal conflicts or rejections, which could significantly impact our brand reputation and marketing timeline for these new products." + }, + { + "speaker": "B", + "text": "Based on what you said, does it mean that we can not have a trademark like 'genova', right?", + "original_text": "Based on what you said, does it mean that we can not have a trademark like 'genova', right?", + "start_time": 35.45970253594722, + "end_time": 40.25462317086786, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_5_B.wav", + "silence_duration": 0.5868322091622828, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Correct. And our country follows the priority of use principle.", + "original_text": "Correct. And our country follows the priority of use principle.", + "start_time": 40.84363405469698, + "end_time": 44.89551614086478, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_6_A.wav", + "silence_duration": 0.5890108838291201, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That makes sense. By the way, earlier you mentioned the registering process but didn't finish. Could you tell me more about the preparation for the register?", + "original_text": "That makes sense. By the way, earlier you mentioned the registering process but didn't finish. Could you tell me more about the preparation for the register?", + "start_time": 45.357120871218434, + "end_time": 52.915216109313675, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--70/temp/line_7_B.wav", + "silence_duration": 0.461604730353658, + "is_interrupted": false + } + ] + }, + "DialogSum--val--71": { + "original_text": "A: Your mp3 looks so cool. Where did you get it? \nB: I bought it online. \nA: Really? Do you often [interrupt] find good deals online or do you have specific websites you rely on for the best discounts and quality products? \nB: Sorry to jump in, but do you trust the quality of the products you buy online? I've heard mixed reviews about that. \nA: Yes, I do, but I make sure to read reviews and check the seller's reputation before purchasing. By the way, I was about to ask if you often shop online? \nB: Oh, yes. I buy most of my daily necessities online. \nA: I've never tried E-shopping. Is it better than shopping at an actual store? \nB: Yes, much better. You can log in to a website, browse through many items and categories comfortably at home, order the goods, pay by credit or debit card, and the goods will be delivered to your home. \nA: Sounds good, and I don't have to queue up at the cashier. \nB: And you can still go 'window shopping' just like in a real shopping mall. \nA: Well, are there any other advantages? \nB: Yes, most of the shops are closed at 22 or even earlier, but the internet operates 24 hours a day, seven days a week, and can be accessed anywhere. \nA: Are there many choices of online shopping? \nB: Sure. You can buy almost anything you can think of, and there are often exclusive online discounts.", + "cleaned_text": "A: Your mp3 looks so cool. Where did you get it? \nB: I bought it online. \nA:Really? Do you often find good deals online or do you have specific websites you rely on for the best discounts and quality products?\nB: Sorry to jump in, but do you trust the quality of the products you buy online? I've heard mixed reviews about that. \nA: Yes, I do, but I make sure to read reviews and check the seller's reputation before purchasing. By the way, I was about to ask if you often shop online? \nB: Oh, yes. I buy most of my daily necessities online. \nA: I've never tried E-shopping. Is it better than shopping at an actual store? \nB: Yes, much better. You can log in to a website, browse through many items and categories comfortably at home, order the goods, pay by credit or debit card, and the goods will be delivered to your home. \nA: Sounds good, and I don't have to queue up at the cashier. \nB: And you can still go 'window shopping' just like in a real shopping mall. \nA: Well, are there any other advantages? \nB: Yes, most of the shops are closed at 22 or even earlier, but the internet operates 24 hours a day, seven days a week, and can be accessed anywhere. \nA: Are there many choices of online shopping? \nB: Sure. You can buy almost anything you can think of, and there are often exclusive online discounts.", + "total_duration": 71.45528344671202, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Your mp3 looks so cool. Where did you get it?", + "original_text": "Your mp3 looks so cool. Where did you get it?", + "start_time": 0, + "end_time": 3.030204081632653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I bought it online.", + "original_text": "I bought it online.", + "start_time": 3.47817545386862, + "end_time": 4.592733276997872, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_1_B.wav", + "silence_duration": 0.44797137223596667, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Really? Do you often", + "original_text": "Really? Do you often [interrupt] find good deals online or do you have specific websites you rely on for the best discounts and quality products?", + "start_time": 4.956748783730068, + "end_time": 13.432032230442086, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_2_A.wav", + "silence_duration": 0.3640155067321959, + "is_interrupted": true, + "text_after_interrupt": "find good deals online or do you have specific websites you rely on for the best discounts and quality products?" + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you trust the quality of the products you buy online? I've heard mixed reviews about that.", + "original_text": "Sorry to jump in, but do you trust the quality of the products you buy online? I've heard mixed reviews about that.", + "start_time": 6.57053563180263, + "end_time": 12.619333817743673, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_3_B.wav", + "silence_duration": 0.4861804258104984, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I do, but I make sure to read reviews and check the seller's reputation before purchasing. By the way, I was about to ask if you often shop online?", + "original_text": "Yes, I do, but I make sure to read reviews and check the seller's reputation before purchasing. By the way, I was about to ask if you often shop online?", + "start_time": 13.982343210223709, + "end_time": 23.897263845144344, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_4_A.wav", + "silence_duration": 0.5503109797816222, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, yes. I buy most of my daily necessities online.", + "original_text": "Oh, yes. I buy most of my daily necessities online.", + "start_time": 24.200206372730925, + "end_time": 27.23041045436358, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_5_B.wav", + "silence_duration": 0.30294252758658125, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I've never tried E-shopping. Is it better than shopping at an actual store?", + "original_text": "I've never tried E-shopping. Is it better than shopping at an actual store?", + "start_time": 27.791686726300835, + "end_time": 31.843568812468636, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_6_A.wav", + "silence_duration": 0.5612762719372549, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, much better. You can log in to a website, browse through many items and categories comfortably at home, order the goods, pay by credit or debit card, and the goods will be delivered to your home.", + "original_text": "Yes, much better. You can log in to a website, browse through many items and categories comfortably at home, order the goods, pay by credit or debit card, and the goods will be delivered to your home.", + "start_time": 32.32315917764763, + "end_time": 42.95789840667258, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_7_B.wav", + "silence_duration": 0.4795903651789988, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sounds good, and I don't have to queue up at the cashier.", + "original_text": "Sounds good, and I don't have to queue up at the cashier.", + "start_time": 43.31942214970942, + "end_time": 46.7791953923398, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_8_A.wav", + "silence_duration": 0.3615237430368396, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "And you can still go 'window shopping' just like in a real shopping mall.", + "original_text": "And you can still go 'window shopping' just like in a real shopping mall.", + "start_time": 47.198374599578294, + "end_time": 50.65814784220868, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_9_B.wav", + "silence_duration": 0.4191792072384957, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, are there any other advantages?", + "original_text": "Well, are there any other advantages?", + "start_time": 51.255756961565254, + "end_time": 54.03054154206412, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_10_A.wav", + "silence_duration": 0.5976091193565768, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, most of the shops are closed at 22 or even earlier, but the internet operates 24 hours a day, seven days a week, and can be accessed anywhere.", + "original_text": "Yes, most of the shops are closed at 22 or even earlier, but the internet operates 24 hours a day, seven days a week, and can be accessed anywhere.", + "start_time": 54.56680184882125, + "end_time": 63.42521454723395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_11_B.wav", + "silence_duration": 0.5362603067571259, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are there many choices of online shopping?", + "original_text": "Are there many choices of online shopping?", + "start_time": 63.99041075401458, + "end_time": 66.24274635492161, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_12_A.wav", + "silence_duration": 0.5651962067806303, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. You can buy almost anything you can think of, and there are often exclusive online discounts.", + "original_text": "Sure. You can buy almost anything you can think of, and there are often exclusive online discounts.", + "start_time": 66.55591063101234, + "end_time": 71.45532106185134, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--71/temp/line_13_B.wav", + "silence_duration": 0.3131642760907273, + "is_interrupted": false + } + ] + }, + "DialogSum--val--73": { + "original_text": "A: Hello. \nB: Hello. Is there anything I can do for you? \nA: Yes, please. I'd like to open a savings account. Would you please give me some [interrupt] advice on the best options available based on my financial goals and spending habits? \nB: Sorry to interrupt, but before we go into the details, could you tell me if you have any specific requirements or preferences for the account? \nA: Oh, I was actually going to ask for advice on the options, but sure. I don't have any specific requirements, just looking for something that allows flexibility. \nB: Certainly, I'll be very happy to help you. Usually, we offer current or fixed accounts for individuals. \nA: What's the difference between the two? \nB: If you open a fixed account, the interest rate is higher. \nA: Then how about the current account? \nB: You may withdraw the money at any time. You just need to present your deposit book. \nA: Thank you for your help. I think I'll open a current account. \nB: OK. Do you have your ID card on you? \nA: Yes. Oh, by the way, you mentioned earlier that you could give me some advice—was there anything else I should consider before finalizing this? \nB: Good point, I was going to mention that with a current account, while the flexibility is great, the interest rates are usually lower. But since you prefer flexibility, it seems like the right choice for you. \nA: That makes sense. Let's proceed. \nB: Good. Everything is done. Here is your deposit book and ID card.", + "cleaned_text": "A: Hello. \nB: Hello. Is there anything I can do for you? \nA:Yes, please. I'd like to open a savings account. Would you please give me some advice on the best options available based on my financial goals and spending habits?\nB: Sorry to interrupt, but before we go into the details, could you tell me if you have any specific requirements or preferences for the account? \nA: Oh, I was actually going to ask for advice on the options, but sure. I don't have any specific requirements, just looking for something that allows flexibility. \nB: Certainly, I'll be very happy to help you. Usually, we offer current or fixed accounts for individuals. \nA: What's the difference between the two? \nB: If you open a fixed account, the interest rate is higher. \nA: Then how about the current account? \nB: You may withdraw the money at any time. You just need to present your deposit book. \nA: Thank you for your help. I think I'll open a current account. \nB: OK. Do you have your ID card on you? \nA: Yes. Oh, by the way, you mentioned earlier that you could give me some advice—was there anything else I should consider before finalizing this? \nB: Good point, I was going to mention that with a current account, while the flexibility is great, the interest rates are usually lower. But since you prefer flexibility, it seems like the right choice for you. \nA: That makes sense. Let's proceed. \nB: Good. Everything is done. Here is your deposit book and ID card.", + "total_duration": 77.14104308390023, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello.", + "original_text": "Hello.", + "start_time": 0, + "end_time": 0.6501587301587302, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hello. Is there anything I can do for you?", + "original_text": "Hello. Is there anything I can do for you?", + "start_time": 0.962102155690056, + "end_time": 3.1796078246242967, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_1_B.wav", + "silence_duration": 0.31194342553132587, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, please. I'd like to open a savings account. Would you please give me some", + "original_text": "Yes, please. I'd like to open a savings account. Would you please give me some [interrupt] advice on the best options available based on my financial goals and spending habits?", + "start_time": 3.5311261602578763, + "end_time": 13.562146568421142, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_2_A.wav", + "silence_duration": 0.35151833563357954, + "is_interrupted": true, + "text_after_interrupt": "advice on the best options available based on my financial goals and spending habits?" + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but before we go into the details, could you tell me if you have any specific requirements or preferences for the account?", + "original_text": "Sorry to interrupt, but before we go into the details, could you tell me if you have any specific requirements or preferences for the account?", + "start_time": 8.267996908557196, + "end_time": 14.862464028738602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_3_B.wav", + "silence_duration": 0.4312173079568191, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was actually going to ask for advice on the options, but sure. I don't have any specific requirements, just looking for something that allows flexibility.", + "original_text": "Oh, I was actually going to ask for advice on the options, but sure. I don't have any specific requirements, just looking for something that allows flexibility.", + "start_time": 15.42420892833022, + "end_time": 25.66420892833022, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_4_A.wav", + "silence_duration": 0.561744899591619, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Certainly, I'll be very happy to help you. Usually, we offer current or fixed accounts for individuals.", + "original_text": "Certainly, I'll be very happy to help you. Usually, we offer current or fixed accounts for individuals.", + "start_time": 25.967857121785592, + "end_time": 31.15751698573117, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_5_B.wav", + "silence_duration": 0.3036481934553718, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What's the difference between the two?", + "original_text": "What's the difference between the two?", + "start_time": 31.683022986948416, + "end_time": 33.482569472209185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_6_A.wav", + "silence_duration": 0.5255060012172444, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If you open a fixed account, the interest rate is higher.", + "original_text": "If you open a fixed account, the interest rate is higher.", + "start_time": 33.9955271243027, + "end_time": 36.87480150071993, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_7_B.wav", + "silence_duration": 0.5129576520935117, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Then how about the current account?", + "original_text": "Then how about the current account?", + "start_time": 37.38506471082018, + "end_time": 39.27749101467506, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_8_A.wav", + "silence_duration": 0.5102632101002491, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You may withdraw the money at any time. You just need to present your deposit book.", + "original_text": "You may withdraw the money at any time. You just need to present your deposit book.", + "start_time": 39.61140946613619, + "end_time": 43.93032103076204, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_9_B.wav", + "silence_duration": 0.3339184514611283, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you for your help. I think I'll open a current account.", + "original_text": "Thank you for your help. I think I'll open a current account.", + "start_time": 44.44718235284508, + "end_time": 48.47584448436436, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_10_A.wav", + "silence_duration": 0.5168613220830475, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. Do you have your ID card on you?", + "original_text": "OK. Do you have your ID card on you?", + "start_time": 49.00564742166673, + "end_time": 51.17671318130392, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_11_B.wav", + "silence_duration": 0.5298029373023705, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes. Oh, by the way, you mentioned earlier that you could give me some advice—was there anything else I should consider before finalizing this?", + "original_text": "Yes. Oh, by the way, you mentioned earlier that you could give me some advice—was there anything else I should consider before finalizing this?", + "start_time": 51.512854983829385, + "end_time": 59.68627902011056, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_12_A.wav", + "silence_duration": 0.33614180252546527, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good point, I was going to mention that with a current account, while the flexibility is great, the interest rates are usually lower. But since you prefer flexibility, it seems like the right choice for you.", + "original_text": "Good point, I was going to mention that with a current account, while the flexibility is great, the interest rates are usually lower. But since you prefer flexibility, it seems like the right choice for you.", + "start_time": 60.17478863498272, + "end_time": 70.12453920187615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_13_B.wav", + "silence_duration": 0.48850961487215705, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That makes sense. Let's proceed.", + "original_text": "That makes sense. Let's proceed.", + "start_time": 70.62561936306754, + "end_time": 73.12176448778409, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_14_A.wav", + "silence_duration": 0.5010801611913906, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good. Everything is done. Here is your deposit book and ID card.", + "original_text": "Good. Everything is done. Here is your deposit book and ID card.", + "start_time": 73.64644665949398, + "end_time": 77.14104983409715, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--73/temp/line_15_B.wav", + "silence_duration": 0.5246821717098855, + "is_interrupted": false + } + ] + }, + "DialogSum--val--74": { + "original_text": "A: There have been too many unplanned shutdowns over the past few months. We'll have to make a few changes to the way we operate. We need to reduce our [interrupt] downtime and improve our overall efficiency by implementing better monitoring systems and streamlining our maintenance procedures.\n\nB: Sorry to jump in, but I'm wondering if we've looked into the root causes of these shutdowns? It might help us address the problem more effectively.\n\nA: Good point, identifying the root causes is crucial. But I was also going to mention that our maintenance team is fully stretched dealing with problems. We don't have time to carry out any preventive maintenance [interrupt] which could help us avoid these shutdowns in the first place by identifying potential issues before they escalate into major problems.\n\nB: That's definitely a challenge. Maybe we should consider bringing in temporary support or outsourcing some tasks to free up the team for preventive maintenance?", + "cleaned_text": "A:There have been too many unplanned shutdowns over the past few months. We'll have to make a few changes to the way we operate. We need to reduce our downtime and improve our overall efficiency by implementing better monitoring systems and streamlining our maintenance procedures.\n\nB: Sorry to jump in, but I'm wondering if we've looked into the root causes of these shutdowns? It might help us address the problem more effectively.\n\nA:Good point, identifying the root causes is crucial. But I was also going to mention that our maintenance team is fully stretched dealing with problems. We don't have time to carry out any preventive maintenance which could help us avoid these shutdowns in the first place by identifying potential issues before they escalate into major problems.\n\nB: That's definitely a challenge. Maybe we should consider bringing in temporary support or outsourcing some tasks to free up the team for preventive maintenance?", + "total_duration": 44.54775510204082, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--74/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--74/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--74/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "There have been too many unplanned shutdowns over the past few months. We'll have to make a few changes to the way we operate. We need to reduce our", + "original_text": "There have been too many unplanned shutdowns over the past few months. We'll have to make a few changes to the way we operate. We need to reduce our [interrupt] downtime and improve our overall efficiency by implementing better monitoring systems and streamlining our maintenance procedures.", + "start_time": 0, + "end_time": 16.27718820861678, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--74/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "downtime and improve our overall efficiency by implementing better monitoring systems and streamlining our maintenance procedures." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but I'm wondering if we've looked into the root causes of these shutdowns? It might help us address the problem more effectively.", + "original_text": "Sorry to jump in, but I'm wondering if we've looked into the root causes of these shutdowns? It might help us address the problem more effectively.", + "start_time": 8.231473922902495, + "end_time": 14.988480725623583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--74/temp/line_1_B.wav", + "silence_duration": 0.5791202711755608, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good point, identifying the root causes is crucial. But I was also going to mention that our maintenance team is fully stretched dealing with problems. We don't have time to carry out any preventive maintenance", + "original_text": "Good point, identifying the root causes is crucial. But I was also going to mention that our maintenance team is fully stretched dealing with problems. We don't have time to carry out any preventive maintenance [interrupt] which could help us avoid these shutdowns in the first place by identifying potential issues before they escalate into major problems.", + "start_time": 16.80705804664995, + "end_time": 36.137670291547906, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--74/temp/line_2_A.wav", + "silence_duration": 0.5298698380331683, + "is_interrupted": true, + "text_after_interrupt": "which could help us avoid these shutdowns in the first place by identifying potential issues before they escalate into major problems." + }, + { + "speaker": "B", + "text": "That's definitely a challenge. Maybe we should consider bringing in temporary support or outsourcing some tasks to free up the team for preventive maintenance?", + "original_text": "That's definitely a challenge. Maybe we should consider bringing in temporary support or outsourcing some tasks to free up the team for preventive maintenance?", + "start_time": 36.18860840429953, + "end_time": 44.54779207776892, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--74/temp/line_3_B.wav", + "silence_duration": 0.5593209974587157, + "is_interrupted": false + } + ] + }, + "DialogSum--val--75": { + "original_text": "A: Excuse me, I'm afraid you've parked in the wrong spot. \nB: Oh, really? Isn't this spot C40 [interrupt] in the C section near the main entrance where they usually have visitor parking available during business hours? I must have misread the sign. \nA: No, it's D408, my parking space. I have already paid for it. \nB: I'm sorry, I must have been confused. I had thought it's C section, but actually it's D section. By the way, you mentioned paying for it—how did you manage to reserve this exact spot? \nA: I reserved it through the building management a few months ago. But could you please move your car first? \nB: Of course, I'll move it right away. Thanks for letting me know.", + "cleaned_text": "A: Excuse me, I'm afraid you've parked in the wrong spot. \nB:Oh, really? Isn't this spot C40 in the C section near the main entrance where they usually have visitor parking available during business hours? I must have misread the sign.\nA: No, it's D408, my parking space. I have already paid for it. \nB: I'm sorry, I must have been confused. I had thought it's C section, but actually it's D section. By the way, you mentioned paying for it—how did you manage to reserve this exact spot? \nA: I reserved it through the building management a few months ago. But could you please move your car first? \nB: Of course, I'll move it right away. Thanks for letting me know.", + "total_duration": 33.088526077097505, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, I'm afraid you've parked in the wrong spot.", + "original_text": "Excuse me, I'm afraid you've parked in the wrong spot.", + "start_time": 0, + "end_time": 3.076643990929705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, really? Isn't this spot C40", + "original_text": "Oh, really? Isn't this spot C40 [interrupt] in the C section near the main entrance where they usually have visitor parking available during business hours? I must have misread the sign.", + "start_time": 3.6586582185844367, + "end_time": 13.608408785477861, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/temp/line_1_B.wav", + "silence_duration": 0.5820142276547313, + "is_interrupted": true, + "text_after_interrupt": "in the C section near the main entrance where they usually have visitor parking available during business hours? I must have misread the sign." + }, + { + "speaker": "A", + "text": "No, it's D408, my parking space. I have already paid for it.", + "original_text": "No, it's D408, my parking space. I have already paid for it.", + "start_time": 6.468272731056092, + "end_time": 11.42573304851641, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/temp/line_2_A.wav", + "silence_duration": 0.306794805451362, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm sorry, I must have been confused. I had thought it's C section, but actually it's D section. By the way, you mentioned paying for it—how did you manage to reserve this exact spot?", + "original_text": "I'm sorry, I must have been confused. I had thought it's C section, but actually it's D section. By the way, you mentioned paying for it—how did you manage to reserve this exact spot?", + "start_time": 14.170873646528381, + "end_time": 23.609785211154232, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/temp/line_3_B.wav", + "silence_duration": 0.5624648610505208, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I reserved it through the building management a few months ago. But could you please move your car first?", + "original_text": "I reserved it through the building management a few months ago. But could you please move your car first?", + "start_time": 24.045295169288007, + "end_time": 29.67613417155558, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/temp/line_4_A.wav", + "silence_duration": 0.43550995813377535, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course, I'll move it right away. Thanks for letting me know.", + "original_text": "Of course, I'll move it right away. Thanks for letting me know.", + "start_time": 29.98867614213116, + "end_time": 33.08854008770939, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--75/temp/line_5_B.wav", + "silence_duration": 0.31254197057557653, + "is_interrupted": false + } + ] + }, + "DialogSum--val--76": { + "original_text": "A: Why don't you watch where you're going? \nB: Me? You're the one who pulled out in front of me! \nA: There was plenty of room for me to pull out. You didn't have to stay in the lane you were [interrupt] about to change into, but I guess you didn't see me signaling because you were too busy looking at your phone or something. \nB: Hey, listen. I had every right to stay in the lane I was in. You were supposed to wait until I passed to pull out. And anyhow, you didn't give me any time to change lanes. All of a sudden--BANG--there you are right in front of me. \nA: I think my arm is broken. \nB: Sorry about your arm, but it serves you right. You need to learn how to drive. You're lucky you didn't get killed. And I'm lucky to be alive too. \nA: Listen, let's just wait until the police get here. Then we can decide whose fault this accident really was, instead of arguing about it now. \nB: Fine with me. I know the laws of the road. I'm not worried. \nA: I have a cell phone in my car. Now it's probably on the floor on the passenger side. Why don't you get it for me, and then I can call the police? \nB: Alright. \nA: It doesn't work. It looks like it's broken. I need to get to a hospital. You should drive me there. \nB: Oh, yeah? It's better if we make a police report first. Then you can go to the hospital. \nA: But you interrupted me earlier—I was going to say, then we can decide whose fault this accident was, but now my arm really hurts. Can we please just focus on getting me to a hospital first?", + "cleaned_text": "A: Why don't you watch where you're going? \nB: Me? You're the one who pulled out in front of me! \nA:There was plenty of room for me to pull out. You didn't have to stay in the lane you were about to change into, but I guess you didn't see me signaling because you were too busy looking at your phone or something.\nB: Hey, listen. I had every right to stay in the lane I was in. You were supposed to wait until I passed to pull out. And anyhow, you didn't give me any time to change lanes. All of a sudden--BANG--there you are right in front of me. \nA: I think my arm is broken. \nB: Sorry about your arm, but it serves you right. You need to learn how to drive. You're lucky you didn't get killed. And I'm lucky to be alive too. \nA: Listen, let's just wait until the police get here. Then we can decide whose fault this accident really was, instead of arguing about it now. \nB: Fine with me. I know the laws of the road. I'm not worried. \nA: I have a cell phone in my car. Now it's probably on the floor on the passenger side. Why don't you get it for me, and then I can call the police? \nB: Alright. \nA: It doesn't work. It looks like it's broken. I need to get to a hospital. You should drive me there. \nB: Oh, yeah? It's better if we make a police report first. Then you can go to the hospital. \nA: But you interrupted me earlier—I was going to say, then we can decide whose fault this accident was, but now my arm really hurts. Can we please just focus on getting me to a hospital first?", + "total_duration": 79.76993197278911, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Why don't you watch where you're going?", + "original_text": "Why don't you watch where you're going?", + "start_time": 0, + "end_time": 1.9388662131519274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Me? You're the one who pulled out in front of me!", + "original_text": "Me? You're the one who pulled out in front of me!", + "start_time": 2.239619920582935, + "end_time": 5.014404501081801, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_1_B.wav", + "silence_duration": 0.3007537074310076, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There was plenty of room for me to pull out. You didn't have to stay in the lane you were", + "original_text": "There was plenty of room for me to pull out. You didn't have to stay in the lane you were [interrupt] about to change into, but I guess you didn't see me signaling because you were too busy looking at your phone or something.", + "start_time": 5.574064552390713, + "end_time": 16.591933033116334, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_2_A.wav", + "silence_duration": 0.5596600513089123, + "is_interrupted": true, + "text_after_interrupt": "about to change into, but I guess you didn't see me signaling because you were too busy looking at your phone or something." + }, + { + "speaker": "B", + "text": "Hey, listen. I had every right to stay in the lane I was in. You were supposed to wait until I passed to pull out. And anyhow, you didn't give me any time to change lanes. All of a sudden--BANG--there you are right in front of me.", + "original_text": "Hey, listen. I had every right to stay in the lane I was in. You were supposed to wait until I passed to pull out. And anyhow, you didn't give me any time to change lanes. All of a sudden--BANG--there you are right in front of me.", + "start_time": 10.11356568617756, + "end_time": 22.582681332436064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_3_B.wav", + "silence_duration": 0.46246239821944274, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think my arm is broken.", + "original_text": "I think my arm is broken.", + "start_time": 23.124801710568686, + "end_time": 24.843078354559616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_4_A.wav", + "silence_duration": 0.5421203781326223, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry about your arm, but it serves you right. You need to learn how to drive. You're lucky you didn't get killed. And I'm lucky to be alive too.", + "original_text": "Sorry about your arm, but it serves you right. You need to learn how to drive. You're lucky you didn't get killed. And I'm lucky to be alive too.", + "start_time": 25.30174637203308, + "end_time": 32.79018174618274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_5_B.wav", + "silence_duration": 0.4586680174734621, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Listen, let's just wait until the police get here. Then we can decide whose fault this accident really was, instead of arguing about it now.", + "original_text": "Listen, let's just wait until the police get here. Then we can decide whose fault this accident really was, instead of arguing about it now.", + "start_time": 33.22751617086528, + "end_time": 41.64474973095598, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_6_A.wav", + "silence_duration": 0.43733442468253697, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fine with me. I know the laws of the road. I'm not worried.", + "original_text": "Fine with me. I know the laws of the road. I'm not worried.", + "start_time": 42.09889041077246, + "end_time": 45.175534401702166, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_7_B.wav", + "silence_duration": 0.45414067981648165, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I have a cell phone in my car. Now it's probably on the floor on the passenger side. Why don't you get it for me, and then I can call the police?", + "original_text": "I have a cell phone in my car. Now it's probably on the floor on the passenger side. Why don't you get it for me, and then I can call the police?", + "start_time": 45.70670574405629, + "end_time": 54.4374086919021, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_8_A.wav", + "silence_duration": 0.53117134235413, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Alright.", + "original_text": "Alright.", + "start_time": 54.88740366839444, + "end_time": 55.47951251193186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_9_B.wav", + "silence_duration": 0.449994976492344, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It doesn't work. It looks like it's broken. I need to get to a hospital. You should drive me there.", + "original_text": "It doesn't work. It looks like it's broken. I need to get to a hospital. You should drive me there.", + "start_time": 56.07357752194408, + "end_time": 62.551944868882856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_10_A.wav", + "silence_duration": 0.5940650100122192, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, yeah? It's better if we make a police report first. Then you can go to the hospital.", + "original_text": "Oh, yeah? It's better if we make a police report first. Then you can go to the hospital.", + "start_time": 62.93521391254929, + "end_time": 68.09004384452207, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_11_B.wav", + "silence_duration": 0.3832690436664279, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But you interrupted me earlier—I was going to say, then we can decide whose fault this accident was, but now my arm really hurts. Can we please just focus on getting me to a hospital first?", + "original_text": "But you interrupted me earlier—I was going to say, then we can decide whose fault this accident was, but now my arm really hurts. Can we please just focus on getting me to a hospital first?", + "start_time": 68.43860782998898, + "end_time": 79.76994569846971, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--76/temp/line_12_A.wav", + "silence_duration": 0.34856398546690925, + "is_interrupted": false + } + ] + }, + "DialogSum--val--77": { + "original_text": "A: I hear a businessman is building a dog park in our city. \nB: Really? What for? \nA: Obviously because there's a law against having dogs in the streets. \nB: Does it mean that dogs have to stay at home all the [interrupt] time if the owners don't take them to the park? That seems like it would lead to behavioral issues and pent-up energy for the poor animals. \nA: Wait, are you saying there's no alternative for dog owners? \nB: Well, I was just wondering if the dogs have to stay at home all the time. It sounds pretty cruel, right? Maybe a dog park is a good idea. \nA: Maybe they should just allow people to walk their dogs in the streets. \nB: But then streets could be a mess. \nA: Couldn't people clean up after their dogs?", + "cleaned_text": "A: I hear a businessman is building a dog park in our city. \nB: Really? What for? \nA: Obviously because there's a law against having dogs in the streets. \nB:Does it mean that dogs have to stay at home all the time if the owners don't take them to the park? That seems like it would lead to behavioral issues and pent-up energy for the poor animals.\nA: Wait, are you saying there's no alternative for dog owners? \nB: Well, I was just wondering if the dogs have to stay at home all the time. It sounds pretty cruel, right? Maybe a dog park is a good idea. \nA: Maybe they should just allow people to walk their dogs in the streets. \nB: But then streets could be a mess. \nA: Couldn't people clean up after their dogs?", + "total_duration": 36.615873015873014, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I hear a businessman is building a dog park in our city.", + "original_text": "I hear a businessman is building a dog park in our city.", + "start_time": 0, + "end_time": 3.297233560090703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Really? What for?", + "original_text": "Really? What for?", + "start_time": 3.8215811057255347, + "end_time": 5.156728498015784, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_1_B.wav", + "silence_duration": 0.5243475456348317, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Obviously because there's a law against having dogs in the streets.", + "original_text": "Obviously because there's a law against having dogs in the streets.", + "start_time": 5.751607124174983, + "end_time": 10.291108257961831, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_2_A.wav", + "silence_duration": 0.5948786261591987, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Does it mean that dogs have to stay at home all the", + "original_text": "Does it mean that dogs have to stay at home all the [interrupt] time if the owners don't take them to the park? That seems like it would lead to behavioral issues and pent-up energy for the poor animals.", + "start_time": 10.849613237633175, + "end_time": 19.38294657096651, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_3_B.wav", + "silence_duration": 0.5585049796713442, + "is_interrupted": true, + "text_after_interrupt": "time if the owners don't take them to the park? That seems like it would lead to behavioral issues and pent-up energy for the poor animals." + }, + { + "speaker": "A", + "text": "Wait, are you saying there's no alternative for dog owners?", + "original_text": "Wait, are you saying there's no alternative for dog owners?", + "start_time": 13.322538407701202, + "end_time": 17.09578103808669, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_4_A.wav", + "silence_duration": 0.3752228959165828, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I was just wondering if the dogs have to stay at home all the time. It sounds pretty cruel, right? Maybe a dog park is a good idea.", + "original_text": "Well, I was just wondering if the dogs have to stay at home all the time. It sounds pretty cruel, right? Maybe a dog park is a good idea.", + "start_time": 19.7891390453034, + "end_time": 27.49816398861406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_5_B.wav", + "silence_duration": 0.4061924743368894, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Maybe they should just allow people to walk their dogs in the streets.", + "original_text": "Maybe they should just allow people to walk their dogs in the streets.", + "start_time": 28.02940606133872, + "end_time": 31.640109009184524, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_6_A.wav", + "silence_duration": 0.531242072724659, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But then streets could be a mess.", + "original_text": "But then streets could be a mess.", + "start_time": 31.999549714756835, + "end_time": 33.64816649480218, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_7_B.wav", + "silence_duration": 0.3594407055723114, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Couldn't people clean up after their dogs?", + "original_text": "Couldn't people clean up after their dogs?", + "start_time": 34.20104260287845, + "end_time": 36.615917886325164, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--77/temp/line_8_A.wav", + "silence_duration": 0.5528761080762725, + "is_interrupted": false + } + ] + }, + "DialogSum--val--78": { + "original_text": "A: Hi Kevin! \nB: Hi Laura, long time no see! What have you been up to lately? \nA: Not much. I can assure you. And you? \nB: Much the same except I do have some big news. \nA: Come on. This suspense is killing me. \nB: No, really, what have you been doing these past few weeks? The last time I saw you, you were looking for a new [interrupt] opportunity to grow professionally, maybe even in a different industry that could challenge your skills and provide better career prospects. \nA: Job, right? Well, that's not exactly true. I was thinking about changing jobs. Luckily, they offered me a new position in the accounting department. \nB: A step up in the big business world. \nA: I wouldn't exaggerate, but I am pleased. I had been hoping to get a promotion for a while. So when it finally came through, I was relieved. Actually, that's why I was looking for a new job. I just didn't want to work there anymore if they weren't going to recognize my [interrupt] potential and all the hard work I had been putting in over the past few years, especially since I had taken on additional responsibilities without proper compensation. \nB: Efforts, I totally get it. Right, sometimes you can do your best and it seems like the others don't know you exist. I hope the money's better. \nA: I got a reasonable raise, now enough about me. I was just saying I didn't want to stay if they didn't recognize my efforts. But anyway, I'm dying to hear your news. \nB: I am getting married.", + "cleaned_text": "A: Hi Kevin! \nB: Hi Laura, long time no see! What have you been up to lately? \nA: Not much. I can assure you. And you? \nB: Much the same except I do have some big news. \nA: Come on. This suspense is killing me. \nB:No, really, what have you been doing these past few weeks? The last time I saw you, you were looking for a new opportunity to grow professionally, maybe even in a different industry that could challenge your skills and provide better career prospects.\nA: Job, right? Well, that's not exactly true. I was thinking about changing jobs. Luckily, they offered me a new position in the accounting department. \nB: A step up in the big business world. \nA:I wouldn't exaggerate, but I am pleased. I had been hoping to get a promotion for a while. So when it finally came through, I was relieved. Actually, that's why I was looking for a new job. I just didn't want to work there anymore if they weren't going to recognize my potential and all the hard work I had been putting in over the past few years, especially since I had taken on additional responsibilities without proper compensation.\nB: Efforts, I totally get it. Right, sometimes you can do your best and it seems like the others don't know you exist. I hope the money's better. \nA: I got a reasonable raise, now enough about me. I was just saying I didn't want to stay if they didn't recognize my efforts. But anyway, I'm dying to hear your news. \nB: I am getting married.", + "total_duration": 73.24598639455782, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi Kevin!", + "original_text": "Hi Kevin!", + "start_time": 0, + "end_time": 0.8359183673469388, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hi Laura, long time no see! What have you been up to lately?", + "original_text": "Hi Laura, long time no see! What have you been up to lately?", + "start_time": 1.2711947926123486, + "end_time": 4.6032582846758405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_1_B.wav", + "silence_duration": 0.4352764252654099, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not much. I can assure you. And you?", + "original_text": "Not much. I can assure you. And you?", + "start_time": 5.141428306731532, + "end_time": 7.358933975665773, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_2_A.wav", + "silence_duration": 0.5381700220556915, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Much the same except I do have some big news.", + "original_text": "Much the same except I do have some big news.", + "start_time": 7.697833219231287, + "end_time": 10.066268593380947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_3_B.wav", + "silence_duration": 0.3388992435655136, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Come on. This suspense is killing me.", + "original_text": "Come on. This suspense is killing me.", + "start_time": 10.406126702064782, + "end_time": 12.937101758754125, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_4_A.wav", + "silence_duration": 0.3398581086838353, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, really, what have you been doing these past few weeks? The last time I saw you, you were looking for a new", + "original_text": "No, really, what have you been doing these past few weeks? The last time I saw you, you were looking for a new [interrupt] opportunity to grow professionally, maybe even in a different industry that could challenge your skills and provide better career prospects.", + "start_time": 13.35070656298027, + "end_time": 25.88948207318435, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_5_B.wav", + "silence_duration": 0.413604804226144, + "is_interrupted": true, + "text_after_interrupt": "opportunity to grow professionally, maybe even in a different industry that could challenge your skills and provide better career prospects." + }, + { + "speaker": "A", + "text": "Job, right? Well, that's not exactly true. I was thinking about changing jobs. Luckily, they offered me a new position in the accounting department.", + "original_text": "Job, right? Well, that's not exactly true. I was thinking about changing jobs. Luckily, they offered me a new position in the accounting department.", + "start_time": 19.701364159352153, + "end_time": 28.733926517628795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_6_A.wav", + "silence_duration": 0.302409769548512, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "A step up in the big business world.", + "original_text": "A step up in the big business world.", + "start_time": 29.215690752364818, + "end_time": 31.189386897489534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_7_B.wav", + "silence_duration": 0.4817642347360224, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I wouldn't exaggerate, but I am pleased. I had been hoping to get a promotion for a while. So when it finally came through, I was relieved. Actually, that's why I was looking for a new job. I just didn't want to work there anymore if they weren't going to recognize my", + "original_text": "I wouldn't exaggerate, but I am pleased. I had been hoping to get a promotion for a while. So when it finally came through, I was relieved. Actually, that's why I was looking for a new job. I just didn't want to work there anymore if they weren't going to recognize my [interrupt] potential and all the hard work I had been putting in over the past few years, especially since I had taken on additional responsibilities without proper compensation.", + "start_time": 31.644326904746134, + "end_time": 56.00205933104999, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_8_A.wav", + "silence_duration": 0.45494000725660066, + "is_interrupted": true, + "text_after_interrupt": "potential and all the hard work I had been putting in over the past few years, especially since I had taken on additional responsibilities without proper compensation." + }, + { + "speaker": "B", + "text": "Efforts, I totally get it. Right, sometimes you can do your best and it seems like the others don't know you exist. I hope the money's better.", + "original_text": "Efforts, I totally get it. Right, sometimes you can do your best and it seems like the others don't know you exist. I hope the money's better.", + "start_time": 54.307934636491694, + "end_time": 61.23909109907673, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_9_B.wav", + "silence_duration": 0.37132994453731083, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I got a reasonable raise, now enough about me. I was just saying I didn't want to stay if they didn't recognize my efforts. But anyway, I'm dying to hear your news.", + "original_text": "I got a reasonable raise, now enough about me. I was just saying I didn't want to stay if they didn't recognize my efforts. But anyway, I'm dying to hear your news.", + "start_time": 61.69904128833277, + "end_time": 71.61396192325341, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_10_A.wav", + "silence_duration": 0.4599501892560396, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I am getting married.", + "original_text": "I am getting married.", + "start_time": 72.2127150292905, + "end_time": 73.24600301114991, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--78/temp/line_11_B.wav", + "silence_duration": 0.5987531060370751, + "is_interrupted": false + } + ] + }, + "DialogSum--val--79": { + "original_text": "A: Where were you yesterday? \nB: I was at home asleep. \nA: Asleep! I thought that you had to take an exam. \nB: I was sick. I had a fever. I couldn't [interrupt] even think clearly, let alone study for the exam, and my head was pounding so badly that I couldn't even keep my eyes open for more than a few minutes at a time. \nA: Wait, you had a fever? Did you see a doctor? \nB: No, I didn't. I just stayed in bed and rested. I couldn't get out of bed. \nA: You still look a little sick. You couldn't go back to [interrupt] sleep after the fever broke because you were too worried about missing the exam and falling behind in your coursework? \nB: Sorry to cut you off, but I actually wanted to ask—what did the professor say about missing the exam? \nA: He said that I'd be able to take a make-up. But I was asking if you could go back to bed now. \nB: I'm going now. I just came here to speak to my professor. \nA: Are you going straight home? \nB: I have to stop at the drugstore on the way. I need some aspirin. \nA: Do you think that you should walk that far? \nB: I have to walk. I didn't bring my car. I didn't think I'd be able to drive today.", + "cleaned_text": "A: Where were you yesterday? \nB: I was at home asleep. \nA: Asleep! I thought that you had to take an exam. \nB:I was sick. I had a fever. I couldn't even think clearly, let alone study for the exam, and my head was pounding so badly that I couldn't even keep my eyes open for more than a few minutes at a time.\nA: Wait, you had a fever? Did you see a doctor? \nB: No, I didn't. I just stayed in bed and rested. I couldn't get out of bed. \nA:You still look a little sick. You couldn't go back to sleep after the fever broke because you were too worried about missing the exam and falling behind in your coursework?\nB: Sorry to cut you off, but I actually wanted to ask—what did the professor say about missing the exam? \nA: He said that I'd be able to take a make-up. But I was asking if you could go back to bed now. \nB: I'm going now. I just came here to speak to my professor. \nA: Are you going straight home? \nB: I have to stop at the drugstore on the way. I need some aspirin. \nA: Do you think that you should walk that far? \nB: I have to walk. I didn't bring my car. I didn't think I'd be able to drive today.", + "total_duration": 56.79283446712018, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Where were you yesterday?", + "original_text": "Where were you yesterday?", + "start_time": 0, + "end_time": 1.3931972789115645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was at home asleep.", + "original_text": "I was at home asleep.", + "start_time": 1.7172676607920705, + "end_time": 3.029195098433794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_1_B.wav", + "silence_duration": 0.3240703818805061, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Asleep! I thought that you had to take an exam.", + "original_text": "Asleep! I thought that you had to take an exam.", + "start_time": 3.604094551988534, + "end_time": 6.344049200514611, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_2_A.wav", + "silence_duration": 0.57489945355474, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was sick. I had a fever. I couldn't", + "original_text": "I was sick. I had a fever. I couldn't [interrupt] even think clearly, let alone study for the exam, and my head was pounding so badly that I couldn't even keep my eyes open for more than a few minutes at a time.", + "start_time": 6.786360576797874, + "end_time": 17.525589601741185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_3_B.wav", + "silence_duration": 0.44231137628326206, + "is_interrupted": true, + "text_after_interrupt": "even think clearly, let alone study for the exam, and my head was pounding so badly that I couldn't even keep my eyes open for more than a few minutes at a time." + }, + { + "speaker": "A", + "text": "Wait, you had a fever? Did you see a doctor?", + "original_text": "Wait, you had a fever? Did you see a doctor?", + "start_time": 9.015476223056377, + "end_time": 11.906360576797873, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_4_A.wav", + "silence_duration": 0.5890030783099681, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, I didn't. I just stayed in bed and rested. I couldn't get out of bed.", + "original_text": "No, I didn't. I just stayed in bed and rested. I couldn't get out of bed.", + "start_time": 17.965001712082252, + "end_time": 22.098153639519893, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_5_B.wav", + "silence_duration": 0.4394121103410683, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You still look a little sick. You couldn't go back to", + "original_text": "You still look a little sick. You couldn't go back to [interrupt] sleep after the fever broke because you were too worried about missing the exam and falling behind in your coursework?", + "start_time": 22.659395453877558, + "end_time": 32.16796688244899, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_6_A.wav", + "silence_duration": 0.5612418143576663, + "is_interrupted": true, + "text_after_interrupt": "sleep after the fever broke because you were too worried about missing the exam and falling behind in your coursework?" + }, + { + "speaker": "B", + "text": "Sorry to cut you off, but I actually wanted to ask—what did the professor say about missing the exam?", + "original_text": "Sorry to cut you off, but I actually wanted to ask—what did the professor say about missing the exam?", + "start_time": 29.252490326050605, + "end_time": 34.52342003126603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_7_B.wav", + "silence_duration": 0.5663501876021424, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "He said that I'd be able to take a make-up. But I was asking if you could go back to bed now.", + "original_text": "He said that I'd be able to take a make-up. But I was asking if you could go back to bed now.", + "start_time": 35.09297018478669, + "end_time": 40.46838968592047, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_8_A.wav", + "silence_duration": 0.5695501535206606, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm going now. I just came here to speak to my professor.", + "original_text": "I'm going now. I just came here to speak to my professor.", + "start_time": 40.89949435296868, + "end_time": 44.092238117141015, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_9_B.wav", + "silence_duration": 0.43110466704820916, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you going straight home?", + "original_text": "Are you going straight home?", + "start_time": 44.44943463750609, + "end_time": 45.900681803038964, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_10_A.wav", + "silence_duration": 0.35719652036506944, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have to stop at the drugstore on the way. I need some aspirin.", + "original_text": "I have to stop at the drugstore on the way. I need some aspirin.", + "start_time": 46.35480032726679, + "end_time": 49.66364386468175, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_11_B.wav", + "silence_duration": 0.45411852422782173, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you think that you should walk that far?", + "original_text": "Do you think that you should walk that far?", + "start_time": 50.0847090317094, + "end_time": 52.16289497275248, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_12_A.wav", + "silence_duration": 0.4210651670276461, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have to walk. I didn't bring my car. I didn't think I'd be able to drive today.", + "original_text": "I have to walk. I didn't bring my car. I didn't think I'd be able to drive today.", + "start_time": 52.63649167150042, + "end_time": 56.79286355358659, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--79/temp/line_13_B.wav", + "silence_duration": 0.47359669874793764, + "is_interrupted": false + } + ] + }, + "DialogSum--val--80": { + "original_text": "A: What a great day! Hey, Tom, do you want to go to the beach this weekend? \nB: Yeah, that is a great idea. Maybe Sara would like to come along with us. \nA: I doubt it. \nB: Why? You are kidding! You know, she loves watching the [interrupt] waves and relaxing by the ocean, especially during sunset when the colors reflect beautifully on the water's surface. \nA: But yesterday afternoon she told me that she would go home this Saturday. \nB: What happened? \nA: She said that her mother was ill and stayed in the hospital, and therefore she wanted to go home to see her. \nB: I am sorry to hear that. Well, what do you think? Should we take some food? \nA: That sounds great. Maybe we could have a picnic on the beach. Then let's take some sandwiches, chips, and uh... maybe some fruit like apples or grapes. \nB: Oh, don't forget the salad as well. We should also take some drinks like Coke and beer. \nA: Good point. In addition, we had better pack beach towels and sun cream. \nB: OK. Please don't forget to give me a call and let's go down together. By the way, you were about to mention something else before I interrupted—what was it? \nA: Oh, right! I was going to say we should take some fruit as well.", + "cleaned_text": "A: What a great day! Hey, Tom, do you want to go to the beach this weekend? \nB: Yeah, that is a great idea. Maybe Sara would like to come along with us. \nA: I doubt it. \nB:Why? You are kidding! You know, she loves watching the waves and relaxing by the ocean, especially during sunset when the colors reflect beautifully on the water's surface.\nA: But yesterday afternoon she told me that she would go home this Saturday. \nB: What happened? \nA: She said that her mother was ill and stayed in the hospital, and therefore she wanted to go home to see her. \nB: I am sorry to hear that. Well, what do you think? Should we take some food? \nA: That sounds great. Maybe we could have a picnic on the beach. Then let's take some sandwiches, chips, and uh... maybe some fruit like apples or grapes. \nB: Oh, don't forget the salad as well. We should also take some drinks like Coke and beer. \nA: Good point. In addition, we had better pack beach towels and sun cream. \nB: OK. Please don't forget to give me a call and let's go down together. By the way, you were about to mention something else before I interrupted—what was it? \nA: Oh, right! I was going to say we should take some fruit as well.", + "total_duration": 64.30299319727891, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What a great day! Hey, Tom, do you want to go to the beach this weekend?", + "original_text": "What a great day! Hey, Tom, do you want to go to the beach this weekend?", + "start_time": 0, + "end_time": 4.829750566893424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, that is a great idea. Maybe Sara would like to come along with us.", + "original_text": "Yeah, that is a great idea. Maybe Sara would like to come along with us.", + "start_time": 5.329963208977045, + "end_time": 9.103205839362532, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_1_B.wav", + "silence_duration": 0.5002126420836203, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I doubt it.", + "original_text": "I doubt it.", + "start_time": 9.44766067440427, + "end_time": 10.376458860345313, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_2_A.wav", + "silence_duration": 0.3444548350417375, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why? You are kidding! You know, she loves watching the", + "original_text": "Why? You are kidding! You know, she loves watching the [interrupt] waves and relaxing by the ocean, especially during sunset when the colors reflect beautifully on the water's surface.", + "start_time": 10.784551532817321, + "end_time": 19.236615024880813, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_3_B.wav", + "silence_duration": 0.4080926724720081, + "is_interrupted": true, + "text_after_interrupt": "waves and relaxing by the ocean, especially during sunset when the colors reflect beautifully on the water's surface." + }, + { + "speaker": "A", + "text": "But yesterday afternoon she told me that she would go home this Saturday.", + "original_text": "But yesterday afternoon she told me that she would go home this Saturday.", + "start_time": 13.478066272046346, + "end_time": 17.27452885708036, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_4_A.wav", + "silence_duration": 0.4907503844440776, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What happened?", + "original_text": "What happened?", + "start_time": 19.80332229968364, + "end_time": 20.476700984490897, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_5_B.wav", + "silence_duration": 0.5667072748028268, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "She said that her mother was ill and stayed in the hospital, and therefore she wanted to go home to see her.", + "original_text": "She said that her mother was ill and stayed in the hospital, and therefore she wanted to go home to see her.", + "start_time": 20.81431933428865, + "end_time": 26.793457656284115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_6_A.wav", + "silence_duration": 0.3376183497977554, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I am sorry to hear that. Well, what do you think? Should we take some food?", + "original_text": "I am sorry to hear that. Well, what do you think? Should we take some food?", + "start_time": 27.109007437644625, + "end_time": 31.20732943310948, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_7_B.wav", + "silence_duration": 0.3155497813605106, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds great. Maybe we could have a picnic on the beach. Then let's take some sandwiches, chips, and uh... maybe some fruit like apples or grapes.", + "original_text": "That sounds great. Maybe we could have a picnic on the beach. Then let's take some sandwiches, chips, and uh... maybe some fruit like apples or grapes.", + "start_time": 31.588062290586038, + "end_time": 41.317223288318466, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_8_A.wav", + "silence_duration": 0.3807328574765576, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, don't forget the salad as well. We should also take some drinks like Coke and beer.", + "original_text": "Oh, don't forget the salad as well. We should also take some drinks like Coke and beer.", + "start_time": 41.867467655989856, + "end_time": 46.38374883512818, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_9_B.wav", + "silence_duration": 0.5502443676713911, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good point. In addition, we had better pack beach towels and sun cream.", + "original_text": "Good point. In addition, we had better pack beach towels and sun cream.", + "start_time": 46.97156762860286, + "end_time": 51.522678739713974, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_10_A.wav", + "silence_duration": 0.5878187934746821, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. Please don't forget to give me a call and let's go down together. By the way, you were about to mention something else before I interrupted—what was it?", + "original_text": "OK. Please don't forget to give me a call and let's go down together. By the way, you were about to mention something else before I interrupted—what was it?", + "start_time": 51.83636718403142, + "end_time": 60.03301117496112, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_11_B.wav", + "silence_duration": 0.31368844431744575, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right! I was going to say we should take some fruit as well.", + "original_text": "Oh, right! I was going to say we should take some fruit as well.", + "start_time": 60.5646036355258, + "end_time": 64.3030163339385, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--80/temp/line_12_A.wav", + "silence_duration": 0.53159246056468, + "is_interrupted": false + } + ] + }, + "DialogSum--val--81": { + "original_text": "A: Well, I was walking home from work two days ago, enjoying the nature all around me ... the birds, the frogs, the flowing stream ... [interrupt] the gentle breeze, and the colors of the sunset were just beautiful, creating this perfect peaceful atmosphere that made me completely forget about the stresses of the workday.\nB: Sorry to interrupt, but did this happen during the day or at night?\nA: Oh, it was in the evening, just before sunset. Anyway, I was walking, when this woman knocked me right off my feet, grabbed my stuff, and ran off through the trees. I was so surprised by the ordeal that I didn't go after her.\nB: Yeah. Can you describe the woman for me?\nA: Yeah. He was about a hundred and ninety centimeters tall ...\nB: Wait. You said a woman robbed you.\nA: Well, I'm not really sure. You see, the person was wearing a white and black polka dot dress, a light red sweater over it, and she ... or he ... was wearing a pair of basketball shoes.\nB: Humm. What else can you tell me?\nA: Okay. Like I said, the person was about 190 centimeters tall, heavy build, with long wavy hair. She ... or he ... was probably in his or her late 30's. I didn't get a good look at the person's face, but well ... uh ....\nB: What? Was there something else?\nA: Well, the person ... had a beard.\nB: Ah! What was, uh, taken ... exactly?", + "cleaned_text": "A:Well, I was walking home from work two days ago, enjoying the nature all around me ... the birds, the frogs, the flowing stream ... the gentle breeze, and the colors of the sunset were just beautiful, creating this perfect peaceful atmosphere that made me completely forget about the stresses of the workday.\nB: Sorry to interrupt, but did this happen during the day or at night?\nA: Oh, it was in the evening, just before sunset. Anyway, I was walking, when this woman knocked me right off my feet, grabbed my stuff, and ran off through the trees. I was so surprised by the ordeal that I didn't go after her.\nB: Yeah. Can you describe the woman for me?\nA: Yeah. He was about a hundred and ninety centimeters tall ...\nB: Wait. You said a woman robbed you.\nA: Well, I'm not really sure. You see, the person was wearing a white and black polka dot dress, a light red sweater over it, and she ... or he ... was wearing a pair of basketball shoes.\nB: Humm. What else can you tell me?\nA: Okay. Like I said, the person was about 190 centimeters tall, heavy build, with long wavy hair. She ... or he ... was probably in his or her late 30's. I didn't get a good look at the person's face, but well ... uh ....\nB: What? Was there something else?\nA: Well, the person ... had a beard.\nB: Ah! What was, uh, taken ... exactly?", + "total_duration": 81.14367346938775, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, I was walking home from work two days ago, enjoying the nature all around me ... the birds, the frogs, the flowing stream ...", + "original_text": "Well, I was walking home from work two days ago, enjoying the nature all around me ... the birds, the frogs, the flowing stream ... [interrupt] the gentle breeze, and the colors of the sunset were just beautiful, creating this perfect peaceful atmosphere that made me completely forget about the stresses of the workday.", + "start_time": 0, + "end_time": 17.99546485260771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "the gentle breeze, and the colors of the sunset were just beautiful, creating this perfect peaceful atmosphere that made me completely forget about the stresses of the workday." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but did this happen during the day or at night?", + "original_text": "Sorry to interrupt, but did this happen during the day or at night?", + "start_time": 7.836734693877551, + "end_time": 11.215238095238096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_1_B.wav", + "silence_duration": 0.3437209749218077, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, it was in the evening, just before sunset. Anyway, I was walking, when this woman knocked me right off my feet, grabbed my stuff, and ran off through the trees. I was so surprised by the ordeal that I didn't go after her.", + "original_text": "Oh, it was in the evening, just before sunset. Anyway, I was walking, when this woman knocked me right off my feet, grabbed my stuff, and ran off through the trees. I was so surprised by the ordeal that I didn't go after her.", + "start_time": 18.377319254227707, + "end_time": 31.856502927697093, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_2_A.wav", + "silence_duration": 0.3818544016199951, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah. Can you describe the woman for me?", + "original_text": "Yeah. Can you describe the woman for me?", + "start_time": 32.278729153745125, + "end_time": 34.80970421043447, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_3_B.wav", + "silence_duration": 0.4222262260480344, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah. He was about a hundred and ninety centimeters tall ...", + "original_text": "Yeah. He was about a hundred and ninety centimeters tall ...", + "start_time": 35.24865013934031, + "end_time": 39.079942656347114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_4_A.wav", + "silence_duration": 0.4389459289058424, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait. You said a woman robbed you.", + "original_text": "Wait. You said a woman robbed you.", + "start_time": 39.54958763662519, + "end_time": 41.9644629200719, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_5_B.wav", + "silence_duration": 0.4696449802780779, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I'm not really sure. You see, the person was wearing a white and black polka dot dress, a light red sweater over it, and she ... or he ... was wearing a pair of basketball shoes.", + "original_text": "Well, I'm not really sure. You see, the person was wearing a white and black polka dot dress, a light red sweater over it, and she ... or he ... was wearing a pair of basketball shoes.", + "start_time": 42.43334412094043, + "end_time": 54.11298130914905, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_6_A.wav", + "silence_duration": 0.46888120086852847, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Humm. What else can you tell me?", + "original_text": "Humm. What else can you tell me?", + "start_time": 54.705829494959865, + "end_time": 56.737575526705896, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_7_B.wav", + "silence_duration": 0.592848185810817, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Okay. Like I said, the person was about 190 centimeters tall, heavy build, with long wavy hair. She ... or he ... was probably in his or her late 30's. I didn't get a good look at the person's face, but well ... uh ....", + "original_text": "Okay. Like I said, the person was about 190 centimeters tall, heavy build, with long wavy hair. She ... or he ... was probably in his or her late 30's. I didn't get a good look at the person's face, but well ... uh ....", + "start_time": 57.31069415080311, + "end_time": 73.901351747175, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_8_A.wav", + "silence_duration": 0.5731186240972155, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What? Was there something else?", + "original_text": "What? Was there something else?", + "start_time": 74.42761567578117, + "end_time": 76.15750229709636, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_9_B.wav", + "silence_duration": 0.526263928606171, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, the person ... had a beard.", + "original_text": "Well, the person ... had a beard.", + "start_time": 76.56964188041877, + "end_time": 78.43884822962512, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_10_A.wav", + "silence_duration": 0.41213958332241263, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ah! What was, uh, taken ... exactly?", + "original_text": "Ah! What was, uh, taken ... exactly?", + "start_time": 78.8913459195765, + "end_time": 81.14368152048353, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--81/temp/line_11_B.wav", + "silence_duration": 0.4524976899513702, + "is_interrupted": false + } + ] + }, + "DialogSum--val--82": { + "original_text": "A: I don't know what Jim's got to grumble about. My workload has doubled in the past year and I still [interrupt] manage to keep up with everything without much complaint, even though I've had to work late several nights a week and skip lunch breaks to meet all the deadlines.\nB: Sorry to jump in, but do you think the boss is aware of how much your workload has increased? Maybe that's why he's more lenient with you.\nA: He might be, but I was going to say that Jim isn't doing anything different from when he arrived, as far as I can see.\nB: Yeah, but he's not as energetic as you are. Well, no one is. But the boss doesn't blame me when I get a bit behind. He is very understanding with me. But with Jim, he goes on and on.\nA: Speaking of the boss, I didn't finish earlier—do you think he knows how much Jim's workload has changed since he started? Or does he think Jim's just not pulling his weight?", + "cleaned_text": "A:I don't know what Jim's got to grumble about. My workload has doubled in the past year and I still manage to keep up with everything without much complaint, even though I've had to work late several nights a week and skip lunch breaks to meet all the deadlines.\nB: Sorry to jump in, but do you think the boss is aware of how much your workload has increased? Maybe that's why he's more lenient with you.\nA: He might be, but I was going to say that Jim isn't doing anything different from when he arrived, as far as I can see.\nB: Yeah, but he's not as energetic as you are. Well, no one is. But the boss doesn't blame me when I get a bit behind. He is very understanding with me. But with Jim, he goes on and on.\nA: Speaking of the boss, I didn't finish earlier—do you think he knows how much Jim's workload has changed since he started? Or does he think Jim's just not pulling his weight?", + "total_duration": 42.286303854875285, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I don't know what Jim's got to grumble about. My workload has doubled in the past year and I still", + "original_text": "I don't know what Jim's got to grumble about. My workload has doubled in the past year and I still [interrupt] manage to keep up with everything without much complaint, even though I've had to work late several nights a week and skip lunch breaks to meet all the deadlines.", + "start_time": 0, + "end_time": 14.349931972789115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "manage to keep up with everything without much complaint, even though I've had to work late several nights a week and skip lunch breaks to meet all the deadlines." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you think the boss is aware of how much your workload has increased? Maybe that's why he's more lenient with you.", + "original_text": "Sorry to jump in, but do you think the boss is aware of how much your workload has increased? Maybe that's why he's more lenient with you.", + "start_time": 5.851428571428571, + "end_time": 13.142494331065759, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/temp/line_1_B.wav", + "silence_duration": 0.495830806625727, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "He might be, but I was going to say that Jim isn't doing anything different from when he arrived, as far as I can see.", + "original_text": "He might be, but I was going to say that Jim isn't doing anything different from when he arrived, as far as I can see.", + "start_time": 14.918961478660325, + "end_time": 21.571478485463047, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/temp/line_2_A.wav", + "silence_duration": 0.56902950587121, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, but he's not as energetic as you are. Well, no one is. But the boss doesn't blame me when I get a bit behind. He is very understanding with me. But with Jim, he goes on and on.", + "original_text": "Yeah, but he's not as energetic as you are. Well, no one is. But the boss doesn't blame me when I get a bit behind. He is very understanding with me. But with Jim, he goes on and on.", + "start_time": 22.03696297152614, + "end_time": 31.92866365179825, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/temp/line_3_B.wav", + "silence_duration": 0.46548448606309256, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Speaking of the boss, I didn't finish earlier—do you think he knows how much Jim's workload has changed since he started? Or does he think Jim's just not pulling his weight?", + "original_text": "Speaking of the boss, I didn't finish earlier—do you think he knows how much Jim's workload has changed since he started? Or does he think Jim's just not pulling his weight?", + "start_time": 32.452654550199725, + "end_time": 42.286305343850515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--82/temp/line_4_A.wav", + "silence_duration": 0.523990898401476, + "is_interrupted": false + } + ] + }, + "DialogSum--val--83": { + "original_text": "A: I'd like to find a job.\nB: We have several part-time jobs available here. Would you like to [interrupt] hear more about them, or do you have a specific type of job in mind? We have positions ranging from customer service to technical support and even some entry-level IT roles.\nA: Sorry to jump in, could you tell me if any of these jobs are related to technology? I'm particularly interested in roles that involve working with computers.\nB: Yes, we do have a job at the computer center. Would you like to apply for it?\nA: Yes, thank you. I was about to ask if I need to fill out any forms for the application process [interrupt] or if there's an interview I should prepare for, and what kind of documentation I might need to bring with me for the hiring process.\nB: Please fill out the form.", + "cleaned_text": "A: I'd like to find a job.\nB:We have several part-time jobs available here. Would you like to hear more about them, or do you have a specific type of job in mind? We have positions ranging from customer service to technical support and even some entry-level IT roles.\nA: Sorry to jump in, could you tell me if any of these jobs are related to technology? I'm particularly interested in roles that involve working with computers.\nB: Yes, we do have a job at the computer center. Would you like to apply for it?\nA:Yes, thank you. I was about to ask if I need to fill out any forms for the application process or if there's an interview I should prepare for, and what kind of documentation I might need to bring with me for the hiring process.\nB: Please fill out the form.", + "total_duration": 37.43424036281179, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'd like to find a job.", + "original_text": "I'd like to find a job.", + "start_time": 0, + "end_time": 1.497687074829932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We have several part-time jobs available here. Would you like to", + "original_text": "We have several part-time jobs available here. Would you like to [interrupt] hear more about them, or do you have a specific type of job in mind? We have positions ranging from customer service to technical support and even some entry-level IT roles.", + "start_time": 1.8874399028055748, + "end_time": 15.146034007113965, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/temp/line_1_B.wav", + "silence_duration": 0.38975282797564287, + "is_interrupted": true, + "text_after_interrupt": "hear more about them, or do you have a specific type of job in mind? We have positions ranging from customer service to technical support and even some entry-level IT roles." + }, + { + "speaker": "A", + "text": "Sorry to jump in, could you tell me if any of these jobs are related to technology? I'm particularly interested in roles that involve working with computers.", + "original_text": "Sorry to jump in, could you tell me if any of these jobs are related to technology? I'm particularly interested in roles that involve working with computers.", + "start_time": 4.998913825708069, + "end_time": 14.867394551331651, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/temp/line_2_A.wav", + "silence_duration": 0.5735690309665286, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, we do have a job at the computer center. Would you like to apply for it?", + "original_text": "Yes, we do have a job at the computer center. Would you like to apply for it?", + "start_time": 15.5158027243346, + "end_time": 19.230995468098772, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/temp/line_3_B.wav", + "silence_duration": 0.36976871722063465, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, thank you. I was about to ask if I need to fill out any forms for the application process", + "original_text": "Yes, thank you. I was about to ask if I need to fill out any forms for the application process [interrupt] or if there's an interview I should prepare for, and what kind of documentation I might need to bring with me for the hiring process.", + "start_time": 19.61296481272584, + "end_time": 32.51164961998207, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/temp/line_4_A.wav", + "silence_duration": 0.381969344627067, + "is_interrupted": true, + "text_after_interrupt": "or if there's an interview I should prepare for, and what kind of documentation I might need to bring with me for the hiring process." + }, + { + "speaker": "B", + "text": "Please fill out the form.", + "original_text": "Please fill out the form.", + "start_time": 36.12234996406859, + "end_time": 37.43427740171031, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--83/temp/line_5_B.wav", + "silence_duration": 0.5540416784786463, + "is_interrupted": false + } + ] + }, + "DialogSum--val--84": { + "original_text": "A: What did the boss say to you? \nB: He asked me to beef up in the work. \nA: Yeah. You look so unhappy recently. What's the [interrupt] making you feel this way? Is it just work-related stress or is there something else going on in your personal life that's affecting your mood? \nB: Sorry to cut you off, but when you say \"beef up,\" do you mean he wants you to take on more responsibility or just improve your current tasks? \nA: He wants me to improve my current tasks. By the way, you were asking what's the matter with me. Nothing, thanks. I am just not in the mood these days.", + "cleaned_text": "A: What did the boss say to you? \nB: He asked me to beef up in the work. \nA:Yeah. You look so unhappy recently. What's the making you feel this way? Is it just work-related stress or is there something else going on in your personal life that's affecting your mood?\nB: Sorry to cut you off, but when you say \"beef up,\" do you mean he wants you to take on more responsibility or just improve your current tasks? \nA: He wants me to improve my current tasks. By the way, you were asking what's the matter with me. Nothing, thanks. I am just not in the mood these days.", + "total_duration": 25.80063492063492, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What did the boss say to you?", + "original_text": "What did the boss say to you?", + "start_time": 0, + "end_time": 1.6486167800453515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "He asked me to beef up in the work.", + "original_text": "He asked me to beef up in the work.", + "start_time": 2.0874775963933536, + "end_time": 3.6432145578446007, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/temp/line_1_B.wav", + "silence_duration": 0.43886081634800195, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah. You look so unhappy recently. What's the", + "original_text": "Yeah. You look so unhappy recently. What's the [interrupt] making you feel this way? Is it just work-related stress or is there something else going on in your personal life that's affecting your mood?", + "start_time": 4.0182716758889825, + "end_time": 15.976548319879912, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/temp/line_2_A.wav", + "silence_duration": 0.3750571180443814, + "is_interrupted": true, + "text_after_interrupt": "making you feel this way? Is it just work-related stress or is there something else going on in your personal life that's affecting your mood?" + }, + { + "speaker": "B", + "text": "Sorry to cut you off, but when you say \"beef up,\" do you mean he wants you to take on more responsibility or just improve your current tasks?", + "original_text": "Sorry to cut you off, but when you say \"beef up,\" do you mean he wants you to take on more responsibility or just improve your current tasks?", + "start_time": 7.79151430627447, + "end_time": 15.500539249585128, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/temp/line_3_B.wav", + "silence_duration": 0.31218725088591764, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "He wants me to improve my current tasks. By the way, you were asking what's the matter with me. Nothing, thanks. I am just not in the mood these days.", + "original_text": "He wants me to improve my current tasks. By the way, you were asking what's the matter with me. Nothing, thanks. I am just not in the mood these days.", + "start_time": 16.4313933783313, + "end_time": 25.800645079011574, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--84/temp/line_4_A.wav", + "silence_duration": 0.4548450584513869, + "is_interrupted": false + } + ] + }, + "DialogSum--val--85": { + "original_text": "A: I'll always remember my college days.\nB: Oh yeah?\nA: It was one of the best times in my life. It was tough, but I made it. I became a college [interrupt] graduate and made lifelong friends along the way while also developing valuable skills that have served me well throughout my professional career.\nB: Sorry to jump in, but how did you feel when you finally graduated? That must have been a big moment.\nA: It was a proud day for me. My family attended the graduation ceremony. I was so nervous. I couldn't find my cap and gown, but it all worked out in the end.\nB: What did you do after graduation?\nA: I was planning to attend graduate school, but then I was offered a good job doing marketing, so I changed my [interrupt] career path and decided to enter the workforce instead of pursuing further education immediately, which turned out to be the right choice for me.\nB: Marketing? That sounds like a great opportunity. Are you happy with your decision?\nA: I sure am. But I was going to say I changed my mind about grad school. So, what about you? How did you feel when you graduated?\nB: It was also a proud day for me, but I also felt like a kind of loss that day.\nA: How could it be?\nB: While seeing others going to work or continue their study, I didn't know what I would do.", + "cleaned_text": "A: I'll always remember my college days.\nB: Oh yeah?\nA:It was one of the best times in my life. It was tough, but I made it. I became a college graduate and made lifelong friends along the way while also developing valuable skills that have served me well throughout my professional career.\nB: Sorry to jump in, but how did you feel when you finally graduated? That must have been a big moment.\nA: It was a proud day for me. My family attended the graduation ceremony. I was so nervous. I couldn't find my cap and gown, but it all worked out in the end.\nB: What did you do after graduation?\nA:I was planning to attend graduate school, but then I was offered a good job doing marketing, so I changed my career path and decided to enter the workforce instead of pursuing further education immediately, which turned out to be the right choice for me.\nB: Marketing? That sounds like a great opportunity. Are you happy with your decision?\nA: I sure am. But I was going to say I changed my mind about grad school. So, what about you? How did you feel when you graduated?\nB: It was also a proud day for me, but I also felt like a kind of loss that day.\nA: How could it be?\nB: While seeing others going to work or continue their study, I didn't know what I would do.", + "total_duration": 68.11301587301587, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'll always remember my college days.", + "original_text": "I'll always remember my college days.", + "start_time": 0, + "end_time": 2.2987755102040817, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh yeah?", + "original_text": "Oh yeah?", + "start_time": 2.690507980900682, + "end_time": 3.305836779086623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_1_B.wav", + "silence_duration": 0.39173247069660067, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It was one of the best times in my life. It was tough, but I made it. I became a college", + "original_text": "It was one of the best times in my life. It was tough, but I made it. I became a college [interrupt] graduate and made lifelong friends along the way while also developing valuable skills that have served me well throughout my professional career.", + "start_time": 3.6142188638831714, + "end_time": 17.929320904699498, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_2_A.wav", + "silence_duration": 0.30838208479654833, + "is_interrupted": true, + "text_after_interrupt": "graduate and made lifelong friends along the way while also developing valuable skills that have served me well throughout my professional career." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but how did you feel when you finally graduated? That must have been a big moment.", + "original_text": "Sorry to jump in, but how did you feel when you finally graduated? That must have been a big moment.", + "start_time": 10.289955825334419, + "end_time": 15.119706392227844, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_3_B.wav", + "silence_duration": 0.45512343855087045, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It was a proud day for me. My family attended the graduation ceremony. I was so nervous. I couldn't find my cap and gown, but it all worked out in the end.", + "original_text": "It was a proud day for me. My family attended the graduation ceremony. I was so nervous. I couldn't find my cap and gown, but it all worked out in the end.", + "start_time": 18.411521134976518, + "end_time": 29.023040409352937, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_4_A.wav", + "silence_duration": 0.4822002302770184, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What did you do after graduation?", + "original_text": "What did you do after graduation?", + "start_time": 29.459849618003332, + "end_time": 31.189736239318524, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_5_B.wav", + "silence_duration": 0.43680920865039635, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was planning to attend graduate school, but then I was offered a good job doing marketing, so I changed my", + "original_text": "I was planning to attend graduate school, but then I was offered a good job doing marketing, so I changed my [interrupt] career path and decided to enter the workforce instead of pursuing further education immediately, which turned out to be the right choice for me.", + "start_time": 31.561796169180937, + "end_time": 46.9334061465052, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_6_A.wav", + "silence_duration": 0.3720599298624137, + "is_interrupted": true, + "text_after_interrupt": "career path and decided to enter the workforce instead of pursuing further education immediately, which turned out to be the right choice for me." + }, + { + "speaker": "B", + "text": "Marketing? That sounds like a great opportunity. Are you happy with your decision?", + "original_text": "Marketing? That sounds like a great opportunity. Are you happy with your decision?", + "start_time": 43.92145333618262, + "end_time": 48.96018349491278, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_7_B.wav", + "silence_duration": 0.3796432225348423, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I sure am. But I was going to say I changed my mind about grad school. So, what about you? How did you feel when you graduated?", + "original_text": "I sure am. But I was going to say I changed my mind about grad school. So, what about you? How did you feel when you graduated?", + "start_time": 49.507968376137896, + "end_time": 57.51885272987939, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_8_A.wav", + "silence_duration": 0.5477848812251094, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It was also a proud day for me, but I also felt like a kind of loss that day.", + "original_text": "It was also a proud day for me, but I also felt like a kind of loss that day.", + "start_time": 57.992833155825544, + "end_time": 62.207254924533025, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_9_B.wav", + "silence_duration": 0.4739804259461491, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How could it be?", + "original_text": "How could it be?", + "start_time": 62.65106985418919, + "end_time": 63.74240772266992, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_10_A.wav", + "silence_duration": 0.44381492965616154, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "While seeing others going to work or continue their study, I didn't know what I would do.", + "original_text": "While seeing others going to work or continue their study, I didn't know what I would do.", + "start_time": 64.31659133056972, + "end_time": 68.11305391560373, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--85/temp/line_11_B.wav", + "silence_duration": 0.5741836078998037, + "is_interrupted": false + } + ] + }, + "DialogSum--val--87": { + "original_text": "A: How old are you? \nB: Nine . . . but I'll be ten on May 1st. When is your [interrupt] birthday? I've been curious because we're in the same class and I'd love to know if we share the same birth month or maybe even the same day! \nA: Sorry, I just realized—I'll be ten on April 14th, so I'm a bit older than you! \nB: Oh, you're right! Are you going to have a birthday party? \nA: I might! But you were asking about my birthday earlier—it's on April 14th. What about you? Any party plans?", + "cleaned_text": "A: How old are you? \nB:Nine . . . but I'll be ten on May 1st. When is your birthday? I've been curious because we're in the same class and I'd love to know if we share the same birth month or maybe even the same day!\nA: Sorry, I just realized—I'll be ten on April 14th, so I'm a bit older than you! \nB: Oh, you're right! Are you going to have a birthday party? \nA: I might! But you were asking about my birthday earlier—it's on April 14th. What about you? Any party plans?", + "total_duration": 22.254285714285714, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How old are you?", + "original_text": "How old are you?", + "start_time": 0, + "end_time": 0.9752380952380952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Nine . . . but I'll be ten on May 1st. When is your", + "original_text": "Nine . . . but I'll be ten on May 1st. When is your [interrupt] birthday? I've been curious because we're in the same class and I'd love to know if we share the same birth month or maybe even the same day!", + "start_time": 1.440225771255217, + "end_time": 11.07650695039354, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/temp/line_1_B.wav", + "silence_duration": 0.4649876760171216, + "is_interrupted": true, + "text_after_interrupt": "birthday? I've been curious because we're in the same class and I'd love to know if we share the same birth month or maybe even the same day!" + }, + { + "speaker": "A", + "text": "Sorry, I just realized—I'll be ten on April 14th, so I'm a bit older than you!", + "original_text": "Sorry, I just realized—I'll be ten on April 14th, so I'm a bit older than you!", + "start_time": 4.7955092179672345, + "end_time": 10.635327812071543, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/temp/line_2_A.wav", + "silence_duration": 0.3309613165576649, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, you're right! Are you going to have a birthday party?", + "original_text": "Oh, you're right! Are you going to have a birthday party?", + "start_time": 11.547122013360553, + "end_time": 13.845897523564634, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/temp/line_3_B.wav", + "silence_duration": 0.4706150629670141, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I might! But you were asking about my birthday earlier—it's on April 14th. What about you? Any party plans?", + "original_text": "I might! But you were asking about my birthday earlier—it's on April 14th. What about you? Any party plans?", + "start_time": 14.359524319478698, + "end_time": 22.254308899977566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--87/temp/line_4_A.wav", + "silence_duration": 0.513626795914064, + "is_interrupted": false + } + ] + }, + "DialogSum--val--88": { + "original_text": "A: This party rocks! \nB: You said it. Good beer, good music, and on top of that, there are so many hot girls [interrupt] here tonight, each one more stunning than the last, and the atmosphere is absolutely electric with all these beautiful people mingling around. \nA: Speaking of hot girls, check out that one over there. I think I'm in love! \nB: Well, she's alright, but not really my cup of tea. What about the blond with the red dress? \nA: Oh, that's Janice. She's just new in town. You have a thing for blonds, eh? \nB: Yeah! She could do anything she wants to me! \nA: I bet. Why not go over and talk to her? She's really nice. \nB: I don't think so. I get so nervous talking to girls. I always put my foot in my mouth, scare her off, and end up looking like a real fool. Besides, she is way out of my comfort zone. I just don't have the confidence to approach her. \nA: Out of your league? Come on! Man up! You'll never know until you try. \nB: Okay okay, just let me have another cup of beers to get my head in the game. \nA: Alright. But I think you ought to move soon. \nB: Why? Oh, and what were you going to say about her being out of my league?", + "cleaned_text": "A: This party rocks! \nB:You said it. Good beer, good music, and on top of that, there are so many hot girls here tonight, each one more stunning than the last, and the atmosphere is absolutely electric with all these beautiful people mingling around.\nA: Speaking of hot girls, check out that one over there. I think I'm in love! \nB: Well, she's alright, but not really my cup of tea. What about the blond with the red dress? \nA: Oh, that's Janice. She's just new in town. You have a thing for blonds, eh? \nB: Yeah! She could do anything she wants to me! \nA: I bet. Why not go over and talk to her? She's really nice. \nB: I don't think so. I get so nervous talking to girls. I always put my foot in my mouth, scare her off, and end up looking like a real fool. Besides, she is way out of my comfort zone. I just don't have the confidence to approach her. \nA: Out of your league? Come on! Man up! You'll never know until you try. \nB: Okay okay, just let me have another cup of beers to get my head in the game. \nA: Alright. But I think you ought to move soon. \nB: Why? Oh, and what were you going to say about her being out of my league?", + "total_duration": 60.588208616780044, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "This party rocks!", + "original_text": "This party rocks!", + "start_time": 0, + "end_time": 1.3583673469387756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You said it. Good beer, good music, and on top of that, there are so many hot girls", + "original_text": "You said it. Good beer, good music, and on top of that, there are so many hot girls [interrupt] here tonight, each one more stunning than the last, and the atmosphere is absolutely electric with all these beautiful people mingling around.", + "start_time": 1.711904085871714, + "end_time": 13.205781636892121, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_1_B.wav", + "silence_duration": 0.3535367389329384, + "is_interrupted": true, + "text_after_interrupt": "here tonight, each one more stunning than the last, and the atmosphere is absolutely electric with all these beautiful people mingling around." + }, + { + "speaker": "A", + "text": "Speaking of hot girls, check out that one over there. I think I'm in love!", + "original_text": "Speaking of hot girls, check out that one over there. I think I'm in love!", + "start_time": 6.181745355712984, + "end_time": 10.895396149363776, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_2_A.wav", + "silence_duration": 0.47408244174811687, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, she's alright, but not really my cup of tea. What about the blond with the red dress?", + "original_text": "Well, she's alright, but not really my cup of tea. What about the blond with the red dress?", + "start_time": 13.511119486822098, + "end_time": 18.282820167094208, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_3_B.wav", + "silence_duration": 0.305337849929977, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that's Janice. She's just new in town. You have a thing for blonds, eh?", + "original_text": "Oh, that's Janice. She's just new in town. You have a thing for blonds, eh?", + "start_time": 18.856456371399606, + "end_time": 24.06933618999371, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_4_A.wav", + "silence_duration": 0.5736362043053975, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah! She could do anything she wants to me!", + "original_text": "Yeah! She could do anything she wants to me!", + "start_time": 24.471368003567978, + "end_time": 27.106832856175686, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_5_B.wav", + "silence_duration": 0.40203181357426776, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I bet. Why not go over and talk to her? She's really nice.", + "original_text": "I bet. Why not go over and talk to her? She's really nice.", + "start_time": 27.415832438563644, + "end_time": 31.467714524731445, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_6_A.wav", + "silence_duration": 0.30899958238795966, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't think so. I get so nervous talking to girls. I always put my foot in my mouth, scare her off, and end up looking like a real fool. Besides, she is way out of my comfort zone. I just don't have the confidence to approach her.", + "original_text": "I don't think so. I get so nervous talking to girls. I always put my foot in my mouth, scare her off, and end up looking like a real fool. Besides, she is way out of my comfort zone. I just don't have the confidence to approach her.", + "start_time": 31.83525631893802, + "end_time": 44.07217241871126, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_7_B.wav", + "silence_duration": 0.3675417942065748, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Out of your league? Come on! Man up! You'll never know until you try.", + "original_text": "Out of your league? Come on! Man up! You'll never know until you try.", + "start_time": 44.388981967335575, + "end_time": 48.6846735773129, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_8_A.wav", + "silence_duration": 0.3168095486243146, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Okay okay, just let me have another cup of beers to get my head in the game.", + "original_text": "Okay okay, just let me have another cup of beers to get my head in the game.", + "start_time": 49.2470309805543, + "end_time": 53.206033248127994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_9_B.wav", + "silence_duration": 0.5623574032413976, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Alright. But I think you ought to move soon.", + "original_text": "Alright. But I think you ought to move soon.", + "start_time": 53.65883763992112, + "end_time": 56.213032651258985, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_10_A.wav", + "silence_duration": 0.45280439179312304, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why? Oh, and what were you going to say about her being out of my league?", + "original_text": "Why? Oh, and what were you going to say about her being out of my league?", + "start_time": 56.652469646380084, + "end_time": 60.58825195930525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--88/temp/line_11_B.wav", + "silence_duration": 0.4394369951210955, + "is_interrupted": false + } + ] + }, + "DialogSum--val--90": { + "original_text": "A: Good morning! \nB: Good morning, Gav! Did you sleep well last night? \nA: I slept like a baby. I fell asleep right away last night, didn't wake up once, and didn't have any [interrupt] strange dreams or anything like that, which is quite unusual for me since I typically have very vivid dreams that sometimes border on being unsettling. \nB: Nightmares? That's great news! You look much more relaxed than you did yesterday. \nA: I feel much better, but I'm still worried about something. \nB: What's that? \nA: Well, I have to drive to school for a meeting this morning, and I'm going to end up getting stuck in rush-hour traffic. \nB: That's annoying, but nothing to worry about. \nA: For me, traffic jams are quite stressful, because I'm pretty impatient. How can I prevent myself from getting stressed if I get stuck in a traffic jam? \nB: Just breathe deeply when you feel yourself getting [interrupt] tense or frustrated, and maybe try listening to some calming music or an interesting podcast to distract yourself from the situation while you're waiting. \nA: Upset? Ok, I'll try that. By the way, I didn't mention earlier, I didn't have any nightmares last night, which is rare for me. \nB: That's a good sign. Is there anything else bothering you?", + "cleaned_text": "A: Good morning! \nB: Good morning, Gav! Did you sleep well last night? \nA:I slept like a baby. I fell asleep right away last night, didn't wake up once, and didn't have any strange dreams or anything like that, which is quite unusual for me since I typically have very vivid dreams that sometimes border on being unsettling.\nB: Nightmares? That's great news! You look much more relaxed than you did yesterday. \nA: I feel much better, but I'm still worried about something. \nB: What's that? \nA: Well, I have to drive to school for a meeting this morning, and I'm going to end up getting stuck in rush-hour traffic. \nB: That's annoying, but nothing to worry about. \nA: For me, traffic jams are quite stressful, because I'm pretty impatient. How can I prevent myself from getting stressed if I get stuck in a traffic jam? \nB:Just breathe deeply when you feel yourself getting tense or frustrated, and maybe try listening to some calming music or an interesting podcast to distract yourself from the situation while you're waiting.\nA: Upset? Ok, I'll try that. By the way, I didn't mention earlier, I didn't have any nightmares last night, which is rare for me. \nB: That's a good sign. Is there anything else bothering you?", + "total_duration": 63.535328798185944, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good morning!", + "original_text": "Good morning!", + "start_time": 0, + "end_time": 0.7894784580498866, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good morning, Gav! Did you sleep well last night?", + "original_text": "Good morning, Gav! Did you sleep well last night?", + "start_time": 1.200643934771021, + "end_time": 3.3949296490567353, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_1_B.wav", + "silence_duration": 0.41116547672113446, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I slept like a baby. I fell asleep right away last night, didn't wake up once, and didn't have any", + "original_text": "I slept like a baby. I fell asleep right away last night, didn't wake up once, and didn't have any [interrupt] strange dreams or anything like that, which is quite unusual for me since I typically have very vivid dreams that sometimes border on being unsettling.", + "start_time": 3.9279035868342653, + "end_time": 20.123821954181203, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_2_A.wav", + "silence_duration": 0.5329739377775299, + "is_interrupted": true, + "text_after_interrupt": "strange dreams or anything like that, which is quite unusual for me since I typically have very vivid dreams that sometimes border on being unsettling." + }, + { + "speaker": "B", + "text": "Nightmares? That's great news! You look much more relaxed than you did yesterday.", + "original_text": "Nightmares? That's great news! You look much more relaxed than you did yesterday.", + "start_time": 10.74296027617667, + "end_time": 15.29407138728778, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_3_B.wav", + "silence_duration": 0.5875764912666481, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I feel much better, but I'm still worried about something.", + "original_text": "I feel much better, but I'm still worried about something.", + "start_time": 20.655034482106196, + "end_time": 24.091587770088054, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_4_A.wav", + "silence_duration": 0.5312125279249914, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What's that?", + "original_text": "What's that?", + "start_time": 24.56613101729162, + "end_time": 25.378829429990034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_5_B.wav", + "silence_duration": 0.4745432472035652, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I have to drive to school for a meeting this morning, and I'm going to end up getting stuck in rush-hour traffic.", + "original_text": "Well, I have to drive to school for a meeting this morning, and I'm going to end up getting stuck in rush-hour traffic.", + "start_time": 25.74502939635551, + "end_time": 32.11890694737592, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_6_A.wav", + "silence_duration": 0.36619996636547325, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's annoying, but nothing to worry about.", + "original_text": "That's annoying, but nothing to worry about.", + "start_time": 32.541749431281346, + "end_time": 34.63154534964869, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_7_B.wav", + "silence_duration": 0.4228424839054281, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "For me, traffic jams are quite stressful, because I'm pretty impatient. How can I prevent myself from getting stressed if I get stuck in a traffic jam?", + "original_text": "For me, traffic jams are quite stressful, because I'm pretty impatient. How can I prevent myself from getting stressed if I get stuck in a traffic jam?", + "start_time": 35.011870705073534, + "end_time": 43.986383176728864, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_8_A.wav", + "silence_duration": 0.38032535542484225, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just breathe deeply when you feel yourself getting", + "original_text": "Just breathe deeply when you feel yourself getting [interrupt] tense or frustrated, and maybe try listening to some calming music or an interesting podcast to distract yourself from the situation while you're waiting.", + "start_time": 44.44520152038284, + "end_time": 54.778081338976946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_9_B.wav", + "silence_duration": 0.4588183436539758, + "is_interrupted": true, + "text_after_interrupt": "tense or frustrated, and maybe try listening to some calming music or an interesting podcast to distract yourself from the situation while you're waiting." + }, + { + "speaker": "A", + "text": "Upset? Ok, I'll try that. By the way, I didn't mention earlier, I didn't have any nightmares last night, which is rare for me.", + "original_text": "Upset? Ok, I'll try that. By the way, I didn't mention earlier, I didn't have any nightmares last night, which is rare for me.", + "start_time": 52.04977746310153, + "end_time": 60.838530297568646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_10_A.wav", + "silence_duration": 0.5243225400412841, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a good sign. Is there anything else bothering you?", + "original_text": "That's a good sign. Is there anything else bothering you?", + "start_time": 61.17853833249813, + "end_time": 63.53536372932353, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--90/temp/line_11_B.wav", + "silence_duration": 0.3400080349294858, + "is_interrupted": false + } + ] + }, + "DialogSum--val--91": { + "original_text": "A: I don't think the teacher had a right to say that. The teacher was wrong to have accused her in front of the whole class.\nB: You've got to be joking! It's the teacher's right to say anything she wants, and if she saw Myra cheating, she certainly had the right to [interrupt] call her out on it to maintain discipline in the classroom and set an example for other students who might be tempted to cheat as well.\nA: Sorry to cut in, but do you really think it's okay to embarrass someone publicly, even if they were caught cheating?\nB: Well, I see your point. I agree she had the right to say something, but I feel she should have done it privately.\nA: You're right. If I were the teacher, I wouldn't have done that. By the way, what were you saying about the teacher's right before I interrupted?", + "cleaned_text": "A: I don't think the teacher had a right to say that. The teacher was wrong to have accused her in front of the whole class.\nB:You've got to be joking! It's the teacher's right to say anything she wants, and if she saw Myra cheating, she certainly had the right to call her out on it to maintain discipline in the classroom and set an example for other students who might be tempted to cheat as well.\nA: Sorry to cut in, but do you really think it's okay to embarrass someone publicly, even if they were caught cheating?\nB: Well, I see your point. I agree she had the right to say something, but I feel she should have done it privately.\nA: You're right. If I were the teacher, I wouldn't have done that. By the way, what were you saying about the teacher's right before I interrupted?", + "total_duration": 35.80530612244898, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I don't think the teacher had a right to say that. The teacher was wrong to have accused her in front of the whole class.", + "original_text": "I don't think the teacher had a right to say that. The teacher was wrong to have accused her in front of the whole class.", + "start_time": 0, + "end_time": 6.5712471655328795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You've got to be joking! It's the teacher's right to say anything she wants, and if she saw Myra cheating, she certainly had the right to", + "original_text": "You've got to be joking! It's the teacher's right to say anything she wants, and if she saw Myra cheating, she certainly had the right to [interrupt] call her out on it to maintain discipline in the classroom and set an example for other students who might be tempted to cheat as well.", + "start_time": 7.15127217251659, + "end_time": 20.549186004716134, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/temp/line_1_B.wav", + "silence_duration": 0.5800250069837107, + "is_interrupted": true, + "text_after_interrupt": "call her out on it to maintain discipline in the classroom and set an example for other students who might be tempted to cheat as well." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but do you really think it's okay to embarrass someone publicly, even if they were caught cheating?", + "original_text": "Sorry to cut in, but do you really think it's okay to embarrass someone publicly, even if they were caught cheating?", + "start_time": 14.581657660044936, + "end_time": 21.477984190657182, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/temp/line_2_A.wav", + "silence_duration": 0.35549853989864305, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I see your point. I agree she had the right to say something, but I feel she should have done it privately.", + "original_text": "Well, I see your point. I agree she had the right to say something, but I feel she should have done it privately.", + "start_time": 21.882417420292857, + "end_time": 27.838335787639796, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/temp/line_3_B.wav", + "silence_duration": 0.40443322963567413, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're right. If I were the teacher, I wouldn't have done that. By the way, what were you saying about the teacher's right before I interrupted?", + "original_text": "You're right. If I were the teacher, I wouldn't have done that. By the way, what were you saying about the teacher's right before I interrupted?", + "start_time": 28.165957059109648, + "end_time": 35.80532213847473, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--91/temp/line_4_A.wav", + "silence_duration": 0.3276212714698504, + "is_interrupted": false + } + ] + }, + "DialogSum--val--92": { + "original_text": "A: Listen, Karen, I need your help. I don't know anyone here yet.\nB: I'm glad to help you. What's wrong?\nA: My mother-in-law just went into the hospital in L. A. Hank and I will be flying there tonight.\nB: I'm sorry to hear it. What's wrong with [interrupt] her? Is it something serious? The suddenness of this situation must be really stressful for your family right now.\nA: Doctors aren't sure yet. But the real problem is Suzy. She has a bad cold, and we don't want to take her with us. But we don't know who can stay with her.\nB: You need a babysitter.\nA: Yes, I'd ask Jill, the girl I've had before, but I need someone overnight. Maybe even for two [interrupt] nights, which makes it tricky because we need someone reliable who can handle a sick child and follow all the medication instructions properly.\nB: Nights, right? I was going to suggest that she could stay at my place, but I know you're concerned about her cold.\nA: Exactly. Your own kids would get Suzy's cold. I think it would be better to have a good babysitter here. But I don't know who to ask. I need someone more mature than Jill. It might even be for two or three days.\nB: I know who we can ask. There is a girl I know, Sara Ralston. She is 17, and she will usually take this kind of job. I know her from my church, and I trust her completely.", + "cleaned_text": "A: Listen, Karen, I need your help. I don't know anyone here yet.\nB: I'm glad to help you. What's wrong?\nA: My mother-in-law just went into the hospital in L. A. Hank and I will be flying there tonight.\nB:I'm sorry to hear it. What's wrong with her? Is it something serious? The suddenness of this situation must be really stressful for your family right now.\nA: Doctors aren't sure yet. But the real problem is Suzy. She has a bad cold, and we don't want to take her with us. But we don't know who can stay with her.\nB: You need a babysitter.\nA:Yes, I'd ask Jill, the girl I've had before, but I need someone overnight. Maybe even for two nights, which makes it tricky because we need someone reliable who can handle a sick child and follow all the medication instructions properly.\nB: Nights, right? I was going to suggest that she could stay at my place, but I know you're concerned about her cold.\nA: Exactly. Your own kids would get Suzy's cold. I think it would be better to have a good babysitter here. But I don't know who to ask. I need someone more mature than Jill. It might even be for two or three days.\nB: I know who we can ask. There is a girl I know, Sara Ralston. She is 17, and she will usually take this kind of job. I know her from my church, and I trust her completely.", + "total_duration": 69.25038548752835, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Listen, Karen, I need your help. I don't know anyone here yet.", + "original_text": "Listen, Karen, I need your help. I don't know anyone here yet.", + "start_time": 0, + "end_time": 4.098321995464852, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm glad to help you. What's wrong?", + "original_text": "I'm glad to help you. What's wrong?", + "start_time": 4.635797941132024, + "end_time": 6.4353444263927955, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_1_B.wav", + "silence_duration": 0.5374759456671718, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "My mother-in-law just went into the hospital in L. A. Hank and I will be flying there tonight.", + "original_text": "My mother-in-law just went into the hospital in L. A. Hank and I will be flying there tonight.", + "start_time": 6.7934287514450595, + "end_time": 12.052748479336216, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_2_A.wav", + "silence_duration": 0.3580843250522644, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm sorry to hear it. What's wrong with", + "original_text": "I'm sorry to hear it. What's wrong with [interrupt] her? Is it something serious? The suddenness of this situation must be really stressful for your family right now.", + "start_time": 12.50602131210579, + "end_time": 20.505295688523024, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_3_B.wav", + "silence_duration": 0.45327283276957353, + "is_interrupted": true, + "text_after_interrupt": "her? Is it something serious? The suddenness of this situation must be really stressful for your family right now." + }, + { + "speaker": "A", + "text": "Doctors aren't sure yet. But the real problem is Suzy. She has a bad cold, and we don't want to take her with us. But we don't know who can stay with her.", + "original_text": "Doctors aren't sure yet. But the real problem is Suzy. She has a bad cold, and we don't want to take her with us. But we don't know who can stay with her.", + "start_time": 14.560987298500349, + "end_time": 24.11599863636883, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_4_A.wav", + "silence_duration": 0.4400349027045317, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You need a babysitter.", + "original_text": "You need a babysitter.", + "start_time": 24.44686449755456, + "end_time": 25.944551572384494, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_5_B.wav", + "silence_duration": 0.3308658611857301, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I'd ask Jill, the girl I've had before, but I need someone overnight. Maybe even for two", + "original_text": "Yes, I'd ask Jill, the girl I've had before, but I need someone overnight. Maybe even for two [interrupt] nights, which makes it tricky because we need someone reliable who can handle a sick child and follow all the medication instructions properly.", + "start_time": 26.49270112327391, + "end_time": 40.78458320944171, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_6_A.wav", + "silence_duration": 0.5481495508894174, + "is_interrupted": true, + "text_after_interrupt": "nights, which makes it tricky because we need someone reliable who can handle a sick child and follow all the medication instructions properly." + }, + { + "speaker": "B", + "text": "Nights, right? I was going to suggest that she could stay at my place, but I know you're concerned about her cold.", + "original_text": "Nights, right? I was going to suggest that she could stay at my place, but I know you're concerned about her cold.", + "start_time": 39.458046326318545, + "end_time": 45.66938419479927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_7_B.wav", + "silence_duration": 0.45459232385572357, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Exactly. Your own kids would get Suzy's cold. I think it would be better to have a good babysitter here. But I don't know who to ask. I need someone more mature than Jill. It might even be for two or three days.", + "original_text": "Exactly. Your own kids would get Suzy's cold. I think it would be better to have a good babysitter here. But I don't know who to ask. I need someone more mature than Jill. It might even be for two or three days.", + "start_time": 46.1959170281782, + "end_time": 59.54739095108069, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_8_A.wav", + "silence_duration": 0.5265328333789299, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know who we can ask. There is a girl I know, Sara Ralston. She is 17, and she will usually take this kind of job. I know her from my church, and I trust her completely.", + "original_text": "I know who we can ask. There is a girl I know, Sara Ralston. She is 17, and she will usually take this kind of job. I know her from my church, and I trust her completely.", + "start_time": 60.1133723316644, + "end_time": 69.25042448585941, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--92/temp/line_9_B.wav", + "silence_duration": 0.5659813805837051, + "is_interrupted": false + } + ] + }, + "DialogSum--val--93": { + "original_text": "A: Anna just emailed to say that the managers meeting is put off till next Monday. Will you have everything ready by then, Sabrina? Hey Sabrina, what's [interrupt] on your mind? You seem a bit distracted and I noticed you've been staring at your phone all morning. Is everything okay?\nB: Sorry, Jason, I just can't focus right now. I'm so worried. I haven't heard from my sister for 2 weeks.\nA: Oh, I see. How often do you usually call each other?\nB: Normally at least once a week. But she's now a volunteer teacher in a mountain village in Africa. I can only write her.\nA: The mail can be really slow sometimes. I'm sure you'll hear from her soon.\nB: I hope so.\nA: You know the saying 'no news is good news'. If something were wrong, someone would have [interrupt] reached out to inform you by now through official channels or at least through the volunteer organization she's working with.\nB: Wait, Jason, I just realized—about the meeting next Monday, do you think we'll need to prepare anything extra since it's been delayed?\nA: Oh, right. I was going to mention that. We might need to review the budget allocations again, but don't worry about it now. And as I was saying, if something were wrong, someone would have called you.\nB: Maybe you're right. Thanks, Jason.", + "cleaned_text": "A:Anna just emailed to say that the managers meeting is put off till next Monday. Will you have everything ready by then, Sabrina? Hey Sabrina, what's on your mind? You seem a bit distracted and I noticed you've been staring at your phone all morning. Is everything okay?\nB: Sorry, Jason, I just can't focus right now. I'm so worried. I haven't heard from my sister for 2 weeks.\nA: Oh, I see. How often do you usually call each other?\nB: Normally at least once a week. But she's now a volunteer teacher in a mountain village in Africa. I can only write her.\nA: The mail can be really slow sometimes. I'm sure you'll hear from her soon.\nB: I hope so.\nA:You know the saying 'no news is good news'. If something were wrong, someone would have reached out to inform you by now through official channels or at least through the volunteer organization she's working with.\nB: Wait, Jason, I just realized—about the meeting next Monday, do you think we'll need to prepare anything extra since it's been delayed?\nA: Oh, right. I was going to mention that. We might need to review the budget allocations again, but don't worry about it now. And as I was saying, if something were wrong, someone would have called you.\nB: Maybe you're right. Thanks, Jason.", + "total_duration": 64.46934240362812, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Anna just emailed to say that the managers meeting is put off till next Monday. Will you have everything ready by then, Sabrina? Hey Sabrina, what's", + "original_text": "Anna just emailed to say that the managers meeting is put off till next Monday. Will you have everything ready by then, Sabrina? Hey Sabrina, what's [interrupt] on your mind? You seem a bit distracted and I noticed you've been staring at your phone all morning. Is everything okay?", + "start_time": 0, + "end_time": 16.114648526077097, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "on your mind? You seem a bit distracted and I noticed you've been staring at your phone all morning. Is everything okay?" + }, + { + "speaker": "B", + "text": "Sorry, Jason, I just can't focus right now. I'm so worried. I haven't heard from my sister for 2 weeks.", + "original_text": "Sorry, Jason, I just can't focus right now. I'm so worried. I haven't heard from my sister for 2 weeks.", + "start_time": 9.775600907029478, + "end_time": 15.685079365079364, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_1_B.wav", + "silence_duration": 0.4374258719899188, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. How often do you usually call each other?", + "original_text": "Oh, I see. How often do you usually call each other?", + "start_time": 16.6653126846416, + "end_time": 20.60109499756677, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_2_A.wav", + "silence_duration": 0.5506641585645028, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Normally at least once a week. But she's now a volunteer teacher in a mountain village in Africa. I can only write her.", + "original_text": "Normally at least once a week. But she's now a volunteer teacher in a mountain village in Africa. I can only write her.", + "start_time": 20.985405332547554, + "end_time": 27.47538265681059, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_3_B.wav", + "silence_duration": 0.3843103349807853, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The mail can be really slow sometimes. I'm sure you'll hear from her soon.", + "original_text": "The mail can be really slow sometimes. I'm sure you'll hear from her soon.", + "start_time": 27.854026556486897, + "end_time": 31.824638801384857, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_4_A.wav", + "silence_duration": 0.3786438996763049, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I hope so.", + "original_text": "I hope so.", + "start_time": 32.300654393793565, + "end_time": 33.09013285184345, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_5_B.wav", + "silence_duration": 0.47601559240870583, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You know the saying 'no news is good news'. If something were wrong, someone would have", + "original_text": "You know the saying 'no news is good news'. If something were wrong, someone would have [interrupt] reached out to inform you by now through official channels or at least through the volunteer organization she's working with.", + "start_time": 33.65154847506921, + "end_time": 45.38923554989914, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_6_A.wav", + "silence_duration": 0.5614156232257639, + "is_interrupted": true, + "text_after_interrupt": "reached out to inform you by now through official channels or at least through the volunteer organization she's working with." + }, + { + "speaker": "B", + "text": "Wait, Jason, I just realized—about the meeting next Monday, do you think we'll need to prepare anything extra since it's been delayed?", + "original_text": "Wait, Jason, I just realized—about the meeting next Monday, do you think we'll need to prepare anything extra since it's been delayed?", + "start_time": 45.215030081743805, + "end_time": 51.58890763276421, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_7_B.wav", + "silence_duration": 0.3572964226216543, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right. I was going to mention that. We might need to review the budget allocations again, but don't worry about it now. And as I was saying, if something were wrong, someone would have called you.", + "original_text": "Oh, right. I was going to mention that. We might need to review the budget allocations again, but don't worry about it now. And as I was saying, if something were wrong, someone would have called you.", + "start_time": 51.980022129756335, + "end_time": 62.42900172159307, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_8_A.wav", + "silence_duration": 0.3911144969921265, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Maybe you're right. Thanks, Jason.", + "original_text": "Maybe you're right. Thanks, Jason.", + "start_time": 62.971697110112686, + "end_time": 64.46938418494261, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--93/temp/line_9_B.wav", + "silence_duration": 0.5426953885196197, + "is_interrupted": false + } + ] + }, + "DialogSum--val--94": { + "original_text": "A: Hi, there. I think I'm coming down with something. I need some medicine to get me through the next few days.\nB: Wow, you look terrible. What's going on?\nA: Well, my throat hurts. My nose has been running and I have a bad cough. It could just be a cold, but I don't know for [interrupt] sure if it's something more serious like the flu or just a seasonal cold because the symptoms seem to be getting worse by the hour and I'm starting to feel really fatigued too.\nB: Have you checked your temperature? It might help to know if you have a fever.\nA: I haven't checked it yet. But I was saying, I don't know for sure if it's just a cold or something more serious.\nB: You should take some cold medicine and get some rest. You don't look well.\nA: I have a very important job and I can't miss any work. So, give me something strong.\nB: All right. But if you have the flu, only rest will help. Oh, by the way, did you mention whether you've had a fever? It could be important.\nA: No, I haven't checked my temperature yet. I'll do that first, but I still need something to help me push through the next few days.\nB: If you're still sick in 3 days, you should go see a doctor.", + "cleaned_text": "A: Hi, there. I think I'm coming down with something. I need some medicine to get me through the next few days.\nB: Wow, you look terrible. What's going on?\nA:Well, my throat hurts. My nose has been running and I have a bad cough. It could just be a cold, but I don't know for sure if it's something more serious like the flu or just a seasonal cold because the symptoms seem to be getting worse by the hour and I'm starting to feel really fatigued too.\nB: Have you checked your temperature? It might help to know if you have a fever.\nA: I haven't checked it yet. But I was saying, I don't know for sure if it's just a cold or something more serious.\nB: You should take some cold medicine and get some rest. You don't look well.\nA: I have a very important job and I can't miss any work. So, give me something strong.\nB: All right. But if you have the flu, only rest will help. Oh, by the way, did you mention whether you've had a fever? It could be important.\nA: No, I haven't checked my temperature yet. I'll do that first, but I still need something to help me push through the next few days.\nB: If you're still sick in 3 days, you should go see a doctor.", + "total_duration": 63.14027210884354, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, there. I think I'm coming down with something. I need some medicine to get me through the next few days.", + "original_text": "Hi, there. I think I'm coming down with something. I need some medicine to get me through the next few days.", + "start_time": 0, + "end_time": 6.339047619047619, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wow, you look terrible. What's going on?", + "original_text": "Wow, you look terrible. What's going on?", + "start_time": 6.673340338410183, + "end_time": 8.972115848614266, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_1_B.wav", + "silence_duration": 0.3342927193625639, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, my throat hurts. My nose has been running and I have a bad cough. It could just be a cold, but I don't know for", + "original_text": "Well, my throat hurts. My nose has been running and I have a bad cough. It could just be a cold, but I don't know for [interrupt] sure if it's something more serious like the flu or just a seasonal cold because the symptoms seem to be getting worse by the hour and I'm starting to feel really fatigued too.", + "start_time": 9.562943389593618, + "end_time": 27.33781867304033, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_2_A.wav", + "silence_duration": 0.5908275409793535, + "is_interrupted": true, + "text_after_interrupt": "sure if it's something more serious like the flu or just a seasonal cold because the symptoms seem to be getting worse by the hour and I'm starting to feel really fatigued too." + }, + { + "speaker": "B", + "text": "Have you checked your temperature? It might help to know if you have a fever.", + "original_text": "Have you checked your temperature? It might help to know if you have a fever.", + "start_time": 17.31840824220133, + "end_time": 21.09165087258682, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_3_B.wav", + "silence_duration": 0.49053175253910725, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I haven't checked it yet. But I was saying, I don't know for sure if it's just a cold or something more serious.", + "original_text": "I haven't checked it yet. But I was saying, I don't know for sure if it's just a cold or something more serious.", + "start_time": 27.859981776510363, + "end_time": 34.733088352474084, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_4_A.wav", + "silence_duration": 0.5221631034700305, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You should take some cold medicine and get some rest. You don't look well.", + "original_text": "You should take some cold medicine and get some rest. You don't look well.", + "start_time": 35.23828503244724, + "end_time": 39.116017458751095, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_5_B.wav", + "silence_duration": 0.5051966799731556, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I have a very important job and I can't miss any work. So, give me something strong.", + "original_text": "I have a very important job and I can't miss any work. So, give me something strong.", + "start_time": 39.46954599425522, + "end_time": 44.6592058582008, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_6_A.wav", + "silence_duration": 0.3535285355041274, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right. But if you have the flu, only rest will help. Oh, by the way, did you mention whether you've had a fever? It could be important.", + "original_text": "All right. But if you have the flu, only rest will help. Oh, by the way, did you mention whether you've had a fever? It could be important.", + "start_time": 45.07000606439359, + "end_time": 52.163702209518306, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_7_B.wav", + "silence_duration": 0.41080020619278595, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, I haven't checked my temperature yet. I'll do that first, but I still need something to help me push through the next few days.", + "original_text": "No, I haven't checked my temperature yet. I'll do that first, but I still need something to help me push through the next few days.", + "start_time": 52.5428621319495, + "end_time": 59.857147846235215, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_8_A.wav", + "silence_duration": 0.3791599224311954, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If you're still sick in 3 days, you should go see a doctor.", + "original_text": "If you're still sick in 3 days, you should go see a doctor.", + "start_time": 60.24942455348362, + "end_time": 63.14030890722512, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--94/temp/line_9_B.wav", + "silence_duration": 0.3922767072484084, + "is_interrupted": false + } + ] + }, + "DialogSum--val--95": { + "original_text": "A: There is only 20 minutes left. I've got an appointment. I'm meeting a friend in the City of Westminster at 9:00 AM. I hope not to [interrupt] be late, but I'm worried about the traffic especially since there's road construction happening along our usual route this morning. \nB: Sorry to interrupt, but do you think 20 minutes is enough time to get there? The traffic might be heavy at this hour. \nA: You're right. I'm a bit worried about that, too. But I was saying I hope not to miss it. \nB: Well, I'm going there, too. I can give you a lift if you like. \nA: Could you really? That would be kind. \nB: Where are you meeting your friend? \nA: Near the park. But if you can drop me at an underground station that will be [interrupt] just fine as I can take the tube from there and it should only take about five minutes to reach my destination once I'm on the train. \nB: Actually, the park's not far out of my way. I'll take you there. \nA: That's perfect! Thanks so much.", + "cleaned_text": "A:There is only 20 minutes left. I've got an appointment. I'm meeting a friend in the City of Westminster at 9:00 AM. I hope not to be late, but I'm worried about the traffic especially since there's road construction happening along our usual route this morning.\nB: Sorry to interrupt, but do you think 20 minutes is enough time to get there? The traffic might be heavy at this hour. \nA: You're right. I'm a bit worried about that, too. But I was saying I hope not to miss it. \nB: Well, I'm going there, too. I can give you a lift if you like. \nA: Could you really? That would be kind. \nB: Where are you meeting your friend? \nA:Near the park. But if you can drop me at an underground station that will be just fine as I can take the tube from there and it should only take about five minutes to reach my destination once I'm on the train.\nB: Actually, the park's not far out of my way. I'll take you there. \nA: That's perfect! Thanks so much.", + "total_duration": 48.346439909297054, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "There is only 20 minutes left. I've got an appointment. I'm meeting a friend in the City of Westminster at 9:00 AM. I hope not to", + "original_text": "There is only 20 minutes left. I've got an appointment. I'm meeting a friend in the City of Westminster at 9:00 AM. I hope not to [interrupt] be late, but I'm worried about the traffic especially since there's road construction happening along our usual route this morning.", + "start_time": 0, + "end_time": 16.01015873015873, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "be late, but I'm worried about the traffic especially since there's road construction happening along our usual route this morning." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but do you think 20 minutes is enough time to get there? The traffic might be heavy at this hour.", + "original_text": "Sorry to interrupt, but do you think 20 minutes is enough time to get there? The traffic might be heavy at this hour.", + "start_time": 9.450521541950113, + "end_time": 15.685079365079364, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_1_B.wav", + "silence_duration": 0.33291740476364656, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're right. I'm a bit worried about that, too. But I was saying I hope not to miss it.", + "original_text": "You're right. I'm a bit worried about that, too. But I was saying I hope not to miss it.", + "start_time": 16.41650251072902, + "end_time": 21.768702057214284, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_2_A.wav", + "silence_duration": 0.4063437805702921, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I'm going there, too. I can give you a lift if you like.", + "original_text": "Well, I'm going there, too. I can give you a lift if you like.", + "start_time": 22.197822201327966, + "end_time": 25.57632560268851, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_3_B.wav", + "silence_duration": 0.4291201441136816, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Could you really? That would be kind.", + "original_text": "Could you really? That would be kind.", + "start_time": 25.97376339202305, + "end_time": 28.38863867546976, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_4_A.wav", + "silence_duration": 0.3974377893345403, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Where are you meeting your friend?", + "original_text": "Where are you meeting your friend?", + "start_time": 28.714651678813816, + "end_time": 30.02657911645554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_5_B.wav", + "silence_duration": 0.3260130033440569, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Near the park. But if you can drop me at an underground station that will be", + "original_text": "Near the park. But if you can drop me at an underground station that will be [interrupt] just fine as I can take the tube from there and it should only take about five minutes to reach my destination once I'm on the train.", + "start_time": 30.370757422135362, + "end_time": 42.526403680638765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_6_A.wav", + "silence_duration": 0.3441783056798206, + "is_interrupted": true, + "text_after_interrupt": "just fine as I can take the tube from there and it should only take about five minutes to reach my destination once I'm on the train." + }, + { + "speaker": "B", + "text": "Actually, the park's not far out of my way. I'll take you there.", + "original_text": "Actually, the park's not far out of my way. I'll take you there.", + "start_time": 41.98634054783336, + "end_time": 45.20230426665422, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_7_B.wav", + "silence_duration": 0.43481818659479887, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's perfect! Thanks so much.", + "original_text": "That's perfect! Thanks so much.", + "start_time": 45.60651456215795, + "end_time": 48.34646921068403, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--95/temp/line_8_A.wav", + "silence_duration": 0.4042102955037335, + "is_interrupted": false + } + ] + }, + "DialogSum--val--96": { + "original_text": "A: How was your summer trip? \nB: It was great. My friend and I travelled throughout India. \nA: Sounds hot! How did you get along without studying the local language? \nB: Most people there speak English. But there were some remote places in the mountains where we had to learn a few words to communicate. Usually it was easy. One time, though, it got a little awkward. I was asking a baker for some bread and I said 'I want money' instead of 'I want bread'. The words for money and bread were so similar that I got them [interrupt] mixed up, and I didn't realize my mistake until I saw the baker's confused expression, which quickly turned into amusement once he understood what I actually meant to say. \nA: Wait, you actually said 'I want money' to the baker? That must have been quite a shock for him! \nB: Yeah, he looked a little scared but my friend quickly cleared up the confusion. We ended up becoming friends with the guy and he introduced us to more young people. Whenever we told the story of our meeting, it would make everyone laugh. \nA: That sounds like a great experience! But I'm curious, you mentioned earlier that the words for money and bread were similar. What were they?", + "cleaned_text": "A: How was your summer trip? \nB: It was great. My friend and I travelled throughout India. \nA: Sounds hot! How did you get along without studying the local language? \nB:Most people there speak English. But there were some remote places in the mountains where we had to learn a few words to communicate. Usually it was easy. One time, though, it got a little awkward. I was asking a baker for some bread and I said 'I want money' instead of 'I want bread'. The words for money and bread were so similar that I got them mixed up, and I didn't realize my mistake until I saw the baker's confused expression, which quickly turned into amusement once he understood what I actually meant to say.\nA: Wait, you actually said 'I want money' to the baker? That must have been quite a shock for him! \nB: Yeah, he looked a little scared but my friend quickly cleared up the confusion. We ended up becoming friends with the guy and he introduced us to more young people. Whenever we told the story of our meeting, it would make everyone laugh. \nA: That sounds like a great experience! But I'm curious, you mentioned earlier that the words for money and bread were similar. What were they?", + "total_duration": 57.1114739229025, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How was your summer trip?", + "original_text": "How was your summer trip?", + "start_time": 0, + "end_time": 1.3931972789115645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It was great. My friend and I travelled throughout India.", + "original_text": "It was great. My friend and I travelled throughout India.", + "start_time": 1.7479245440169195, + "end_time": 4.603978965785627, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/temp/line_1_B.wav", + "silence_duration": 0.354727265105355, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sounds hot! How did you get along without studying the local language?", + "original_text": "Sounds hot! How did you get along without studying the local language?", + "start_time": 5.140657792946105, + "end_time": 9.331859607005061, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/temp/line_2_A.wav", + "silence_duration": 0.5366788271604783, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Most people there speak English. But there were some remote places in the mountains where we had to learn a few words to communicate. Usually it was easy. One time, though, it got a little awkward. I was asking a baker for some bread and I said 'I want money' instead of 'I want bread'. The words for money and bread were so similar that I got them", + "original_text": "Most people there speak English. But there were some remote places in the mountains where we had to learn a few words to communicate. Usually it was easy. One time, though, it got a little awkward. I was asking a baker for some bread and I said 'I want money' instead of 'I want bread'. The words for money and bread were so similar that I got them [interrupt] mixed up, and I didn't realize my mistake until I saw the baker's confused expression, which quickly turned into amusement once he understood what I actually meant to say.", + "start_time": 9.832582633905883, + "end_time": 36.338160865198404, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/temp/line_3_B.wav", + "silence_duration": 0.5007230269008214, + "is_interrupted": true, + "text_after_interrupt": "mixed up, and I didn't realize my mistake until I saw the baker's confused expression, which quickly turned into amusement once he understood what I actually meant to say." + }, + { + "speaker": "A", + "text": "Wait, you actually said 'I want money' to the baker? That must have been quite a shock for him!", + "original_text": "Wait, you actually said 'I want money' to the baker? That must have been quite a shock for him!", + "start_time": 26.667049754087287, + "end_time": 33.06414725975622, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/temp/line_4_A.wav", + "silence_duration": 0.559599064369005, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, he looked a little scared but my friend quickly cleared up the confusion. We ended up becoming friends with the guy and he introduced us to more young people. Whenever we told the story of our meeting, it would make everyone laugh.", + "original_text": "Yeah, he looked a little scared but my friend quickly cleared up the confusion. We ended up becoming friends with the guy and he introduced us to more young people. Whenever we told the story of our meeting, it would make everyone laugh.", + "start_time": 36.7532657352129, + "end_time": 48.32841312750315, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/temp/line_5_B.wav", + "silence_duration": 0.41510487001449536, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds like a great experience! But I'm curious, you mentioned earlier that the words for money and bread were similar. What were they?", + "original_text": "That sounds like a great experience! But I'm curious, you mentioned earlier that the words for money and bread were similar. What were they?", + "start_time": 48.63620942376435, + "end_time": 57.11149287047637, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--96/temp/line_6_A.wav", + "silence_duration": 0.30779629626120175, + "is_interrupted": false + } + ] + }, + "DialogSum--val--97": { + "original_text": "A: So, now, have you been asked for an interview, yet? \nB: Yes, I already have an interview schedule with the manager on [interrupt] Wednesday at 10 AM in their main office downtown, and I've been preparing extensively by researching the company's recent projects and potential interview questions. \nA: Wait, did you say with the manager? That's great! Do you know what kind of questions they might ask? \nB: I'm not sure yet, but I was about to say the interview is on Wednesday. \nA: Oh, that's the day after tomorrow, congratulations. Where will the interview be held? \nB: In a building which is very close to where you work, we can meet up then, and I'll tell you about it over some coffee.", + "cleaned_text": "A: So, now, have you been asked for an interview, yet? \nB:Yes, I already have an interview schedule with the manager on Wednesday at 10 AM in their main office downtown, and I've been preparing extensively by researching the company's recent projects and potential interview questions.\nA: Wait, did you say with the manager? That's great! Do you know what kind of questions they might ask? \nB: I'm not sure yet, but I was about to say the interview is on Wednesday. \nA: Oh, that's the day after tomorrow, congratulations. Where will the interview be held? \nB: In a building which is very close to where you work, we can meet up then, and I'll tell you about it over some coffee.", + "total_duration": 29.67795918367347, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So, now, have you been asked for an interview, yet?", + "original_text": "So, now, have you been asked for an interview, yet?", + "start_time": 0, + "end_time": 3.030204081632653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I already have an interview schedule with the manager on", + "original_text": "Yes, I already have an interview schedule with the manager on [interrupt] Wednesday at 10 AM in their main office downtown, and I've been preparing extensively by researching the company's recent projects and potential interview questions.", + "start_time": 3.380006756161224, + "end_time": 14.513975010129478, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/temp/line_1_B.wav", + "silence_duration": 0.34980267452857133, + "is_interrupted": true, + "text_after_interrupt": "Wednesday at 10 AM in their main office downtown, and I've been preparing extensively by researching the company's recent projects and potential interview questions." + }, + { + "speaker": "A", + "text": "Wait, did you say with the manager? That's great! Do you know what kind of questions they might ask?", + "original_text": "Wait, did you say with the manager? That's great! Do you know what kind of questions they might ask?", + "start_time": 6.375380905821088, + "end_time": 12.42417909176213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/temp/line_2_A.wav", + "silence_duration": 0.40379886880177784, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm not sure yet, but I was about to say the interview is on Wednesday.", + "original_text": "I'm not sure yet, but I was about to say the interview is on Wednesday.", + "start_time": 14.899270311006381, + "end_time": 19.05564219309255, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/temp/line_3_B.wav", + "silence_duration": 0.38529530087690234, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that's the day after tomorrow, congratulations. Where will the interview be held?", + "original_text": "Oh, that's the day after tomorrow, congratulations. Where will the interview be held?", + "start_time": 19.41376612612841, + "end_time": 24.208686761049044, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/temp/line_4_A.wav", + "silence_duration": 0.3581239330358633, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "In a building which is very close to where you work, we can meet up then, and I'll tell you about it over some coffee.", + "original_text": "In a building which is very close to where you work, we can meet up then, and I'll tell you about it over some coffee.", + "start_time": 24.604405587104, + "end_time": 29.67796567780695, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--97/temp/line_5_B.wav", + "silence_duration": 0.39571882605495623, + "is_interrupted": false + } + ] + }, + "DialogSum--val--98": { + "original_text": "A: I've been wondering how to start running. I want to run a marathon and I know you're a good runner. \nB: Well, you need to start out slowly. See if you can run a mile without stopping and then start increasing your distance [interrupt] gradually over several weeks while paying close attention to your body's signals to avoid overtraining or potential injuries. \nA: OK, do you think I should run on a running machine at the gym or start outside to get used to different terrains? \nB: Sorry to cut in, but before we get into that, have you thought about what your current fitness level is? It might help in deciding where to start. \nA: That's a good point. I think I'm in decent shape but haven't done much running lately. So, should I start on a treadmill or outside? \nB: Well, it depends on what you like. Running inside is nice because you can stay at a steady speed. But outside is nice too, because you're surrounded by nature and fresh air.", + "cleaned_text": "A: I've been wondering how to start running. I want to run a marathon and I know you're a good runner. \nB:Well, you need to start out slowly. See if you can run a mile without stopping and then start increasing your distance gradually over several weeks while paying close attention to your body's signals to avoid overtraining or potential injuries.\nA: OK, do you think I should run on a running machine at the gym or start outside to get used to different terrains? \nB: Sorry to cut in, but before we get into that, have you thought about what your current fitness level is? It might help in deciding where to start. \nA: That's a good point. I think I'm in decent shape but haven't done much running lately. So, should I start on a treadmill or outside? \nB: Well, it depends on what you like. Running inside is nice because you can stay at a steady speed. But outside is nice too, because you're surrounded by nature and fresh air.", + "total_duration": 44.75238095238095, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I've been wondering how to start running. I want to run a marathon and I know you're a good runner.", + "original_text": "I've been wondering how to start running. I want to run a marathon and I know you're a good runner.", + "start_time": 0, + "end_time": 5.712108843537415, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, you need to start out slowly. See if you can run a mile without stopping and then start increasing your distance", + "original_text": "Well, you need to start out slowly. See if you can run a mile without stopping and then start increasing your distance [interrupt] gradually over several weeks while paying close attention to your body's signals to avoid overtraining or potential injuries.", + "start_time": 6.255376789683546, + "end_time": 18.828982231860415, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/temp/line_1_B.wav", + "silence_duration": 0.5432679461461315, + "is_interrupted": true, + "text_after_interrupt": "gradually over several weeks while paying close attention to your body's signals to avoid overtraining or potential injuries." + }, + { + "speaker": "A", + "text": "OK, do you think I should run on a running machine at the gym or start outside to get used to different terrains?", + "original_text": "OK, do you think I should run on a running machine at the gym or start outside to get used to different terrains?", + "start_time": 12.431884726191484, + "end_time": 19.40948109807357, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/temp/line_2_A.wav", + "silence_duration": 0.4278000050885971, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry to cut in, but before we get into that, have you thought about what your current fitness level is? It might help in deciding where to start.", + "original_text": "Sorry to cut in, but before we get into that, have you thought about what your current fitness level is? It might help in deciding where to start.", + "start_time": 19.922073421507893, + "end_time": 27.155089294523766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/temp/line_3_B.wav", + "silence_duration": 0.5125923234343216, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a good point. I think I'm in decent shape but haven't done much running lately. So, should I start on a treadmill or outside?", + "original_text": "That's a good point. I think I'm in decent shape but haven't done much running lately. So, should I start on a treadmill or outside?", + "start_time": 27.554629235207802, + "end_time": 34.61349544835973, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/temp/line_4_A.wav", + "silence_duration": 0.39953994068403687, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, it depends on what you like. Running inside is nice because you can stay at a steady speed. But outside is nice too, because you're surrounded by nature and fresh air.", + "original_text": "Well, it depends on what you like. Running inside is nice because you can stay at a steady speed. But outside is nice too, because you're surrounded by nature and fresh air.", + "start_time": 34.91874013310915, + "end_time": 44.752390926759944, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--98/temp/line_5_B.wav", + "silence_duration": 0.30524468474941985, + "is_interrupted": false + } + ] + }, + "DialogSum--val--99": { + "original_text": "A: So Izek, is there a Christian church nearby? \nB: There is one, just 2 blocks from here, on the west end of the Ivy Street. So are you a Christian if you don't mind me [interrupt] asking? I've noticed you've been asking a lot of questions about religious institutions lately and was curious about your personal beliefs. \nA: Oh, no, it's not that. I'm actually working on an essay about the influence of Christian religion on western cultures. So I just want to do some research personally. \nB: I see. Actually, one of the priests in that church is my cousin. I can arrange a meeting between you two if you [interrupt] are interested in getting some more in-depth insights for your essay. He specializes in historical theology and could provide valuable perspectives on your topic. \nA: Wait, did you mention where exactly the church is? I might need to visit it first before meeting your cousin. \nB: Yes, it's on the west end of Ivy Street, just 2 blocks from here. And about the meeting, just let me know when you're ready, and I'll set it up. \nA: Perfect. Thanks again, Izek.", + "cleaned_text": "A: So Izek, is there a Christian church nearby? \nB:There is one, just 2 blocks from here, on the west end of the Ivy Street. So are you a Christian if you don't mind me asking? I've noticed you've been asking a lot of questions about religious institutions lately and was curious about your personal beliefs.\nA: Oh, no, it's not that. I'm actually working on an essay about the influence of Christian religion on western cultures. So I just want to do some research personally. \nB:I see. Actually, one of the priests in that church is my cousin. I can arrange a meeting between you two if you are interested in getting some more in-depth insights for your essay. He specializes in historical theology and could provide valuable perspectives on your topic.\nA: Wait, did you mention where exactly the church is? I might need to visit it first before meeting your cousin. \nB: Yes, it's on the west end of Ivy Street, just 2 blocks from here. And about the meeting, just let me know when you're ready, and I'll set it up. \nA: Perfect. Thanks again, Izek.", + "total_duration": 52.95047619047619, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So Izek, is there a Christian church nearby?", + "original_text": "So Izek, is there a Christian church nearby?", + "start_time": 0, + "end_time": 2.7980045351473923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There is one, just 2 blocks from here, on the west end of the Ivy Street. So are you a Christian if you don't mind me", + "original_text": "There is one, just 2 blocks from here, on the west end of the Ivy Street. So are you a Christian if you don't mind me [interrupt] asking? I've noticed you've been asking a lot of questions about religious institutions lately and was curious about your personal beliefs.", + "start_time": 3.161294611525229, + "end_time": 16.15285923737557, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/temp/line_1_B.wav", + "silence_duration": 0.3632900763778365, + "is_interrupted": true, + "text_after_interrupt": "asking? I've noticed you've been asking a lot of questions about religious institutions lately and was curious about your personal beliefs." + }, + { + "speaker": "A", + "text": "Oh, no, it's not that. I'm actually working on an essay about the influence of Christian religion on western cultures. So I just want to do some research personally.", + "original_text": "Oh, no, it's not that. I'm actually working on an essay about the influence of Christian religion on western cultures. So I just want to do some research personally.", + "start_time": 8.594763999280332, + "end_time": 19.40365288816922, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/temp/line_2_A.wav", + "silence_duration": 0.5870881064454092, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see. Actually, one of the priests in that church is my cousin. I can arrange a meeting between you two if you", + "original_text": "I see. Actually, one of the priests in that church is my cousin. I can arrange a meeting between you two if you [interrupt] are interested in getting some more in-depth insights for your essay. He specializes in historical theology and could provide valuable perspectives on your topic.", + "start_time": 19.828353096319432, + "end_time": 34.25955491037839, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/temp/line_3_B.wav", + "silence_duration": 0.4247002081502114, + "is_interrupted": true, + "text_after_interrupt": "are interested in getting some more in-depth insights for your essay. He specializes in historical theology and could provide valuable perspectives on your topic." + }, + { + "speaker": "A", + "text": "Wait, did you mention where exactly the church is? I might need to visit it first before meeting your cousin.", + "original_text": "Wait, did you mention where exactly the church is? I might need to visit it first before meeting your cousin.", + "start_time": 34.7334326313313, + "end_time": 41.30467979686418, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/temp/line_4_A.wav", + "silence_duration": 0.5714293578268721, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's on the west end of Ivy Street, just 2 blocks from here. And about the meeting, just let me know when you're ready, and I'll set it up.", + "original_text": "Yes, it's on the west end of Ivy Street, just 2 blocks from here. And about the meeting, just let me know when you're ready, and I'll set it up.", + "start_time": 41.885036065033766, + "end_time": 49.524401144398844, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/temp/line_5_B.wav", + "silence_duration": 0.580356268169588, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Perfect. Thanks again, Izek.", + "original_text": "Perfect. Thanks again, Izek.", + "start_time": 50.05959803955658, + "end_time": 52.95048239329808, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--99/temp/line_6_A.wav", + "silence_duration": 0.5351968951577417, + "is_interrupted": false + } + ] + }, + "DialogSum--val--100": { + "original_text": "A: Well, it's a nice room. Hmm... is there anything that I should [interrupt] be aware of regarding the house rules or any specific guidelines you have? I'd really appreciate knowing all the details upfront so we can avoid any misunderstandings later.\nB: Sorry to interrupt, but I just remembered something—do you allow pets? I have a small dog.\nA: Oh, I don't allow the cat to go upstairs at all, and I don't allow people to smoke in the bedrooms.\nB: Oh, I agree with that. I don't smoke anyway. But you mentioned cats—what about dogs?\nA: I don't allow dogs upstairs either, and I don't allow people to stick pictures up on the walls.\nB: Oh, I see. Can I use small nails or something?\nA: Oh yes, something like that is quite acceptable, and there are just two more things if you don't mind. If you go out, would you please remember to close the window?\nB: Right. I'll do that. By the way, you were about to mention something else after the window?\nA: Ah, yes, and there is the kettle. When you boil it, could you please put it on the floor? It's just a safety precaution I like to follow.", + "cleaned_text": "A:Well, it's a nice room. Hmm... is there anything that I should be aware of regarding the house rules or any specific guidelines you have? I'd really appreciate knowing all the details upfront so we can avoid any misunderstandings later.\nB: Sorry to interrupt, but I just remembered something—do you allow pets? I have a small dog.\nA: Oh, I don't allow the cat to go upstairs at all, and I don't allow people to smoke in the bedrooms.\nB: Oh, I agree with that. I don't smoke anyway. But you mentioned cats—what about dogs?\nA: I don't allow dogs upstairs either, and I don't allow people to stick pictures up on the walls.\nB: Oh, I see. Can I use small nails or something?\nA: Oh yes, something like that is quite acceptable, and there are just two more things if you don't mind. If you go out, would you please remember to close the window?\nB: Right. I'll do that. By the way, you were about to mention something else after the window?\nA: Ah, yes, and there is the kettle. When you boil it, could you please put it on the floor? It's just a safety precaution I like to follow.", + "total_duration": 57.12897959183673, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, it's a nice room. Hmm... is there anything that I should", + "original_text": "Well, it's a nice room. Hmm... is there anything that I should [interrupt] be aware of regarding the house rules or any specific guidelines you have? I'd really appreciate knowing all the details upfront so we can avoid any misunderstandings later.", + "start_time": 0, + "end_time": 14.349931972789115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "be aware of regarding the house rules or any specific guidelines you have? I'd really appreciate knowing all the details upfront so we can avoid any misunderstandings later." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I just remembered something—do you allow pets? I have a small dog.", + "original_text": "Sorry to interrupt, but I just remembered something—do you allow pets? I have a small dog.", + "start_time": 3.912562358276644, + "end_time": 9.09061224489796, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_1_B.wav", + "silence_duration": 0.44416357069320417, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I don't allow the cat to go upstairs at all, and I don't allow people to smoke in the bedrooms.", + "original_text": "Oh, I don't allow the cat to go upstairs at all, and I don't allow people to smoke in the bedrooms.", + "start_time": 14.675872366795783, + "end_time": 20.631790734142722, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_2_A.wav", + "silence_duration": 0.3259403940066688, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I agree with that. I don't smoke anyway. But you mentioned cats—what about dogs?", + "original_text": "Oh, I agree with that. I don't smoke anyway. But you mentioned cats—what about dogs?", + "start_time": 21.061794461933868, + "end_time": 25.39231600388398, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_3_B.wav", + "silence_duration": 0.43000372779114615, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't allow dogs upstairs either, and I don't allow people to stick pictures up on the walls.", + "original_text": "I don't allow dogs upstairs either, and I don't allow people to stick pictures up on the walls.", + "start_time": 25.871686513102215, + "end_time": 31.50252551536979, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_4_A.wav", + "silence_duration": 0.4793705092182363, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I see. Can I use small nails or something?", + "original_text": "Oh, I see. Can I use small nails or something?", + "start_time": 32.02774919789171, + "end_time": 34.802533778390575, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_5_B.wav", + "silence_duration": 0.5252236825219191, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh yes, something like that is quite acceptable, and there are just two more things if you don't mind. If you go out, would you please remember to close the window?", + "original_text": "Oh yes, something like that is quite acceptable, and there are just two more things if you don't mind. If you go out, would you please remember to close the window?", + "start_time": 35.23802529028443, + "end_time": 44.38668742180371, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_6_A.wav", + "silence_duration": 0.43549151189385893, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right. I'll do that. By the way, you were about to mention something else after the window?", + "original_text": "Right. I'll do that. By the way, you were about to mention something else after the window?", + "start_time": 44.688052501535, + "end_time": 48.925694224891004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_7_B.wav", + "silence_duration": 0.3013650797312903, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah, yes, and there is the kettle. When you boil it, could you please put it on the floor? It's just a safety precaution I like to follow.", + "original_text": "Ah, yes, and there is the kettle. When you boil it, could you please put it on the floor? It's just a safety precaution I like to follow.", + "start_time": 49.23422093537065, + "end_time": 57.129005515869515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--100/temp/line_8_A.wav", + "silence_duration": 0.30852671047964947, + "is_interrupted": false + } + ] + }, + "DialogSum--val--101": { + "original_text": "A: Excuse me, sir. You can't park here. \nB: I am just waiting for my friends. It won't be [interrupt] long. They should be here any minute now because we have an important appointment to attend and I don't want to be late for it. \nA: Sorry, but even if it's just for a short time, the curb here is not for parking. \nB: But I didn't see the sign, Ma 'am. \nA: There is a sign at the corner of the street. When you turned in here, you should have [interrupt] noticed it clearly since it's painted in bright yellow with bold red letters warning about the no parking zone. \nB: Oh, I must have missed it. Could you point out exactly where the sign is? \nA: Sure, it's right at the corner where you made the turn. You might want to check it out to avoid any future issues.", + "cleaned_text": "A: Excuse me, sir. You can't park here. \nB:I am just waiting for my friends. It won't be long. They should be here any minute now because we have an important appointment to attend and I don't want to be late for it.\nA: Sorry, but even if it's just for a short time, the curb here is not for parking. \nB: But I didn't see the sign, Ma 'am. \nA:There is a sign at the corner of the street. When you turned in here, you should have noticed it clearly since it's painted in bright yellow with bold red letters warning about the no parking zone.\nB: Oh, I must have missed it. Could you point out exactly where the sign is? \nA: Sure, it's right at the corner where you made the turn. You might want to check it out to avoid any future issues.", + "total_duration": 35.694331065759634, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, sir. You can't park here.", + "original_text": "Excuse me, sir. You can't park here.", + "start_time": 0, + "end_time": 2.391655328798186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I am just waiting for my friends. It won't be", + "original_text": "I am just waiting for my friends. It won't be [interrupt] long. They should be here any minute now because we have an important appointment to attend and I don't want to be late for it.", + "start_time": 2.9910471439960573, + "end_time": 11.44311063605955, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/temp/line_1_B.wav", + "silence_duration": 0.5993918151978711, + "is_interrupted": true, + "text_after_interrupt": "long. They should be here any minute now because we have an important appointment to attend and I don't want to be late for it." + }, + { + "speaker": "A", + "text": "Sorry, but even if it's just for a short time, the curb here is not for parking.", + "original_text": "Sorry, but even if it's just for a short time, the curb here is not for parking.", + "start_time": 5.382702472794243, + "end_time": 10.676852132658189, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/temp/line_2_A.wav", + "silence_duration": 0.5833639844809844, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But I didn't see the sign, Ma 'am.", + "original_text": "But I didn't see the sign, Ma 'am.", + "start_time": 11.980746940177632, + "end_time": 13.989273017275137, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/temp/line_3_B.wav", + "silence_duration": 0.5376363041180818, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There is a sign at the corner of the street. When you turned in here, you should have", + "original_text": "There is a sign at the corner of the street. When you turned in here, you should have [interrupt] noticed it clearly since it's painted in bright yellow with bold red letters warning about the no parking zone.", + "start_time": 14.331440241409563, + "end_time": 25.38413865410798, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/temp/line_4_A.wav", + "silence_duration": 0.342167224134427, + "is_interrupted": true, + "text_after_interrupt": "noticed it clearly since it's painted in bright yellow with bold red letters warning about the no parking zone." + }, + { + "speaker": "B", + "text": "Oh, I must have missed it. Could you point out exactly where the sign is?", + "original_text": "Oh, I must have missed it. Could you point out exactly where the sign is?", + "start_time": 25.093300037527968, + "end_time": 28.750442894670826, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/temp/line_5_B.wav", + "silence_duration": 0.5649350205469783, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, it's right at the corner where you made the turn. You might want to check it out to avoid any future issues.", + "original_text": "Sure, it's right at the corner where you made the turn. You might want to check it out to avoid any future issues.", + "start_time": 29.21597889472425, + "end_time": 35.69434624166303, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--101/temp/line_6_A.wav", + "silence_duration": 0.4655360000534231, + "is_interrupted": false + } + ] + }, + "DialogSum--val--102": { + "original_text": "A: That China-gown of Tang-Dynasty style is so beautiful. Would you show it to me, please? \nB: Absolutely. Here it is. \nA: Could I try it on? \nB: Please do, the fitting-room is over there. \nA: It feels a little tight around the waist. Do you have a bigger [interrupt] size available in this style with the same intricate embroidery and high-quality silk fabric? \nB: Oh, before I forget, are you looking for this specific color, or would you consider other options? \nA: I was actually hoping for this color, but it's tight. Do you have a bigger size in this color? \nB: I'm sorry. We don't have this color in your size. We have some green ones in your size. Would you please have a look at this green one? \nA: OK. How much does it cost compared to the one I tried on? \nB: Oh, and just to clarify, the green one is the same price as the original. \nA: Got it. So, how much does it [interrupt] cost including any potential discounts or special offers you might have for this particular collection? \nB: It's 486 yuan.", + "cleaned_text": "A: That China-gown of Tang-Dynasty style is so beautiful. Would you show it to me, please? \nB: Absolutely. Here it is. \nA: Could I try it on? \nB: Please do, the fitting-room is over there. \nA:It feels a little tight around the waist. Do you have a bigger size available in this style with the same intricate embroidery and high-quality silk fabric?\nB: Oh, before I forget, are you looking for this specific color, or would you consider other options? \nA: I was actually hoping for this color, but it's tight. Do you have a bigger size in this color? \nB: I'm sorry. We don't have this color in your size. We have some green ones in your size. Would you please have a look at this green one? \nA: OK. How much does it cost compared to the one I tried on? \nB: Oh, and just to clarify, the green one is the same price as the original. \nA:Got it. So, how much does it cost including any potential discounts or special offers you might have for this particular collection?\nB: It's 486 yuan.", + "total_duration": 52.09328798185941, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "That China-gown of Tang-Dynasty style is so beautiful. Would you show it to me, please?", + "original_text": "That China-gown of Tang-Dynasty style is so beautiful. Would you show it to me, please?", + "start_time": 0, + "end_time": 5.375419501133787, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Absolutely. Here it is.", + "original_text": "Absolutely. Here it is.", + "start_time": 5.825248403384824, + "end_time": 7.473865183430176, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_1_B.wav", + "silence_duration": 0.4498289022510375, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Could I try it on?", + "original_text": "Could I try it on?", + "start_time": 7.926489235500897, + "end_time": 9.075876990602938, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_2_A.wav", + "silence_duration": 0.45262405207072093, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Please do, the fitting-room is over there.", + "original_text": "Please do, the fitting-room is over there.", + "start_time": 9.494639872137023, + "end_time": 11.572825813180106, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_3_B.wav", + "silence_duration": 0.41876288153408603, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It feels a little tight around the waist. Do you have a bigger", + "original_text": "It feels a little tight around the waist. Do you have a bigger [interrupt] size available in this style with the same intricate embroidery and high-quality silk fabric?", + "start_time": 12.147682027310628, + "end_time": 21.44727386404532, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_4_A.wav", + "silence_duration": 0.574856214130522, + "is_interrupted": true, + "text_after_interrupt": "size available in this style with the same intricate embroidery and high-quality silk fabric?" + }, + { + "speaker": "B", + "text": "Oh, before I forget, are you looking for this specific color, or would you consider other options?", + "original_text": "Oh, before I forget, are you looking for this specific color, or would you consider other options?", + "start_time": 15.642285201913802, + "end_time": 20.135346426403597, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_5_B.wav", + "silence_duration": 0.35638942073244195, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was actually hoping for this color, but it's tight. Do you have a bigger size in this color?", + "original_text": "I was actually hoping for this color, but it's tight. Do you have a bigger size in this color?", + "start_time": 21.998387016072186, + "end_time": 27.176436902693503, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_6_A.wav", + "silence_duration": 0.5511131520268651, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm sorry. We don't have this color in your size. We have some green ones in your size. Would you please have a look at this green one?", + "original_text": "I'm sorry. We don't have this color in your size. We have some green ones in your size. Would you please have a look at this green one?", + "start_time": 27.543948159219596, + "end_time": 33.47664657191801, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_7_B.wav", + "silence_duration": 0.3675112565260921, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. How much does it cost compared to the one I tried on?", + "original_text": "OK. How much does it cost compared to the one I tried on?", + "start_time": 34.01877784122632, + "end_time": 38.268029541906586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_8_A.wav", + "silence_duration": 0.5421312693083097, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, and just to clarify, the green one is the same price as the original.", + "original_text": "Oh, and just to clarify, the green one is the same price as the original.", + "start_time": 38.584287775744315, + "end_time": 42.520070088669485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_9_B.wav", + "silence_duration": 0.3162582338377267, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. So, how much does it", + "original_text": "Got it. So, how much does it [interrupt] cost including any potential discounts or special offers you might have for this particular collection?", + "start_time": 42.98744834613286, + "end_time": 51.381461951575034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_10_A.wav", + "silence_duration": 0.4673782574633764, + "is_interrupted": true, + "text_after_interrupt": "cost including any potential discounts or special offers you might have for this particular collection?" + }, + { + "speaker": "B", + "text": "It's 486 yuan.", + "original_text": "It's 486 yuan.", + "start_time": 50.154458579479154, + "end_time": 52.09332479263108, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--102/temp/line_11_B.wav", + "silence_duration": 0.3671991987014219, + "is_interrupted": false + } + ] + }, + "DialogSum--val--103": { + "original_text": "A: Hello, I brought a lap-top computer with me. Do you know how can I use the internet in my room?\nB: Well, right now, we can't afford internet use in the rooms. But you can go to the web [interrupt] connect in the lobby or other common areas where we've set up high-speed WiFi hotspots that are available 24/7 for all our guests' convenience.\nA: Oh, is there any possibility of getting internet access in the room, even if I have to pay extra?\nB: Unfortunately, we don't have that option at the moment. However, I was about to mention that the web bar is on the 12th floor. Would that work for you?", + "cleaned_text": "A: Hello, I brought a lap-top computer with me. Do you know how can I use the internet in my room?\nB:Well, right now, we can't afford internet use in the rooms. But you can go to the web connect in the lobby or other common areas where we've set up high-speed WiFi hotspots that are available 24/7 for all our guests' convenience.\nA: Oh, is there any possibility of getting internet access in the room, even if I have to pay extra?\nB: Unfortunately, we don't have that option at the moment. However, I was about to mention that the web bar is on the 12th floor. Would that work for you?", + "total_duration": 26.8518820861678, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--103/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--103/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--103/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, I brought a lap-top computer with me. Do you know how can I use the internet in my room?", + "original_text": "Hello, I brought a lap-top computer with me. Do you know how can I use the internet in my room?", + "start_time": 0, + "end_time": 6.2345578231292516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--103/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, right now, we can't afford internet use in the rooms. But you can go to the web", + "original_text": "Well, right now, we can't afford internet use in the rooms. But you can go to the web [interrupt] connect in the lobby or other common areas where we've set up high-speed WiFi hotspots that are available 24/7 for all our guests' convenience.", + "start_time": 6.677735887511609, + "end_time": 19.413881012228163, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--103/temp/line_1_B.wav", + "silence_duration": 0.44317806438235785, + "is_interrupted": true, + "text_after_interrupt": "connect in the lobby or other common areas where we've set up high-speed WiFi hotspots that are available 24/7 for all our guests' convenience." + }, + { + "speaker": "A", + "text": "Oh, is there any possibility of getting internet access in the room, even if I have to pay extra?", + "original_text": "Oh, is there any possibility of getting internet access in the room, even if I have to pay extra?", + "start_time": 10.99664745213746, + "end_time": 17.312475116536554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--103/temp/line_2_A.wav", + "silence_duration": 0.5695054946243108, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Unfortunately, we don't have that option at the moment. However, I was about to mention that the web bar is on the 12th floor. Would that work for you?", + "original_text": "Unfortunately, we don't have that option at the moment. However, I was about to mention that the web bar is on the 12th floor. Would that work for you?", + "start_time": 19.78141815262876, + "end_time": 26.851894343104952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--103/temp/line_3_B.wav", + "silence_duration": 0.36753714040059643, + "is_interrupted": false + } + ] + }, + "DialogSum--val--104": { + "original_text": "A: Can I have a look at that digital camera please? \nB: Yes of course. This is a really good one actually. It features a high-resolution sensor and advanced image stabilization [interrupt] technology that makes it perfect for both professional photographers and casual users who want to capture stunning photos in any lighting condition. \nA: How much does it cost? I'm trying to stay within my budget. \nB: Sorry, before I forget, I wanted to mention that there's a discount on accessories if you buy the camera today. \nA: That sounds great! But I was asking, how much does it cost? \nB: Oh, right! This one is 1500 yuan. \nA: It looks pretty good. I think I'll take it. \nB: Would you like anything else? \nA: Actually, about those accessories you mentioned earlier—what kind of discount are we talking about?", + "cleaned_text": "A: Can I have a look at that digital camera please? \nB:Yes of course. This is a really good one actually. It features a high-resolution sensor and advanced image stabilization technology that makes it perfect for both professional photographers and casual users who want to capture stunning photos in any lighting condition.\nA: How much does it cost? I'm trying to stay within my budget. \nB: Sorry, before I forget, I wanted to mention that there's a discount on accessories if you buy the camera today. \nA: That sounds great! But I was asking, how much does it cost? \nB: Oh, right! This one is 1500 yuan. \nA: It looks pretty good. I think I'll take it. \nB: Would you like anything else? \nA: Actually, about those accessories you mentioned earlier—what kind of discount are we talking about?", + "total_duration": 43.38848072562358, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can I have a look at that digital camera please?", + "original_text": "Can I have a look at that digital camera please?", + "start_time": 0, + "end_time": 2.4961451247165534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes of course. This is a really good one actually. It features a high-resolution sensor and advanced image stabilization", + "original_text": "Yes of course. This is a really good one actually. It features a high-resolution sensor and advanced image stabilization [interrupt] technology that makes it perfect for both professional photographers and casual users who want to capture stunning photos in any lighting condition.", + "start_time": 2.837776547861973, + "end_time": 17.129658634029774, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_1_B.wav", + "silence_duration": 0.34163142314541955, + "is_interrupted": true, + "text_after_interrupt": "technology that makes it perfect for both professional photographers and casual users who want to capture stunning photos in any lighting condition." + }, + { + "speaker": "A", + "text": "How much does it cost? I'm trying to stay within my budget.", + "original_text": "How much does it cost? I'm trying to stay within my budget.", + "start_time": 9.536733463961745, + "end_time": 13.205486298428866, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_2_A.wav", + "silence_duration": 0.353340906311347, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry, before I forget, I wanted to mention that there's a discount on accessories if you buy the camera today.", + "original_text": "Sorry, before I forget, I wanted to mention that there's a discount on accessories if you buy the camera today.", + "start_time": 17.710926979129855, + "end_time": 23.968704756907634, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_3_B.wav", + "silence_duration": 0.5812683451000825, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds great! But I was asking, how much does it cost?", + "original_text": "That sounds great! But I was asking, how much does it cost?", + "start_time": 24.48188330940715, + "end_time": 28.41766562233232, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_4_A.wav", + "silence_duration": 0.5131785524995133, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! This one is 1500 yuan.", + "original_text": "Oh, right! This one is 1500 yuan.", + "start_time": 28.721312497075825, + "end_time": 31.112967825874012, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_5_B.wav", + "silence_duration": 0.3036468747435059, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It looks pretty good. I think I'll take it.", + "original_text": "It looks pretty good. I think I'll take it.", + "start_time": 31.651901824977752, + "end_time": 35.3438746140934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_6_A.wav", + "silence_duration": 0.5389339991037414, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Would you like anything else?", + "original_text": "Would you like anything else?", + "start_time": 35.781532124256046, + "end_time": 37.09345956189777, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_7_B.wav", + "silence_duration": 0.437657510162642, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, about those accessories you mentioned earlier—what kind of discount are we talking about?", + "original_text": "Actually, about those accessories you mentioned earlier—what kind of discount are we talking about?", + "start_time": 37.65315353732676, + "end_time": 43.3884823355127, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--104/temp/line_8_A.wav", + "silence_duration": 0.5596939754289936, + "is_interrupted": false + } + ] + }, + "DialogSum--val--105": { + "original_text": "A: We really were lucky. We got the last available table for two—and we didn't even have a reservation! Did you see the long lines behind [interrupt] us stretching all the way out the door? I was worried we might have to wait for hours if we hadn't arrived when we did.\nB: Sorry, just thinking, should we order something to drink first? I'm really thirsty.\nA: Oh, good idea! We can ask for drinks while we look at the menu. But I was asking if you noticed the long lines behind us?\nB: Yeah, I did. I'm glad that we didn't have to wait long. I'm starving!\nA: Let's take a look at the menu so we can order. Do you want to choose an appetizer for us to start with? I'm open to anything.\nB: Oh, I was thinking about either samosas or poppadoms. What would you rather have?\nA: I heard that one of their specialties is the samosa [interrupt] which comes with three different chutneys and is made with a secret family recipe that's been passed down for generations.\nB: Well, let's get a plate of those then.\nA: Sounds good. What are you going to have for your main course?\nB: I think I might have a dahl.\nA: What's in a dahl?\nB: It's got chickpeas and vegetables in a spicy curry sauce with rice.\nA: That sounds nice. Do you want to share some kebabs as well?\nB: Ok. How about some lamb kebabs?", + "cleaned_text": "A:We really were lucky. We got the last available table for two—and we didn't even have a reservation! Did you see the long lines behind us stretching all the way out the door? I was worried we might have to wait for hours if we hadn't arrived when we did.\nB: Sorry, just thinking, should we order something to drink first? I'm really thirsty.\nA: Oh, good idea! We can ask for drinks while we look at the menu. But I was asking if you noticed the long lines behind us?\nB: Yeah, I did. I'm glad that we didn't have to wait long. I'm starving!\nA: Let's take a look at the menu so we can order. Do you want to choose an appetizer for us to start with? I'm open to anything.\nB: Oh, I was thinking about either samosas or poppadoms. What would you rather have?\nA:I heard that one of their specialties is the samosa which comes with three different chutneys and is made with a secret family recipe that's been passed down for generations.\nB: Well, let's get a plate of those then.\nA: Sounds good. What are you going to have for your main course?\nB: I think I might have a dahl.\nA: What's in a dahl?\nB: It's got chickpeas and vegetables in a spicy curry sauce with rice.\nA: That sounds nice. Do you want to share some kebabs as well?\nB: Ok. How about some lamb kebabs?", + "total_duration": 71.26036281179138, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "We really were lucky. We got the last available table for two—and we didn't even have a reservation! Did you see the long lines behind", + "original_text": "We really were lucky. We got the last available table for two—and we didn't even have a reservation! Did you see the long lines behind [interrupt] us stretching all the way out the door? I was worried we might have to wait for hours if we hadn't arrived when we did.", + "start_time": 0, + "end_time": 15.534149659863946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "us stretching all the way out the door? I was worried we might have to wait for hours if we hadn't arrived when we did." + }, + { + "speaker": "B", + "text": "Sorry, just thinking, should we order something to drink first? I'm really thirsty.", + "original_text": "Sorry, just thinking, should we order something to drink first? I'm really thirsty.", + "start_time": 8.870022675736962, + "end_time": 13.583673469387755, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_1_B.wav", + "silence_duration": 0.43142021535043396, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, good idea! We can ask for drinks while we look at the menu. But I was asking if you noticed the long lines behind us?", + "original_text": "Oh, good idea! We can ask for drinks while we look at the menu. But I was asking if you noticed the long lines behind us?", + "start_time": 16.12832170026988, + "end_time": 23.639977029068064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_2_A.wav", + "silence_duration": 0.5941720404059317, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I did. I'm glad that we didn't have to wait long. I'm starving!", + "original_text": "Yeah, I did. I'm glad that we didn't have to wait long. I'm starving!", + "start_time": 24.232106666509296, + "end_time": 28.504578321838093, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_3_B.wav", + "silence_duration": 0.5921296374412336, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let's take a look at the menu so we can order. Do you want to choose an appetizer for us to start with? I'm open to anything.", + "original_text": "Let's take a look at the menu so we can order. Do you want to choose an appetizer for us to start with? I'm open to anything.", + "start_time": 29.000446714684767, + "end_time": 36.59337188475279, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_4_A.wav", + "silence_duration": 0.4958683928466757, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I was thinking about either samosas or poppadoms. What would you rather have?", + "original_text": "Oh, I was thinking about either samosas or poppadoms. What would you rather have?", + "start_time": 37.05676767509047, + "end_time": 41.66592867282289, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_5_B.wav", + "silence_duration": 0.46339579033767847, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I heard that one of their specialties is the samosa", + "original_text": "I heard that one of their specialties is the samosa [interrupt] which comes with three different chutneys and is made with a secret family recipe that's been passed down for generations.", + "start_time": 42.22556719303251, + "end_time": 52.11726787330462, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_6_A.wav", + "silence_duration": 0.5596385202096177, + "is_interrupted": true, + "text_after_interrupt": "which comes with three different chutneys and is made with a secret family recipe that's been passed down for generations." + }, + { + "speaker": "B", + "text": "Well, let's get a plate of those then.", + "original_text": "Well, let's get a plate of those then.", + "start_time": 49.71076289785657, + "end_time": 52.04436834003344, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_7_B.wav", + "silence_duration": 0.5909607226400633, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sounds good. What are you going to have for your main course?", + "original_text": "Sounds good. What are you going to have for your main course?", + "start_time": 52.42127006736166, + "end_time": 55.75333355942515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_8_A.wav", + "silence_duration": 0.30400219405703804, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think I might have a dahl.", + "original_text": "I think I might have a dahl.", + "start_time": 56.11171669249244, + "end_time": 57.644233699295164, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_9_B.wav", + "silence_duration": 0.3583831330672956, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What's in a dahl?", + "original_text": "What's in a dahl?", + "start_time": 57.96861086608001, + "end_time": 59.11799862118205, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_10_A.wav", + "silence_duration": 0.32437716678484896, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's got chickpeas and vegetables in a spicy curry sauce with rice.", + "original_text": "It's got chickpeas and vegetables in a spicy curry sauce with rice.", + "start_time": 59.45452870734249, + "end_time": 63.05362167786403, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_11_B.wav", + "silence_duration": 0.3365300861604357, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds nice. Do you want to share some kebabs as well?", + "original_text": "That sounds nice. Do you want to share some kebabs as well?", + "start_time": 63.59071734383003, + "end_time": 67.54971961140373, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_12_A.wav", + "silence_duration": 0.5370956659659982, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ok. How about some lamb kebabs?", + "original_text": "Ok. How about some lamb kebabs?", + "start_time": 67.90509990354427, + "end_time": 71.26038335025629, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--105/temp/line_13_B.wav", + "silence_duration": 0.35538029214053646, + "is_interrupted": false + } + ] + }, + "DialogSum--val--106": { + "original_text": "A: You went out on a date last night, didn't you? \nB: Yes, I did, but Linda stood me up. She didn't keep the date for the first [interrupt] time, and it's starting to make me wonder if she's losing interest or if there's something else going on that she hasn't told me about yet. \nA: Wait, she stood you up? That must have been frustrating. Did she give any reason at all? \nB: I don't know. I tried calling her this morning, but she hung up on me. I think she is going to walk out on our relationship, and I'm not sure what to do about it. \nA: Hold on, she hung up on you? That sounds serious. Maybe you should try talking to her in person instead of over the phone. \nB: You're right, I should try that. I still need to figure out why she didn't keep the date last night. \nA: Yeah, understanding what happened could really help. Good luck with that, and don't hesitate to reach out if you need more advice. \nB: I will. Thanks for your advice.", + "cleaned_text": "A: You went out on a date last night, didn't you? \nB:Yes, I did, but Linda stood me up. She didn't keep the date for the first time, and it's starting to make me wonder if she's losing interest or if there's something else going on that she hasn't told me about yet.\nA: Wait, she stood you up? That must have been frustrating. Did she give any reason at all? \nB: I don't know. I tried calling her this morning, but she hung up on me. I think she is going to walk out on our relationship, and I'm not sure what to do about it. \nA: Hold on, she hung up on you? That sounds serious. Maybe you should try talking to her in person instead of over the phone. \nB: You're right, I should try that. I still need to figure out why she didn't keep the date last night. \nA: Yeah, understanding what happened could really help. Good luck with that, and don't hesitate to reach out if you need more advice. \nB: I will. Thanks for your advice.", + "total_duration": 44.97369614512472, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You went out on a date last night, didn't you?", + "original_text": "You went out on a date last night, didn't you?", + "start_time": 0, + "end_time": 2.414875283446712, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I did, but Linda stood me up. She didn't keep the date for the first", + "original_text": "Yes, I did, but Linda stood me up. She didn't keep the date for the first [interrupt] time, and it's starting to make me wonder if she's losing interest or if there's something else going on that she hasn't told me about yet.", + "start_time": 2.7727823642907645, + "end_time": 13.512011389234075, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_1_B.wav", + "silence_duration": 0.3579070808440525, + "is_interrupted": true, + "text_after_interrupt": "time, and it's starting to make me wonder if she's losing interest or if there's something else going on that she hasn't told me about yet." + }, + { + "speaker": "A", + "text": "Wait, she stood you up? That must have been frustrating. Did she give any reason at all?", + "original_text": "Wait, she stood you up? That must have been frustrating. Did she give any reason at all?", + "start_time": 6.871104359755616, + "end_time": 12.525163316671716, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_2_A.wav", + "silence_duration": 0.4359612979804942, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't know. I tried calling her this morning, but she hung up on me. I think she is going to walk out on our relationship, and I'm not sure what to do about it.", + "original_text": "I don't know. I tried calling her this morning, but she hung up on me. I think she is going to walk out on our relationship, and I'm not sure what to do about it.", + "start_time": 13.90026085171008, + "end_time": 21.713775590939104, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_3_B.wav", + "silence_duration": 0.38824946247600484, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hold on, she hung up on you? That sounds serious. Maybe you should try talking to her in person instead of over the phone.", + "original_text": "Hold on, she hung up on you? That sounds serious. Maybe you should try talking to her in person instead of over the phone.", + "start_time": 22.287616727310912, + "end_time": 29.567072509623838, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_4_A.wav", + "silence_duration": 0.5738411363718097, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You're right, I should try that. I still need to figure out why she didn't keep the date last night.", + "original_text": "You're right, I should try that. I still need to figure out why she didn't keep the date last night.", + "start_time": 30.024738634811072, + "end_time": 34.738389428461865, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_5_B.wav", + "silence_duration": 0.45766612518723593, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, understanding what happened could really help. Good luck with that, and don't hesitate to reach out if you need more advice.", + "original_text": "Yeah, understanding what happened could really help. Good luck with that, and don't hesitate to reach out if you need more advice.", + "start_time": 35.22747031425936, + "end_time": 42.84361543897591, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_6_A.wav", + "silence_duration": 0.48908088579748954, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I will. Thanks for your advice.", + "original_text": "I will. Thanks for your advice.", + "start_time": 43.17417976708361, + "end_time": 44.97372625234438, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--106/temp/line_7_B.wav", + "silence_duration": 0.33056432810769704, + "is_interrupted": false + } + ] + }, + "DialogSum--val--107": { + "original_text": "A: Excuse me. This chicken doesn't taste right to me. \nB: What seems to be the [interrupt] wrong with it? The texture, the flavor, or maybe something else specifically that's bothering you about the dish? \nA: How should I know? It's just kind of cold in the middle. It just doesn't taste right. Do you want to try it? \nB: Well, let me get that out of your way. Would you like to order something else from the menu? Or I could bring you another order of chicken if you'd [interrupt] prefer that instead, though I completely understand if you'd rather try something different given this experience. \nA: Another one? I don't want another one. Give me something simple. You've got steak, right? \nB: Yes, we do. How would you like it cooked?", + "cleaned_text": "A: Excuse me. This chicken doesn't taste right to me. \nB:What seems to be the wrong with it? The texture, the flavor, or maybe something else specifically that's bothering you about the dish?\nA: How should I know? It's just kind of cold in the middle. It just doesn't taste right. Do you want to try it? \nB:Well, let me get that out of your way. Would you like to order something else from the menu? Or I could bring you another order of chicken if you'd prefer that instead, though I completely understand if you'd rather try something different given this experience.\nA: Another one? I don't want another one. Give me something simple. You've got steak, right? \nB: Yes, we do. How would you like it cooked?", + "total_duration": 33.690068027210884, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. This chicken doesn't taste right to me.", + "original_text": "Excuse me. This chicken doesn't taste right to me.", + "start_time": 0, + "end_time": 3.355283446712018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What seems to be the", + "original_text": "What seems to be the [interrupt] wrong with it? The texture, the flavor, or maybe something else specifically that's bothering you about the dish?", + "start_time": 3.9547259609890695, + "end_time": 11.013592174140996, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/temp/line_1_B.wav", + "silence_duration": 0.5994425142770512, + "is_interrupted": true, + "text_after_interrupt": "wrong with it? The texture, the flavor, or maybe something else specifically that's bothering you about the dish?" + }, + { + "speaker": "A", + "text": "How should I know? It's just kind of cold in the middle. It just doesn't taste right. Do you want to try it?", + "original_text": "How should I know? It's just kind of cold in the middle. It just doesn't taste right. Do you want to try it?", + "start_time": 5.034453852145532, + "end_time": 11.82629058683941, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/temp/line_2_A.wav", + "silence_duration": 0.4788460372201747, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, let me get that out of your way. Would you like to order something else from the menu? Or I could bring you another order of chicken if you'd", + "original_text": "Well, let me get that out of your way. Would you like to order something else from the menu? Or I could bring you another order of chicken if you'd [interrupt] prefer that instead, though I completely understand if you'd rather try something different given this experience.", + "start_time": 12.151347105509645, + "end_time": 23.58717476990874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/temp/line_3_B.wav", + "silence_duration": 0.3250565186702355, + "is_interrupted": true, + "text_after_interrupt": "prefer that instead, though I completely understand if you'd rather try something different given this experience." + }, + { + "speaker": "A", + "text": "Another one? I don't want another one. Give me something simple. You've got steak, right?", + "original_text": "Another one? I don't want another one. Give me something simple. You've got steak, right?", + "start_time": 24.544576655555723, + "end_time": 30.477275068254137, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/temp/line_4_A.wav", + "silence_duration": 0.5630438121146621, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, we do. How would you like it cooked?", + "original_text": "Yes, we do. How would you like it cooked?", + "start_time": 31.019806920081997, + "end_time": 33.690101704662496, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--107/temp/line_5_B.wav", + "silence_duration": 0.5425318518278606, + "is_interrupted": false + } + ] + }, + "DialogSum--val--108": { + "original_text": "A: Will you be joining Billy and I at the Bar?\nB: Which one will you be [interrupt] going to? I've heard there are several new establishments that have opened downtown recently, each with their own unique atmosphere and specialty cocktails.\nA: Sorry, we're going to try the new one that opened up on 17th Street.\nB: Sure, I've been meaning to visit that place myself. I want to stop off at my apartment to get changed so I should be there by 9 pm.\nA: OK, can I bring a date with me?\nB: Certainly. But if there are going to be four of us, I had better make reservations.\nA: Yes. that is a very good idea. It would be a shame if we could not find a place to sit.\nB: Then I'II make reservations for 9 pm for a party of four.\nA: I'll be there. Oh, is there a cover charge at the bar?\nB: Not that I know of. Why do you ask?\nA: I just want to make sure I bring enough money for my date and I. By the way, did you already mention the name of the bar?", + "cleaned_text": "A: Will you be joining Billy and I at the Bar?\nB:Which one will you be going to? I've heard there are several new establishments that have opened downtown recently, each with their own unique atmosphere and specialty cocktails.\nA: Sorry, we're going to try the new one that opened up on 17th Street.\nB: Sure, I've been meaning to visit that place myself. I want to stop off at my apartment to get changed so I should be there by 9 pm.\nA: OK, can I bring a date with me?\nB: Certainly. But if there are going to be four of us, I had better make reservations.\nA: Yes. that is a very good idea. It would be a shame if we could not find a place to sit.\nB: Then I'II make reservations for 9 pm for a party of four.\nA: I'll be there. Oh, is there a cover charge at the bar?\nB: Not that I know of. Why do you ask?\nA: I just want to make sure I bring enough money for my date and I. By the way, did you already mention the name of the bar?", + "total_duration": 50.3809977324263, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Will you be joining Billy and I at the Bar?", + "original_text": "Will you be joining Billy and I at the Bar?", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Which one will you be", + "original_text": "Which one will you be [interrupt] going to? I've heard there are several new establishments that have opened downtown recently, each with their own unique atmosphere and specialty cocktails.", + "start_time": 2.9431991661357904, + "end_time": 11.476532499469123, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_1_B.wav", + "silence_duration": 0.3541742228251327, + "is_interrupted": true, + "text_after_interrupt": "going to? I've heard there are several new establishments that have opened downtown recently, each with their own unique atmosphere and specialty cocktails." + }, + { + "speaker": "A", + "text": "Sorry, we're going to try the new one that opened up on 17th Street.", + "original_text": "Sorry, we're going to try the new one that opened up on 17th Street.", + "start_time": 3.9764871479952006, + "end_time": 8.051589188811526, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_2_A.wav", + "silence_duration": 0.40065565110640783, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, I've been meaning to visit that place myself. I want to stop off at my apartment to get changed so I should be there by 9 pm.", + "original_text": "Sure, I've been meaning to visit that place myself. I want to stop off at my apartment to get changed so I should be there by 9 pm.", + "start_time": 11.84326162477378, + "end_time": 18.820857996655867, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_3_B.wav", + "silence_duration": 0.36672912530465673, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, can I bring a date with me?", + "original_text": "OK, can I bring a date with me?", + "start_time": 19.141563556072065, + "end_time": 21.556438839518776, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_4_A.wav", + "silence_duration": 0.3207055594161968, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Certainly. But if there are going to be four of us, I had better make reservations.", + "original_text": "Certainly. But if there are going to be four of us, I had better make reservations.", + "start_time": 22.002323424758202, + "end_time": 26.11225539754732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_5_B.wav", + "silence_duration": 0.44588458523942515, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes. that is a very good idea. It would be a shame if we could not find a place to sit.", + "original_text": "Yes. that is a very good idea. It would be a shame if we could not find a place to sit.", + "start_time": 26.61448422896455, + "end_time": 31.850584002207178, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_6_A.wav", + "silence_duration": 0.5022288314172311, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Then I'II make reservations for 9 pm for a party of four.", + "original_text": "Then I'II make reservations for 9 pm for a party of four.", + "start_time": 32.36376657741472, + "end_time": 35.75387995609953, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_7_B.wav", + "silence_duration": 0.5131825752075425, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'll be there. Oh, is there a cover charge at the bar?", + "original_text": "I'll be there. Oh, is there a cover charge at the bar?", + "start_time": 36.17532920941625, + "end_time": 39.91374190782895, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_8_A.wav", + "silence_duration": 0.42144925331671435, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not that I know of. Why do you ask?", + "original_text": "Not that I know of. Why do you ask?", + "start_time": 40.217842553089426, + "end_time": 42.51661806329351, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_9_B.wav", + "silence_duration": 0.3041006452604763, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I just want to make sure I bring enough money for my date and I. By the way, did you already mention the name of the bar?", + "original_text": "I just want to make sure I bring enough money for my date and I. By the way, did you already mention the name of the bar?", + "start_time": 42.84612266631007, + "end_time": 50.38099794975678, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--108/temp/line_10_A.wav", + "silence_duration": 0.32950460301656975, + "is_interrupted": false + } + ] + }, + "DialogSum--val--109": { + "original_text": "A: ABC Rent-a-Car. May I help you? \nB: I would like to rent a car. What kind of car do you [interrupt] need for your trip? Are you planning to drive long distances or just around the city, and do you have any specific preferences regarding fuel efficiency or seating capacity? \nA: Sorry to interrupt, but I need to know if you are looking for a specific type, like a sedan or an SUV, before I list our options. \nB: I'm actually open to any type, just something economical. \nA: We have Volkswagen, Pinto, Plymouth, and Datsun. \nB: What is the rate? \nA: Twenty dollars per day for Volkswagen, Pinto, and Datsun, and twenty-seven dollars for the Plymouth, which is a bit larger and more comfortable. \nB: Wait, does that include insurance, or is that an extra cost? \nA: Insurance is extra, but I was about to mention that the twenty-seven dollars is for the Plymouth. How about mileage and gas? \nB: Oh, yes, please let me know about that. \nA: There is no charge for mileage. And fill up the gas when you return the car to us as it is not included. \nB: OK. I'll try a Pinto. I want to rent a car for one week. \nA: All right, sir. May I have your driver's license? \nB: Here you are.", + "cleaned_text": "A: ABC Rent-a-Car. May I help you? \nB:I would like to rent a car. What kind of car do you need for your trip? Are you planning to drive long distances or just around the city, and do you have any specific preferences regarding fuel efficiency or seating capacity?\nA: Sorry to interrupt, but I need to know if you are looking for a specific type, like a sedan or an SUV, before I list our options. \nB: I'm actually open to any type, just something economical. \nA: We have Volkswagen, Pinto, Plymouth, and Datsun. \nB: What is the rate? \nA: Twenty dollars per day for Volkswagen, Pinto, and Datsun, and twenty-seven dollars for the Plymouth, which is a bit larger and more comfortable. \nB: Wait, does that include insurance, or is that an extra cost? \nA: Insurance is extra, but I was about to mention that the twenty-seven dollars is for the Plymouth. How about mileage and gas? \nB: Oh, yes, please let me know about that. \nA: There is no charge for mileage. And fill up the gas when you return the car to us as it is not included. \nB: OK. I'll try a Pinto. I want to rent a car for one week. \nA: All right, sir. May I have your driver's license? \nB: Here you are.", + "total_duration": 64.05918367346939, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "ABC Rent-a-Car. May I help you?", + "original_text": "ABC Rent-a-Car. May I help you?", + "start_time": 0, + "end_time": 2.995374149659864, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I would like to rent a car. What kind of car do you", + "original_text": "I would like to rent a car. What kind of car do you [interrupt] need for your trip? Are you planning to drive long distances or just around the city, and do you have any specific preferences regarding fuel efficiency or seating capacity?", + "start_time": 3.435205983891517, + "end_time": 15.37026267323392, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_1_B.wav", + "silence_duration": 0.439831834231653, + "is_interrupted": true, + "text_after_interrupt": "need for your trip? Are you planning to drive long distances or just around the city, and do you have any specific preferences regarding fuel efficiency or seating capacity?" + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but I need to know if you are looking for a specific type, like a sedan or an SUV, before I list our options.", + "original_text": "Sorry to interrupt, but I need to know if you are looking for a specific type, like a sedan or an SUV, before I list our options.", + "start_time": 6.372530246930065, + "end_time": 14.789763807020767, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_2_A.wav", + "silence_duration": 0.34132454540441215, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm actually open to any type, just something economical.", + "original_text": "I'm actually open to any type, just something economical.", + "start_time": 15.79755160511119, + "end_time": 18.63038607223137, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_3_B.wav", + "silence_duration": 0.42728893187726885, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We have Volkswagen, Pinto, Plymouth, and Datsun.", + "original_text": "We have Volkswagen, Pinto, Plymouth, and Datsun.", + "start_time": 19.120034835852053, + "end_time": 22.289558645375863, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_4_A.wav", + "silence_duration": 0.489648763620683, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What is the rate?", + "original_text": "What is the rate?", + "start_time": 22.689429089417583, + "end_time": 23.54856741141305, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_5_B.wav", + "silence_duration": 0.39987044404172023, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Twenty dollars per day for Volkswagen, Pinto, and Datsun, and twenty-seven dollars for the Plymouth, which is a bit larger and more comfortable.", + "original_text": "Twenty dollars per day for Volkswagen, Pinto, and Datsun, and twenty-seven dollars for the Plymouth, which is a bit larger and more comfortable.", + "start_time": 23.890519530355444, + "end_time": 33.46875082287245, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_6_A.wav", + "silence_duration": 0.34195211894239297, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait, does that include insurance, or is that an extra cost?", + "original_text": "Wait, does that include insurance, or is that an extra cost?", + "start_time": 33.879273862700906, + "end_time": 37.13006751349456, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_7_B.wav", + "silence_duration": 0.41052303982845295, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Insurance is extra, but I was about to mention that the twenty-seven dollars is for the Plymouth. How about mileage and gas?", + "original_text": "Insurance is extra, but I was about to mention that the twenty-seven dollars is for the Plymouth. How about mileage and gas?", + "start_time": 37.5562466028276, + "end_time": 45.04468197697726, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_8_A.wav", + "silence_duration": 0.4261790893330428, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, yes, please let me know about that.", + "original_text": "Oh, yes, please let me know about that.", + "start_time": 45.63983666576739, + "end_time": 48.07793190386263, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_9_B.wav", + "silence_duration": 0.595154688790128, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There is no charge for mileage. And fill up the gas when you return the car to us as it is not included.", + "original_text": "There is no charge for mileage. And fill up the gas when you return the car to us as it is not included.", + "start_time": 48.53145399675194, + "end_time": 55.28846079947303, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_10_A.wav", + "silence_duration": 0.4535220928893151, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. I'll try a Pinto. I want to rent a car for one week.", + "original_text": "OK. I'll try a Pinto. I want to rent a car for one week.", + "start_time": 55.62695987958829, + "end_time": 59.28410273673115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_11_B.wav", + "silence_duration": 0.33849908011526597, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "All right, sir. May I have your driver's license?", + "original_text": "All right, sir. May I have your driver's license?", + "start_time": 59.69837603792697, + "end_time": 62.80984996082947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_12_A.wav", + "silence_duration": 0.41427330119581757, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here you are.", + "original_text": "Here you are.", + "start_time": 63.3277956204976, + "end_time": 64.05922419192616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--109/temp/line_13_B.wav", + "silence_duration": 0.5179456596681261, + "is_interrupted": false + } + ] + }, + "DialogSum--val--110": { + "original_text": "A: When in Rome, do as the Romans do, they say. \nB: What do you mean? \nA: Roman is living in Rome, of course. And go to work by car, or bus, or on [interrupt] foot, especially if they live close to their workplace, as it allows them to enjoy the beautiful architecture and vibrant street life along the way. \nB: Sorry to jump in, but do you know if the public transportation there is reliable? I'm considering using it if I visit. \nA: Yes, the public transportation is quite reliable, but I was about to mention that some people also prefer walking. Anyway, Roman really loves life. He knows how to enjoy [interrupt] the simple pleasures, like a stroll through the city or a coffee at a local café, which are often accompanied by lively conversations with friends and neighbors. \nB: Speaking of enjoying life, do you know any good spots in Rome where I can experience authentic Roman cuisine? \nA: Not always. But they like a good meal. Actually, I forgot to mention earlier, they also enjoy walking to work when the weather is nice. \nB: Really? So how can I go there to have a taste? \nA: By air, of course.", + "cleaned_text": "A: When in Rome, do as the Romans do, they say. \nB: What do you mean? \nA:Roman is living in Rome, of course. And go to work by car, or bus, or on foot, especially if they live close to their workplace, as it allows them to enjoy the beautiful architecture and vibrant street life along the way.\nB: Sorry to jump in, but do you know if the public transportation there is reliable? I'm considering using it if I visit. \nA:Yes, the public transportation is quite reliable, but I was about to mention that some people also prefer walking. Anyway, Roman really loves life. He knows how to enjoy the simple pleasures, like a stroll through the city or a coffee at a local café, which are often accompanied by lively conversations with friends and neighbors.\nB: Speaking of enjoying life, do you know any good spots in Rome where I can experience authentic Roman cuisine? \nA: Not always. But they like a good meal. Actually, I forgot to mention earlier, they also enjoy walking to work when the weather is nice. \nB: Really? So how can I go there to have a taste? \nA: By air, of course.", + "total_duration": 54.881133786848075, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "When in Rome, do as the Romans do, they say.", + "original_text": "When in Rome, do as the Romans do, they say.", + "start_time": 0, + "end_time": 2.8908843537414968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What do you mean?", + "original_text": "What do you mean?", + "start_time": 3.326095835904999, + "end_time": 4.080744361982097, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_1_B.wav", + "silence_duration": 0.43521148216350225, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Roman is living in Rome, of course. And go to work by car, or bus, or on", + "original_text": "Roman is living in Rome, of course. And go to work by car, or bus, or on [interrupt] foot, especially if they live close to their workplace, as it allows them to enjoy the beautiful architecture and vibrant street life along the way.", + "start_time": 4.571151680376995, + "end_time": 17.748475943415542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_2_A.wav", + "silence_duration": 0.4904073183948984, + "is_interrupted": true, + "text_after_interrupt": "foot, especially if they live close to their workplace, as it allows them to enjoy the beautiful architecture and vibrant street life along the way." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you know if the public transportation there is reliable? I'm considering using it if I visit.", + "original_text": "Sorry to jump in, but do you know if the public transportation there is reliable? I'm considering using it if I visit.", + "start_time": 10.445800206454091, + "end_time": 16.575868233664977, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_3_B.wav", + "silence_duration": 0.5790838794231798, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, the public transportation is quite reliable, but I was about to mention that some people also prefer walking. Anyway, Roman really loves life. He knows how to enjoy", + "original_text": "Yes, the public transportation is quite reliable, but I was about to mention that some people also prefer walking. Anyway, Roman really loves life. He knows how to enjoy [interrupt] the simple pleasures, like a stroll through the city or a coffee at a local café, which are often accompanied by lively conversations with friends and neighbors.", + "start_time": 18.172795807454158, + "end_time": 38.281276533077744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_4_A.wav", + "silence_duration": 0.42431986403861366, + "is_interrupted": true, + "text_after_interrupt": "the simple pleasures, like a stroll through the city or a coffee at a local café, which are often accompanied by lively conversations with friends and neighbors." + }, + { + "speaker": "B", + "text": "Speaking of enjoying life, do you know any good spots in Rome where I can experience authentic Roman cuisine?", + "original_text": "Speaking of enjoying life, do you know any good spots in Rome where I can experience authentic Roman cuisine?", + "start_time": 35.597492816676684, + "end_time": 41.05418215908031, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_5_B.wav", + "silence_duration": 0.5574189984334239, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not always. But they like a good meal. Actually, I forgot to mention earlier, they also enjoy walking to work when the weather is nice.", + "original_text": "Not always. But they like a good meal. Actually, I forgot to mention earlier, they also enjoy walking to work when the weather is nice.", + "start_time": 41.62809719707916, + "end_time": 49.99889084787281, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_6_A.wav", + "silence_duration": 0.5739150379988452, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Really? So how can I go there to have a taste?", + "original_text": "Really? So how can I go there to have a taste?", + "start_time": 50.53494733632366, + "end_time": 53.08914234766153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_7_B.wav", + "silence_duration": 0.536056488450852, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "By air, of course.", + "original_text": "By air, of course.", + "start_time": 53.464735854944834, + "end_time": 54.881153088504924, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--110/temp/line_8_A.wav", + "silence_duration": 0.37559350728330876, + "is_interrupted": false + } + ] + }, + "DialogSum--val--111": { + "original_text": "A: Jenny, you look terrible. What's eating you? \nB: Don't worry about me, it's just been a rough day dealing with [interrupt] multiple deadlines at work and some personal issues that have been weighing heavily on my mind lately. \nA: Sorry to interrupt, but I just want to know if there's anything I can do to help. \nB: Hey, Chillon, I'm just trying to help. \nA: Sorry, Sally, it's not your fault. \nB: So, what's the problem? \nA: I drew a blank on ~ about the test. \nB: No kidding! Didn't you study for it? \nA: Yeah, but nothing was clear during the test. \nB: That's too bad, anyway, I'm sure things will turn around next week if you keep at it and [interrupt] focus on developing better study habits while also seeking help from tutors or study groups when needed. \nA: Wait, did you mean next semester? Because I was actually thinking of dropping out. \nB: You can't do that, Jenny! \nA: I'm dead serious about this, Sally.", + "cleaned_text": "A: Jenny, you look terrible. What's eating you? \nB:Don't worry about me, it's just been a rough day dealing with multiple deadlines at work and some personal issues that have been weighing heavily on my mind lately.\nA: Sorry to interrupt, but I just want to know if there's anything I can do to help. \nB: Hey, Chillon, I'm just trying to help. \nA: Sorry, Sally, it's not your fault. \nB: So, what's the problem? \nA: I drew a blank on ~ about the test. \nB: No kidding! Didn't you study for it? \nA: Yeah, but nothing was clear during the test. \nB:That's too bad, anyway, I'm sure things will turn around next week if you keep at it and focus on developing better study habits while also seeking help from tutors or study groups when needed.\nA: Wait, did you mean next semester? Because I was actually thinking of dropping out. \nB: You can't do that, Jenny! \nA: I'm dead serious about this, Sally.", + "total_duration": 47.87795918367347, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Jenny, you look terrible. What's eating you?", + "original_text": "Jenny, you look terrible. What's eating you?", + "start_time": 0, + "end_time": 2.8560544217687074, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't worry about me, it's just been a rough day dealing with", + "original_text": "Don't worry about me, it's just been a rough day dealing with [interrupt] multiple deadlines at work and some personal issues that have been weighing heavily on my mind lately.", + "start_time": 3.4429385519334024, + "end_time": 10.977813835380115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_1_B.wav", + "silence_duration": 0.586884130164695, + "is_interrupted": true, + "text_after_interrupt": "multiple deadlines at work and some personal issues that have been weighing heavily on my mind lately." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but I just want to know if there's anything I can do to help.", + "original_text": "Sorry to interrupt, but I just want to know if there's anything I can do to help.", + "start_time": 6.298992973702109, + "end_time": 11.674412474835897, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_2_A.wav", + "silence_duration": 0.34202304523445853, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hey, Chillon, I'm just trying to help.", + "original_text": "Hey, Chillon, I'm just trying to help.", + "start_time": 12.04074819126265, + "end_time": 14.351133678790996, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_3_B.wav", + "silence_duration": 0.3663357164267543, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, Sally, it's not your fault.", + "original_text": "Sorry, Sally, it's not your fault.", + "start_time": 14.689473146136889, + "end_time": 17.243668157474758, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_4_A.wav", + "silence_duration": 0.33833946734589265, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "So, what's the problem?", + "original_text": "So, what's the problem?", + "start_time": 17.703541836954862, + "end_time": 19.015469274596587, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_5_B.wav", + "silence_duration": 0.4598736794801041, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I drew a blank on ~ about the test.", + "original_text": "I drew a blank on ~ about the test.", + "start_time": 19.561577658383822, + "end_time": 21.999672896479062, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_6_A.wav", + "silence_duration": 0.546108383787234, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No kidding! Didn't you study for it?", + "original_text": "No kidding! Didn't you study for it?", + "start_time": 22.440634531226056, + "end_time": 24.193741107189776, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_7_B.wav", + "silence_duration": 0.440961634746993, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, but nothing was clear during the test.", + "original_text": "Yeah, but nothing was clear during the test.", + "start_time": 24.782275120822653, + "end_time": 27.754429315833992, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_8_A.wav", + "silence_duration": 0.5885340136328763, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's too bad, anyway, I'm sure things will turn around next week if you keep at it and", + "original_text": "That's too bad, anyway, I'm sure things will turn around next week if you keep at it and [interrupt] focus on developing better study habits while also seeking help from tutors or study groups when needed.", + "start_time": 28.123587437421424, + "end_time": 38.1197779136119, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_9_B.wav", + "silence_duration": 0.36915812158743344, + "is_interrupted": true, + "text_after_interrupt": "focus on developing better study habits while also seeking help from tutors or study groups when needed." + }, + { + "speaker": "A", + "text": "Wait, did you mean next semester? Because I was actually thinking of dropping out.", + "original_text": "Wait, did you mean next semester? Because I was actually thinking of dropping out.", + "start_time": 37.48717984100991, + "end_time": 43.22250863919585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_10_A.wav", + "silence_duration": 0.3740723295225749, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You can't do that, Jenny!", + "original_text": "You can't do that, Jenny!", + "start_time": 43.79715015268753, + "end_time": 45.05102770370794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_11_B.wav", + "silence_duration": 0.5746415134916767, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm dead serious about this, Sally.", + "original_text": "I'm dead serious about this, Sally.", + "start_time": 45.625668349640215, + "end_time": 47.878003950547246, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--111/temp/line_12_A.wav", + "silence_duration": 0.5746406459322776, + "is_interrupted": false + } + ] + }, + "DialogSum--val--112": { + "original_text": "A: You honestly believe the world's improving every year? \nB: Yes, I do. I think that science is making us wiser. What do you think about the role of science in society's progress? \nA: Sorry to jump in, but when you say \"wiser,\" do you mean in terms of knowledge or decision-making? \nB: Both, actually. With advances in education and technology, people have more access to information and tools that help them make better decisions. But I was asking what you think about that. \nA: I don't think you're right there. \nB: I believe industry is making us wealthier. \nA: I don't believe that. And in my opinion, medicine is making us [interrupt] live longer and healthier lives, which is a significant improvement that has been consistently demonstrated through global health statistics and increasing life expectancy trends. \nB: Healthier, right? I agree with you in that sense. But we're all more miserable than ever, aren't we? \nA: I don't agree with you. I maintain that we're healthier, wealthier and wiser than we were a hundred years ago.", + "cleaned_text": "A: You honestly believe the world's improving every year? \nB: Yes, I do. I think that science is making us wiser. What do you think about the role of science in society's progress? \nA: Sorry to jump in, but when you say \"wiser,\" do you mean in terms of knowledge or decision-making? \nB: Both, actually. With advances in education and technology, people have more access to information and tools that help them make better decisions. But I was asking what you think about that. \nA: I don't think you're right there. \nB: I believe industry is making us wealthier. \nA:I don't believe that. And in my opinion, medicine is making us live longer and healthier lives, which is a significant improvement that has been consistently demonstrated through global health statistics and increasing life expectancy trends.\nB: Healthier, right? I agree with you in that sense. But we're all more miserable than ever, aren't we? \nA: I don't agree with you. I maintain that we're healthier, wealthier and wiser than we were a hundred years ago.", + "total_duration": 52.38290249433106, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You honestly believe the world's improving every year?", + "original_text": "You honestly believe the world's improving every year?", + "start_time": 0, + "end_time": 3.01859410430839, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I do. I think that science is making us wiser. What do you think about the role of science in society's progress?", + "original_text": "Yes, I do. I think that science is making us wiser. What do you think about the role of science in society's progress?", + "start_time": 3.5130933475814516, + "end_time": 9.991460694520228, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_1_B.wav", + "silence_duration": 0.4944992432730615, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry to jump in, but when you say \"wiser,\" do you mean in terms of knowledge or decision-making?", + "original_text": "Sorry to jump in, but when you say \"wiser,\" do you mean in terms of knowledge or decision-making?", + "start_time": 10.323554879849327, + "end_time": 16.44201292973595, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_2_A.wav", + "silence_duration": 0.3320941853290998, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Both, actually. With advances in education and technology, people have more access to information and tools that help them make better decisions. But I was asking what you think about that.", + "original_text": "Both, actually. With advances in education and technology, people have more access to information and tools that help them make better decisions. But I was asking what you think about that.", + "start_time": 17.02464614421814, + "end_time": 26.858296937868932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_3_B.wav", + "silence_duration": 0.5826332144821882, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't think you're right there.", + "original_text": "I don't think you're right there.", + "start_time": 27.328516922798556, + "end_time": 29.000353657492433, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_4_A.wav", + "silence_duration": 0.4702199849296236, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I believe industry is making us wealthier.", + "original_text": "I believe industry is making us wealthier.", + "start_time": 29.457383391107232, + "end_time": 31.70971899201426, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_5_B.wav", + "silence_duration": 0.4570297336147997, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't believe that. And in my opinion, medicine is making us", + "original_text": "I don't believe that. And in my opinion, medicine is making us [interrupt] live longer and healthier lives, which is a significant improvement that has been consistently demonstrated through global health statistics and increasing life expectancy trends.", + "start_time": 32.02276857681786, + "end_time": 45.560002136908565, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_6_A.wav", + "silence_duration": 0.313049584803604, + "is_interrupted": true, + "text_after_interrupt": "live longer and healthier lives, which is a significant improvement that has been consistently demonstrated through global health statistics and increasing life expectancy trends." + }, + { + "speaker": "B", + "text": "Healthier, right? I agree with you in that sense. But we're all more miserable than ever, aren't we?", + "original_text": "Healthier, right? I agree with you in that sense. But we're all more miserable than ever, aren't we?", + "start_time": 36.07465066298566, + "end_time": 40.788301456636454, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_7_B.wav", + "silence_duration": 0.5038880190568945, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't agree with you. I maintain that we're healthier, wealthier and wiser than we were a hundred years ago.", + "original_text": "I don't agree with you. I maintain that we're healthier, wealthier and wiser than we were a hundred years ago.", + "start_time": 46.06710056576682, + "end_time": 52.382928230165916, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--112/temp/line_8_A.wav", + "silence_duration": 0.5070984288582535, + "is_interrupted": false + } + ] + }, + "DialogSum--val--114": { + "original_text": "A: Hi Mary, how's it going? \nB: Well, last night I had a big argument with Ann. \nA: Terrible. It must be something serious. You two are such close friends. \nB: Now that I look back at it, it wasn't that big a deal. I shouldn't have [interrupt] let my emotions get the best of me and reacted so strongly without considering her perspective first. \nA: What happened? I mean, you two are usually so good at resolving things. \nB: It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere she called me up, said her boyfriend had made plans and that she [interrupt] wanted to spend time with him instead because they haven't seen each other in weeks due to his busy work schedule. \nA: Wait, so she just canceled on you because of her boyfriend? That's pretty harsh. \nB: I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says? \nA: You know she probably feels just as bad. But, what was she planning to do with him anyway? \nB: Well, I think I was being a little selfish myself. I know they don't get to see each other very often. \nA: Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want. \nB: Yeah, I'll call her later to patch things up.", + "cleaned_text": "A: Hi Mary, how's it going? \nB: Well, last night I had a big argument with Ann. \nA: Terrible. It must be something serious. You two are such close friends. \nB:Now that I look back at it, it wasn't that big a deal. I shouldn't have let my emotions get the best of me and reacted so strongly without considering her perspective first.\nA: What happened? I mean, you two are usually so good at resolving things. \nB:It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere she called me up, said her boyfriend had made plans and that she wanted to spend time with him instead because they haven't seen each other in weeks due to his busy work schedule.\nA: Wait, so she just canceled on you because of her boyfriend? That's pretty harsh. \nB: I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says? \nA: You know she probably feels just as bad. But, what was she planning to do with him anyway? \nB: Well, I think I was being a little selfish myself. I know they don't get to see each other very often. \nA: Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want. \nB: Yeah, I'll call her later to patch things up.", + "total_duration": 70.73106575963719, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi Mary, how's it going?", + "original_text": "Hi Mary, how's it going?", + "start_time": 0, + "end_time": 1.555736961451247, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, last night I had a big argument with Ann.", + "original_text": "Well, last night I had a big argument with Ann.", + "start_time": 2.049562665848381, + "end_time": 4.743077405077406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_1_B.wav", + "silence_duration": 0.49382570439713397, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Terrible. It must be something serious. You two are such close friends.", + "original_text": "Terrible. It must be something serious. You two are such close friends.", + "start_time": 5.261059658983452, + "end_time": 10.055980293904087, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_2_A.wav", + "silence_duration": 0.5179822539060459, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Now that I look back at it, it wasn't that big a deal. I shouldn't have", + "original_text": "Now that I look back at it, it wasn't that big a deal. I shouldn't have [interrupt] let my emotions get the best of me and reacted so strongly without considering her perspective first.", + "start_time": 10.414780775834078, + "end_time": 18.924894154518885, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_3_B.wav", + "silence_duration": 0.35880048192999225, + "is_interrupted": true, + "text_after_interrupt": "let my emotions get the best of me and reacted so strongly without considering her perspective first." + }, + { + "speaker": "A", + "text": "What happened? I mean, you two are usually so good at resolving things.", + "original_text": "What happened? I mean, you two are usually so good at resolving things.", + "start_time": 14.350563088759248, + "end_time": 19.319633383543827, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_4_A.wav", + "silence_duration": 0.5102074609086429, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere she called me up, said her boyfriend had made plans and that she", + "original_text": "It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere she called me up, said her boyfriend had made plans and that she [interrupt] wanted to spend time with him instead because they haven't seen each other in weeks due to his busy work schedule.", + "start_time": 19.901581815627758, + "end_time": 34.07736412855293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_5_B.wav", + "silence_duration": 0.5819484320839284, + "is_interrupted": true, + "text_after_interrupt": "wanted to spend time with him instead because they haven't seen each other in weeks due to his busy work schedule." + }, + { + "speaker": "A", + "text": "Wait, so she just canceled on you because of her boyfriend? That's pretty harsh.", + "original_text": "Wait, so she just canceled on you because of her boyfriend? That's pretty harsh.", + "start_time": 33.604979134695036, + "end_time": 38.34184988299435, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_6_A.wav", + "silence_duration": 0.5847550636919706, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says?", + "original_text": "I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says?", + "start_time": 38.917751457611374, + "end_time": 44.432490686636314, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_7_B.wav", + "silence_duration": 0.5759015746170212, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You know she probably feels just as bad. But, what was she planning to do with him anyway?", + "original_text": "You know she probably feels just as bad. But, what was she planning to do with him anyway?", + "start_time": 45.02736768949368, + "end_time": 50.46083707724878, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_8_A.wav", + "silence_duration": 0.5948770028573689, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I think I was being a little selfish myself. I know they don't get to see each other very often.", + "original_text": "Well, I think I was being a little selfish myself. I know they don't get to see each other very often.", + "start_time": 50.909323740678936, + "end_time": 56.28474324181272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_9_B.wav", + "silence_duration": 0.44848666343014904, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want.", + "original_text": "Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want.", + "start_time": 56.8261141861658, + "end_time": 67.8207627122429, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_10_A.wav", + "silence_duration": 0.5413709443530839, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I'll call her later to patch things up.", + "original_text": "Yeah, I'll call her later to patch things up.", + "start_time": 68.21171398991031, + "end_time": 70.73107906927538, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--114/temp/line_11_B.wav", + "silence_duration": 0.39095127766741217, + "is_interrupted": false + } + ] + }, + "DialogSum--val--115": { + "original_text": "A: Hello, Neal. How are you? \nB: I'm fine, thanks. And you? \nA: Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been doing [interrupt] working on lately? I've been really curious about your projects since we last met, especially with all the technological advancements happening these days. \nB: Oh, actually, before I forget, I wanted to ask you—have you heard about the new AI research project at the university? \nA: Not yet, but it sounds interesting! Anyway, I was saying, I went to Singapore to study for a period. \nB: Wow, that's great. What have you been studying? \nA: Natural language processing. \nB: Oh, that's hard. I've been studying for my exams. My school exams will [interrupt] be quite challenging this time because they've introduced new topics and the syllabus has been expanded significantly compared to previous years. \nA: Speaking of exams, do you know if the NLP course has any prerequisites? I'm considering taking it next semester. \nB: The course I took didn't have any specific prerequisites, but it's good to have some background in machine learning. By the way, my school exams will begin next month. \nA: Really? Good luck with them. \nB: Thanks. And how are your parents? \nA: They're both very well, thanks. \nB: Where are you going now? \nA: I'm going to read some papers and then attend a seminar. Why don't you come with me?", + "cleaned_text": "A: Hello, Neal. How are you? \nB: I'm fine, thanks. And you? \nA:Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been doing working on lately? I've been really curious about your projects since we last met, especially with all the technological advancements happening these days.\nB: Oh, actually, before I forget, I wanted to ask you—have you heard about the new AI research project at the university? \nA: Not yet, but it sounds interesting! Anyway, I was saying, I went to Singapore to study for a period. \nB: Wow, that's great. What have you been studying? \nA: Natural language processing. \nB:Oh, that's hard. I've been studying for my exams. My school exams will be quite challenging this time because they've introduced new topics and the syllabus has been expanded significantly compared to previous years.\nA: Speaking of exams, do you know if the NLP course has any prerequisites? I'm considering taking it next semester. \nB: The course I took didn't have any specific prerequisites, but it's good to have some background in machine learning. By the way, my school exams will begin next month. \nA: Really? Good luck with them. \nB: Thanks. And how are your parents? \nA: They're both very well, thanks. \nB: Where are you going now? \nA: I'm going to read some papers and then attend a seminar. Why don't you come with me?", + "total_duration": 73.54294784580499, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, Neal. How are you?", + "original_text": "Hello, Neal. How are you?", + "start_time": 0, + "end_time": 2.089795918367347, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm fine, thanks. And you?", + "original_text": "I'm fine, thanks. And you?", + "start_time": 2.476369353434933, + "end_time": 4.171426042777337, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_1_B.wav", + "silence_duration": 0.3865734350675858, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been doing", + "original_text": "Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been doing [interrupt] working on lately? I've been really curious about your projects since we last met, especially with all the technological advancements happening these days.", + "start_time": 4.5142518927363255, + "end_time": 19.723322187520907, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_2_A.wav", + "silence_duration": 0.3428258499589885, + "is_interrupted": true, + "text_after_interrupt": "working on lately? I've been really curious about your projects since we last met, especially with all the technological advancements happening these days." + }, + { + "speaker": "B", + "text": "Oh, actually, before I forget, I wanted to ask you—have you heard about the new AI research project at the university?", + "original_text": "Oh, actually, before I forget, I wanted to ask you—have you heard about the new AI research project at the university?", + "start_time": 10.551440101353105, + "end_time": 16.820827856455146, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_3_B.wav", + "silence_duration": 0.39795239190808795, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not yet, but it sounds interesting! Anyway, I was saying, I went to Singapore to study for a period.", + "original_text": "Not yet, but it sounds interesting! Anyway, I was saying, I went to Singapore to study for a period.", + "start_time": 20.137702394204034, + "end_time": 26.61606974114281, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_4_A.wav", + "silence_duration": 0.4143802066831283, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wow, that's great. What have you been studying?", + "original_text": "Wow, that's great. What have you been studying?", + "start_time": 27.17188342077558, + "end_time": 29.66802854549213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_5_B.wav", + "silence_duration": 0.555813679632771, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Natural language processing.", + "original_text": "Natural language processing.", + "start_time": 30.029256973168945, + "end_time": 31.759143594484136, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_6_A.wav", + "silence_duration": 0.3612284276768145, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, that's hard. I've been studying for my exams. My school exams will", + "original_text": "Oh, that's hard. I've been studying for my exams. My school exams will [interrupt] be quite challenging this time because they've introduced new topics and the syllabus has been expanded significantly compared to previous years.", + "start_time": 32.342609611225996, + "end_time": 43.69716743435525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_7_B.wav", + "silence_duration": 0.5834660167418575, + "is_interrupted": true, + "text_after_interrupt": "be quite challenging this time because they've introduced new topics and the syllabus has been expanded significantly compared to previous years." + }, + { + "speaker": "A", + "text": "Speaking of exams, do you know if the NLP course has any prerequisites? I'm considering taking it next semester.", + "original_text": "Speaking of exams, do you know if the NLP course has any prerequisites? I'm considering taking it next semester.", + "start_time": 43.12044439748492, + "end_time": 51.49123804827857, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_8_A.wav", + "silence_duration": 0.3624957544514108, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The course I took didn't have any specific prerequisites, but it's good to have some background in machine learning. By the way, my school exams will begin next month.", + "original_text": "The course I took didn't have any specific prerequisites, but it's good to have some background in machine learning. By the way, my school exams will begin next month.", + "start_time": 51.929637098909495, + "end_time": 59.859251611381154, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_9_B.wav", + "silence_duration": 0.4383990506309279, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Really? Good luck with them.", + "original_text": "Really? Good luck with them.", + "start_time": 60.19412683111997, + "end_time": 61.97045336173222, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_10_A.wav", + "silence_duration": 0.3348752197388179, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks. And how are your parents?", + "original_text": "Thanks. And how are your parents?", + "start_time": 62.48864711565563, + "end_time": 64.34624348753772, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_11_B.wav", + "silence_duration": 0.5181937539234108, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They're both very well, thanks.", + "original_text": "They're both very well, thanks.", + "start_time": 64.75019337055524, + "end_time": 66.50329994651895, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_12_A.wav", + "silence_duration": 0.4039498830175198, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Where are you going now?", + "original_text": "Where are you going now?", + "start_time": 67.00556324325858, + "end_time": 68.25944079427899, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_13_B.wav", + "silence_duration": 0.5022632967396294, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm going to read some papers and then attend a seminar. Why don't you come with me?", + "original_text": "I'm going to read some papers and then attend a seminar. Why don't you come with me?", + "start_time": 68.72484745267005, + "end_time": 73.54298804223922, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--115/temp/line_14_A.wav", + "silence_duration": 0.46540665839106743, + "is_interrupted": false + } + ] + }, + "DialogSum--val--116": { + "original_text": "A: Susan, Is the manager in this office? \nB: Yes. But he is meeting a client. \nA: Oh, that's too bad. I just got a phone call saying that my wife is now in the hospital. She is going to deliver a baby. I must take the day off to go to the hospital. May I [interrupt] leave immediately after informing him about this family emergency situation and assure him that I'll complete all pending tasks as soon as I return?\nB: Oh, congratulations! But it might be difficult to speak to him directly right now. I could convey your leave to him after the client goes. \nA: Thanks, I appreciate that. But I wanted to ask him directly because I need to make sure it's approved immediately. Could you also let him know that I [interrupt] will be away for the rest of the day and possibly tomorrow depending on how the delivery goes and that my colleague John has agreed to cover my urgent tasks?\nB: I understand. I'll make it a priority to inform him as soon as possible. But what else should I tell him besides your leave request? \nA: Please let him know that I'll be reachable by phone in case of any urgent issues.", + "cleaned_text": "A: Susan, Is the manager in this office? \nB: Yes. But he is meeting a client. \nA:Oh, that's too bad. I just got a phone call saying that my wife is now in the hospital. She is going to deliver a baby. I must take the day off to go to the hospital. May I leave immediately after informing him about this family emergency situation and assure him that I'll complete all pending tasks as soon as I return?\nB: Oh, congratulations! But it might be difficult to speak to him directly right now. I could convey your leave to him after the client goes. \nA:Thanks, I appreciate that. But I wanted to ask him directly because I need to make sure it's approved immediately. Could you also let him know that I will be away for the rest of the day and possibly tomorrow depending on how the delivery goes and that my colleague John has agreed to cover my urgent tasks?\nB: I understand. I'll make it a priority to inform him as soon as possible. But what else should I tell him besides your leave request? \nA: Please let him know that I'll be reachable by phone in case of any urgent issues.", + "total_duration": 52.92961451247166, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Susan, Is the manager in this office?", + "original_text": "Susan, Is the manager in this office?", + "start_time": 0, + "end_time": 2.8792743764172335, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. But he is meeting a client.", + "original_text": "Yes. But he is meeting a client.", + "start_time": 3.314707567636048, + "end_time": 5.114254052896818, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/temp/line_1_B.wav", + "silence_duration": 0.4354331912188145, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that's too bad. I just got a phone call saying that my wife is now in the hospital. She is going to deliver a baby. I must take the day off to go to the hospital. May I", + "original_text": "Oh, that's too bad. I just got a phone call saying that my wife is now in the hospital. She is going to deliver a baby. I must take the day off to go to the hospital. May I [interrupt] leave immediately after informing him about this family emergency situation and assure him that I'll complete all pending tasks as soon as I return?", + "start_time": 5.479310178242051, + "end_time": 24.29908342087244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/temp/line_2_A.wav", + "silence_duration": 0.36505612534523324, + "is_interrupted": true, + "text_after_interrupt": "leave immediately after informing him about this family emergency situation and assure him that I'll complete all pending tasks as soon as I return?" + }, + { + "speaker": "B", + "text": "Oh, congratulations! But it might be difficult to speak to him directly right now. I could convey your leave to him after the client goes.", + "original_text": "Oh, congratulations! But it might be difficult to speak to him directly right now. I could convey your leave to him after the client goes.", + "start_time": 15.591600427675157, + "end_time": 22.871056209988083, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/temp/line_3_B.wav", + "silence_duration": 0.5821146823898338, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks, I appreciate that. But I wanted to ask him directly because I need to make sure it's approved immediately. Could you also let him know that I", + "original_text": "Thanks, I appreciate that. But I wanted to ask him directly because I need to make sure it's approved immediately. Could you also let him know that I [interrupt] will be away for the rest of the day and possibly tomorrow depending on how the delivery goes and that my colleague John has agreed to cover my urgent tasks?", + "start_time": 24.679233899793076, + "end_time": 42.488939115212574, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/temp/line_4_A.wav", + "silence_duration": 0.3801504789206361, + "is_interrupted": true, + "text_after_interrupt": "will be away for the rest of the day and possibly tomorrow depending on how the delivery goes and that my colleague John has agreed to cover my urgent tasks?" + }, + { + "speaker": "B", + "text": "I understand. I'll make it a priority to inform him as soon as possible. But what else should I tell him besides your leave request?", + "original_text": "I understand. I'll make it a priority to inform him as soon as possible. But what else should I tell him besides your leave request?", + "start_time": 41.680852793245066, + "end_time": 48.15922014018384, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/temp/line_5_B.wav", + "silence_duration": 0.3825947561854628, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Please let him know that I'll be reachable by phone in case of any urgent issues.", + "original_text": "Please let him know that I'll be reachable by phone in case of any urgent issues.", + "start_time": 48.57590781614903, + "end_time": 52.929649312747664, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--116/temp/line_6_A.wav", + "silence_duration": 0.41668767596518724, + "is_interrupted": false + } + ] + }, + "DialogSum--val--117": { + "original_text": "A: I'm looking for a pan I can use in my kitchen. \nB: What size pan were you thinking of? \nA: I've already got a small pan. I need a big [interrupt] one for cooking larger meals, especially when we have guests over, and it should be durable enough to handle frequent use without warping or losing its shape. \nB: Sorry to jump in, but do you have any specific material in mind? Like stainless steel or non-stick? \nA: I hadn't thought about that yet. But actually, I do prefer non-stick. Well, this one might work for you. \nB: Oh, no, that's way too heavy a pan for me. \nA: Here, lift this aluminum pan. It's the same size. \nB: Yes, it's very lightweight. But I don't want this aluminum handle. \nA: Here's a similar aluminum pan. But it has a heat-resistant handle. \nB: Oh, this feels very nice. It's perfect. I'll take it. \nA: I knew we'd find the right pan sooner or later. How would you like to pay? \nB: Cash. But first, I need a lid for [interrupt] this pan because I like to cover my dishes while cooking to retain moisture and ensure even heat distribution throughout the cooking process. \nA: Oh, right, I almost forgot to ask—did you still want a big pan or was this size sufficient? \nB: This size is fine. But yes, I still need a lid for this pan. \nA: Oh, no problem. Here's the lid that comes with the pan.", + "cleaned_text": "A: I'm looking for a pan I can use in my kitchen. \nB: What size pan were you thinking of? \nA:I've already got a small pan. I need a big one for cooking larger meals, especially when we have guests over, and it should be durable enough to handle frequent use without warping or losing its shape.\nB: Sorry to jump in, but do you have any specific material in mind? Like stainless steel or non-stick? \nA: I hadn't thought about that yet. But actually, I do prefer non-stick. Well, this one might work for you. \nB: Oh, no, that's way too heavy a pan for me. \nA: Here, lift this aluminum pan. It's the same size. \nB: Yes, it's very lightweight. But I don't want this aluminum handle. \nA: Here's a similar aluminum pan. But it has a heat-resistant handle. \nB: Oh, this feels very nice. It's perfect. I'll take it. \nA: I knew we'd find the right pan sooner or later. How would you like to pay? \nB:Cash. But first, I need a lid for this pan because I like to cover my dishes while cooking to retain moisture and ensure even heat distribution throughout the cooking process.\nA: Oh, right, I almost forgot to ask—did you still want a big pan or was this size sufficient? \nB: This size is fine. But yes, I still need a lid for this pan. \nA: Oh, no problem. Here's the lid that comes with the pan.", + "total_duration": 72.12566893424037, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm looking for a pan I can use in my kitchen.", + "original_text": "I'm looking for a pan I can use in my kitchen.", + "start_time": 0, + "end_time": 2.7980045351473923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What size pan were you thinking of?", + "original_text": "What size pan were you thinking of?", + "start_time": 3.285069987989317, + "end_time": 5.154276337195666, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_1_B.wav", + "silence_duration": 0.4870654528419246, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I've already got a small pan. I need a big", + "original_text": "I've already got a small pan. I need a big [interrupt] one for cooking larger meals, especially when we have guests over, and it should be durable enough to handle frequent use without warping or losing its shape.", + "start_time": 5.676676778494419, + "end_time": 17.867152968970608, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_2_A.wav", + "silence_duration": 0.5224004412987527, + "is_interrupted": true, + "text_after_interrupt": "one for cooking larger meals, especially when we have guests over, and it should be durable enough to handle frequent use without warping or losing its shape." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you have any specific material in mind? Like stainless steel or non-stick?", + "original_text": "Sorry to jump in, but do you have any specific material in mind? Like stainless steel or non-stick?", + "start_time": 8.69527088280281, + "end_time": 14.569919408879906, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_3_B.wav", + "silence_duration": 0.5293517379301216, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I hadn't thought about that yet. But actually, I do prefer non-stick. Well, this one might work for you.", + "original_text": "I hadn't thought about that yet. But actually, I do prefer non-stick. Well, this one might work for you.", + "start_time": 18.266021721992523, + "end_time": 25.25522807119887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_4_A.wav", + "silence_duration": 0.3988687530219154, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, no, that's way too heavy a pan for me.", + "original_text": "Oh, no, that's way too heavy a pan for me.", + "start_time": 25.641141471976745, + "end_time": 27.754157344992617, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_5_B.wav", + "silence_duration": 0.38591340077787434, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Here, lift this aluminum pan. It's the same size.", + "original_text": "Here, lift this aluminum pan. It's the same size.", + "start_time": 28.181231260642264, + "end_time": 31.652614480596913, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_6_A.wav", + "silence_duration": 0.42707391564964803, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's very lightweight. But I don't want this aluminum handle.", + "original_text": "Yes, it's very lightweight. But I don't want this aluminum handle.", + "start_time": 31.959283169583315, + "end_time": 35.19846684305271, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_7_B.wav", + "silence_duration": 0.30666868898640354, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Here's a similar aluminum pan. But it has a heat-resistant handle.", + "original_text": "Here's a similar aluminum pan. But it has a heat-resistant handle.", + "start_time": 35.73122320723197, + "end_time": 40.10818465847913, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_8_A.wav", + "silence_duration": 0.532756364179264, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, this feels very nice. It's perfect. I'll take it.", + "original_text": "Oh, this feels very nice. It's perfect. I'll take it.", + "start_time": 40.468528914127575, + "end_time": 43.66127267829991, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_9_B.wav", + "silence_duration": 0.36034425564844436, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I knew we'd find the right pan sooner or later. How would you like to pay?", + "original_text": "I knew we'd find the right pan sooner or later. How would you like to pay?", + "start_time": 44.09043540330973, + "end_time": 48.420956945259846, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_10_A.wav", + "silence_duration": 0.4291627250098211, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Cash. But first, I need a lid for", + "original_text": "Cash. But first, I need a lid for [interrupt] this pan because I like to cover my dishes while cooking to retain moisture and ensure even heat distribution throughout the cooking process.", + "start_time": 48.76320290857959, + "end_time": 58.062794745314285, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_11_B.wav", + "silence_duration": 0.342245963319747, + "is_interrupted": true, + "text_after_interrupt": "this pan because I like to cover my dishes while cooking to retain moisture and ensure even heat distribution throughout the cooking process." + }, + { + "speaker": "A", + "text": "Oh, right, I almost forgot to ask—did you still want a big pan or was this size sufficient?", + "original_text": "Oh, right, I almost forgot to ask—did you still want a big pan or was this size sufficient?", + "start_time": 58.1083175529138, + "end_time": 63.82042639645122, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_12_A.wav", + "silence_duration": 0.3282547100655181, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "This size is fine. But yes, I still need a lid for this pan.", + "original_text": "This size is fine. But yes, I still need a lid for this pan.", + "start_time": 64.19097558071668, + "end_time": 67.96421821110216, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_13_B.wav", + "silence_duration": 0.37054918426546146, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, no problem. Here's the lid that comes with the pan.", + "original_text": "Oh, no problem. Here's the lid that comes with the pan.", + "start_time": 68.45691799818877, + "end_time": 72.12567083265589, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--117/temp/line_14_A.wav", + "silence_duration": 0.49269978708660184, + "is_interrupted": false + } + ] + }, + "DialogSum--val--119": { + "original_text": "A: This is 911. \nB: Send an ambulance fast! My husband is having a heart attack! \nA: Slow down and tell me your [interrupt] location so we can send help immediately and provide you with the necessary medical instructions while you wait for the paramedics to arrive. \nB: 1177 Oak lane in Smithfield! Oh, hurry, I don't know what to do! \nA: An ambulance is on its way right now. They should be there any minute. Are you close to him? Can you stay with him until help arrives? \nB: Yes, yes, he's right here by me! \nA: Is he breathing? \nB: Yes, he's breathing, but he's not conscious! Oh, please hurry! \nA: Just to confirm, your address is 1177 Oak Lane in Smithfield, right? The ambulance is on its way. Stay with him and keep monitoring his breathing.", + "cleaned_text": "A: This is 911. \nB: Send an ambulance fast! My husband is having a heart attack! \nA:Slow down and tell me your location so we can send help immediately and provide you with the necessary medical instructions while you wait for the paramedics to arrive.\nB: 1177 Oak lane in Smithfield! Oh, hurry, I don't know what to do! \nA: An ambulance is on its way right now. They should be there any minute. Are you close to him? Can you stay with him until help arrives? \nB: Yes, yes, he's right here by me! \nA: Is he breathing? \nB: Yes, he's breathing, but he's not conscious! Oh, please hurry! \nA: Just to confirm, your address is 1177 Oak Lane in Smithfield, right? The ambulance is on its way. Stay with him and keep monitoring his breathing.", + "total_duration": 42.262403628117916, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "This is 911.", + "original_text": "This is 911.", + "start_time": 0, + "end_time": 1.8343764172335602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Send an ambulance fast! My husband is having a heart attack!", + "original_text": "Send an ambulance fast! My husband is having a heart attack!", + "start_time": 2.2000683007639967, + "end_time": 5.4508619515576475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_1_B.wav", + "silence_duration": 0.3656918835304364, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Slow down and tell me your", + "original_text": "Slow down and tell me your [interrupt] location so we can send help immediately and provide you with the necessary medical instructions while you wait for the paramedics to arrive.", + "start_time": 5.903117989931798, + "end_time": 15.632278987664225, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_2_A.wav", + "silence_duration": 0.4522560383741503, + "is_interrupted": true, + "text_after_interrupt": "location so we can send help immediately and provide you with the necessary medical instructions while you wait for the paramedics to arrive." + }, + { + "speaker": "B", + "text": "1177 Oak lane in Smithfield! Oh, hurry, I don't know what to do!", + "original_text": "1177 Oak lane in Smithfield! Oh, hurry, I don't know what to do!", + "start_time": 8.120623658866037, + "end_time": 12.45114520081615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_3_B.wav", + "silence_duration": 0.48344937506313257, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "An ambulance is on its way right now. They should be there any minute. Are you close to him? Can you stay with him until help arrives?", + "original_text": "An ambulance is on its way right now. They should be there any minute. Are you close to him? Can you stay with him until help arrives?", + "start_time": 16.151596264322073, + "end_time": 24.208920527360622, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_4_A.wav", + "silence_duration": 0.5193172766578481, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, yes, he's right here by me!", + "original_text": "Yes, yes, he's right here by me!", + "start_time": 24.67892190660249, + "end_time": 26.47846839186326, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_5_B.wav", + "silence_duration": 0.4700013792418676, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is he breathing?", + "original_text": "Is he breathing?", + "start_time": 26.856233738915773, + "end_time": 27.831471834153866, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_6_A.wav", + "silence_duration": 0.3777653470525143, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, he's breathing, but he's not conscious! Oh, please hurry!", + "original_text": "Yes, he's breathing, but he's not conscious! Oh, please hurry!", + "start_time": 28.21042457014218, + "end_time": 31.60053794882699, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_7_B.wav", + "silence_duration": 0.3789527359883133, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Just to confirm, your address is 1177 Oak Lane in Smithfield, right? The ambulance is on its way. Stay with him and keep monitoring his breathing.", + "original_text": "Just to confirm, your address is 1177 Oak Lane in Smithfield, right? The ambulance is on its way. Stay with him and keep monitoring his breathing.", + "start_time": 32.18495070092121, + "end_time": 42.26241101838153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--119/temp/line_8_A.wav", + "silence_duration": 0.5844127520942237, + "is_interrupted": false + } + ] + }, + "DialogSum--val--120": { + "original_text": "A: Can I help you? \nB: Yes. When is the next train to New York City? \nA: Let me see. . . the train to New York City. . . here it is. . . daily except Sunday at ten thirty, twelve twenty and [interrupt] at fifteen ten, with additional express services available during peak hours that can get you there much faster if you're in a hurry. \nB: Wait, aren't there any trains before ten thirty? \nA: Sorry, not before ten thirty. \nB: Then one to New York at ten thirty. \nA: One way or round trip? \nB: One way. \nA: A soft seat or hard one? \nB: How much is a soft? \nA: 15 dollars. And for a hard one, only 6 dollars. \nB: Then one hard seat, please. Oh, by the way, you were about to mention the other train times after twelve twenty? \nA: Yes, the other one is at fifteen ten.", + "cleaned_text": "A: Can I help you? \nB: Yes. When is the next train to New York City? \nA:Let me see. . . the train to New York City. . . here it is. . . daily except Sunday at ten thirty, twelve twenty and at fifteen ten, with additional express services available during peak hours that can get you there much faster if you're in a hurry.\nB: Wait, aren't there any trains before ten thirty? \nA: Sorry, not before ten thirty. \nB: Then one to New York at ten thirty. \nA: One way or round trip? \nB: One way. \nA: A soft seat or hard one? \nB: How much is a soft? \nA: 15 dollars. And for a hard one, only 6 dollars. \nB: Then one hard seat, please. Oh, by the way, you were about to mention the other train times after twelve twenty? \nA: Yes, the other one is at fifteen ten.", + "total_duration": 43.52553287981859, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can I help you?", + "original_text": "Can I help you?", + "start_time": 0, + "end_time": 0.9287981859410431, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. When is the next train to New York City?", + "original_text": "Yes. When is the next train to New York City?", + "start_time": 1.2453457967227686, + "end_time": 3.6370011255209547, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_1_B.wav", + "silence_duration": 0.3165476107817255, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let me see. . . the train to New York City. . . here it is. . . daily except Sunday at ten thirty, twelve twenty and", + "original_text": "Let me see. . . the train to New York City. . . here it is. . . daily except Sunday at ten thirty, twelve twenty and [interrupt] at fifteen ten, with additional express services available during peak hours that can get you there much faster if you're in a hurry.", + "start_time": 4.0580375593947, + "end_time": 19.011688353045493, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_2_A.wav", + "silence_duration": 0.42103643387374534, + "is_interrupted": true, + "text_after_interrupt": "at fifteen ten, with additional express services available during peak hours that can get you there much faster if you're in a hurry." + }, + { + "speaker": "B", + "text": "Wait, aren't there any trains before ten thirty?", + "original_text": "Wait, aren't there any trains before ten thirty?", + "start_time": 11.767062502705357, + "end_time": 14.286427582070438, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_3_B.wav", + "silence_duration": 0.3438829723152557, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, not before ten thirty.", + "original_text": "Sorry, not before ten thirty.", + "start_time": 19.4169760424403, + "end_time": 21.3326223009437, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_4_A.wav", + "silence_duration": 0.4052876893948089, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Then one to New York at ten thirty.", + "original_text": "Then one to New York at ten thirty.", + "start_time": 21.6676390222082, + "end_time": 23.42074559817192, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_5_B.wav", + "silence_duration": 0.33501672126449755, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "One way or round trip?", + "original_text": "One way or round trip?", + "start_time": 23.763627721774746, + "end_time": 25.017505272795155, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_6_A.wav", + "silence_duration": 0.3428821236028273, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "One way.", + "original_text": "One way.", + "start_time": 25.34705975789393, + "end_time": 26.078488329322504, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_7_B.wav", + "silence_duration": 0.32955448509877566, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "A soft seat or hard one?", + "original_text": "A soft seat or hard one?", + "start_time": 26.63345682129805, + "end_time": 28.38656339726177, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_8_A.wav", + "silence_duration": 0.5549684919755475, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How much is a soft?", + "original_text": "How much is a soft?", + "start_time": 28.833254262120626, + "end_time": 30.052301881168244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_9_B.wav", + "silence_duration": 0.44669086485885534, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "15 dollars. And for a hard one, only 6 dollars.", + "original_text": "15 dollars. And for a hard one, only 6 dollars.", + "start_time": 30.473461941326818, + "end_time": 34.36280434495494, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_10_A.wav", + "silence_duration": 0.42116006015857305, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Then one hard seat, please. Oh, by the way, you were about to mention the other train times after twelve twenty?", + "original_text": "Then one hard seat, please. Oh, by the way, you were about to mention the other train times after twelve twenty?", + "start_time": 34.88343906844037, + "end_time": 40.86257739043583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_11_B.wav", + "silence_duration": 0.5206347234854309, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, the other one is at fifteen ten.", + "original_text": "Yes, the other one is at fifteen ten.", + "start_time": 41.16872758552553, + "end_time": 43.52555298235093, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--120/temp/line_12_A.wav", + "silence_duration": 0.3061501950896993, + "is_interrupted": false + } + ] + }, + "DialogSum--val--121": { + "original_text": "A: Can you believe that Obama is our new President? I feel like this is such a historic moment for our country and [interrupt] it marks a significant turning point in American politics that will inspire generations to come.\nB: I'm so happy about that. Did you vote for him, by the way?\nA: Sorry to cut in, but I just wanted to ask, what do you think his first big move will be?\nB: I think he's going to focus on the economy first. But, wait, you were asking if I voted for him—yes, I did. How about you?\nA: I voted for him. I have complete confidence in our new President.\nB: Is that right?\nA: I know he will help change America.\nB: I hope so, because America needs a change.\nA: I feel like things are already changing, because he was elected.\nB: I agree with you completely.\nA: I'm not worried about our country now that it's in his hands.", + "cleaned_text": "A:Can you believe that Obama is our new President? I feel like this is such a historic moment for our country and it marks a significant turning point in American politics that will inspire generations to come.\nB: I'm so happy about that. Did you vote for him, by the way?\nA: Sorry to cut in, but I just wanted to ask, what do you think his first big move will be?\nB: I think he's going to focus on the economy first. But, wait, you were asking if I voted for him—yes, I did. How about you?\nA: I voted for him. I have complete confidence in our new President.\nB: Is that right?\nA: I know he will help change America.\nB: I hope so, because America needs a change.\nA: I feel like things are already changing, because he was elected.\nB: I agree with you completely.\nA: I'm not worried about our country now that it's in his hands.", + "total_duration": 47.14113378684807, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can you believe that Obama is our new President? I feel like this is such a historic moment for our country and", + "original_text": "Can you believe that Obama is our new President? I feel like this is such a historic moment for our country and [interrupt] it marks a significant turning point in American politics that will inspire generations to come.", + "start_time": 0, + "end_time": 12.759365079365079, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "it marks a significant turning point in American politics that will inspire generations to come." + }, + { + "speaker": "B", + "text": "I'm so happy about that. Did you vote for him, by the way?", + "original_text": "I'm so happy about that. Did you vote for him, by the way?", + "start_time": 7.2562358276643995, + "end_time": 9.810430839002269, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_1_B.wav", + "silence_duration": 0.5229735893536273, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry to cut in, but I just wanted to ask, what do you think his first big move will be?", + "original_text": "Sorry to cut in, but I just wanted to ask, what do you think his first big move will be?", + "start_time": 13.201097168627756, + "end_time": 18.41397698722186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_2_A.wav", + "silence_duration": 0.4417320892626768, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think he's going to focus on the economy first. But, wait, you were asking if I voted for him—yes, I did. How about you?", + "original_text": "I think he's going to focus on the economy first. But, wait, you were asking if I voted for him—yes, I did. How about you?", + "start_time": 18.72658067920933, + "end_time": 26.1801861213862, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_3_B.wav", + "silence_duration": 0.3126036919874709, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I voted for him. I have complete confidence in our new President.", + "original_text": "I voted for him. I have complete confidence in our new President.", + "start_time": 26.544778044420777, + "end_time": 30.503780311994472, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_4_A.wav", + "silence_duration": 0.3645919230345766, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is that right?", + "original_text": "Is that right?", + "start_time": 30.959139438523447, + "end_time": 31.713787964600545, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_5_B.wav", + "silence_duration": 0.4553591265289765, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I know he will help change America.", + "original_text": "I know he will help change America.", + "start_time": 32.090378820891665, + "end_time": 34.04085501136785, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_6_A.wav", + "silence_duration": 0.37659085629112116, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I hope so, because America needs a change.", + "original_text": "I hope so, because America needs a change.", + "start_time": 34.458326616073435, + "end_time": 36.757102126277516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_7_B.wav", + "silence_duration": 0.41747160470558553, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I feel like things are already changing, because he was elected.", + "original_text": "I feel like things are already changing, because he was elected.", + "start_time": 37.28193786455476, + "end_time": 41.391869837343876, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_8_A.wav", + "silence_duration": 0.5248357382772433, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I agree with you completely.", + "original_text": "I agree with you completely.", + "start_time": 41.93531344067444, + "end_time": 43.328510719586006, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_9_B.wav", + "silence_duration": 0.5434436033305651, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm not worried about our country now that it's in his hands.", + "original_text": "I'm not worried about our country now that it's in his hands.", + "start_time": 43.64657595399362, + "end_time": 47.1411791285968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--121/temp/line_10_A.wav", + "silence_duration": 0.3180652344076125, + "is_interrupted": false + } + ] + }, + "DialogSum--val--122": { + "original_text": "A: How do I know if I qualify for unemployment benefits?\nB: Are you working fewer hours than you used to work?\nA: I got laid [interrupt] off last week, and it's been a tough situation to manage especially since I wasn't given much notice and have bills piling up that I need to figure out how to cover.\nB: Oh, I'm sorry to hear that. In that case, you usually qualify if you got laid off or are working a lot fewer hours. But just to clarify, when you mentioned being laid off, did your employer provide any severance or mention anything about unemployment benefits?\nA: They didn't mention much about unemployment, but I was wondering—do all jobs provide unemployment?\nB: Most jobs provide unemployment, but some don't. You can call your unemployment office, and they can check for you. By the way, I didn't catch earlier—did you say whether your job pays unemployment?\nA: I'm not sure, that's why I was asking. Do you think that my job pays unemployment?\nB: It's hard to say for certain, but again, the unemployment office can confirm that for you. Will I be able to collect a lot of money on unemployment?\nA: There is a formula to determine the amount based on how much you earned. They will let you know when you file your claim.", + "cleaned_text": "A: How do I know if I qualify for unemployment benefits?\nB: Are you working fewer hours than you used to work?\nA:I got laid off last week, and it's been a tough situation to manage especially since I wasn't given much notice and have bills piling up that I need to figure out how to cover.\nB: Oh, I'm sorry to hear that. In that case, you usually qualify if you got laid off or are working a lot fewer hours. But just to clarify, when you mentioned being laid off, did your employer provide any severance or mention anything about unemployment benefits?\nA: They didn't mention much about unemployment, but I was wondering—do all jobs provide unemployment?\nB: Most jobs provide unemployment, but some don't. You can call your unemployment office, and they can check for you. By the way, I didn't catch earlier—did you say whether your job pays unemployment?\nA: I'm not sure, that's why I was asking. Do you think that my job pays unemployment?\nB: It's hard to say for certain, but again, the unemployment office can confirm that for you. Will I be able to collect a lot of money on unemployment?\nA: There is a formula to determine the amount based on how much you earned. They will let you know when you file your claim.", + "total_duration": 58.15369614512472, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How do I know if I qualify for unemployment benefits?", + "original_text": "How do I know if I qualify for unemployment benefits?", + "start_time": 0, + "end_time": 3.599092970521542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Are you working fewer hours than you used to work?", + "original_text": "Are you working fewer hours than you used to work?", + "start_time": 4.189134240470118, + "end_time": 6.267320181513202, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_1_B.wav", + "silence_duration": 0.5900412699485755, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I got laid", + "original_text": "I got laid [interrupt] off last week, and it's been a tough situation to manage especially since I wasn't given much notice and have bills piling up that I need to figure out how to cover.", + "start_time": 6.660927167880479, + "end_time": 16.90092716788048, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_2_A.wav", + "silence_duration": 0.39360698636727787, + "is_interrupted": true, + "text_after_interrupt": "off last week, and it's been a tough situation to manage especially since I wasn't given much notice and have bills piling up that I need to figure out how to cover." + }, + { + "speaker": "B", + "text": "Oh, I'm sorry to hear that. In that case, you usually qualify if you got laid off or are working a lot fewer hours. But just to clarify, when you mentioned being laid off, did your employer provide any severance or mention anything about unemployment benefits?", + "original_text": "Oh, I'm sorry to hear that. In that case, you usually qualify if you got laid off or are working a lot fewer hours. But just to clarify, when you mentioned being laid off, did your employer provide any severance or mention anything about unemployment benefits?", + "start_time": 7.740655059036942, + "end_time": 21.092128981939435, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_3_B.wav", + "silence_duration": 0.4108465999388726, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They didn't mention much about unemployment, but I was wondering—do all jobs provide unemployment?", + "original_text": "They didn't mention much about unemployment, but I was wondering—do all jobs provide unemployment?", + "start_time": 21.45804913358979, + "end_time": 27.054058203884573, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_4_A.wav", + "silence_duration": 0.36592015165035385, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Most jobs provide unemployment, but some don't. You can call your unemployment office, and they can check for you. By the way, I didn't catch earlier—did you say whether your job pays unemployment?", + "original_text": "Most jobs provide unemployment, but some don't. You can call your unemployment office, and they can check for you. By the way, I didn't catch earlier—did you say whether your job pays unemployment?", + "start_time": 27.520409935819487, + "end_time": 37.957779550331956, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_5_B.wav", + "silence_duration": 0.4663517319349133, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm not sure, that's why I was asking. Do you think that my job pays unemployment?", + "original_text": "I'm not sure, that's why I was asking. Do you think that my job pays unemployment?", + "start_time": 38.317410402056936, + "end_time": 43.553510175299564, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_6_A.wav", + "silence_duration": 0.3596308517249768, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's hard to say for certain, but again, the unemployment office can confirm that for you. Will I be able to collect a lot of money on unemployment?", + "original_text": "It's hard to say for certain, but again, the unemployment office can confirm that for you. Will I be able to collect a lot of money on unemployment?", + "start_time": 44.134645102303686, + "end_time": 51.47215077123793, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_7_B.wav", + "silence_duration": 0.5811349270041226, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There is a formula to determine the amount based on how much you earned. They will let you know when you file your claim.", + "original_text": "There is a formula to determine the amount based on how much you earned. They will let you know when you file your claim.", + "start_time": 51.95398721190486, + "end_time": 58.15371510306132, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--122/temp/line_8_A.wav", + "silence_duration": 0.48183644066693143, + "is_interrupted": false + } + ] + }, + "DialogSum--val--123": { + "original_text": "A: Have you read the feature article about Oprah Winfrey in this magazine? \nB: No, what's it about? \nA: Apparently, she's being given an award for donating so much money to charity and [interrupt] for her lifelong commitment to philanthropy that has inspired millions of people around the world to give back to their communities. \nB: She's very generous with her money. I think that's because she was poor when she was young and knows what it's like to struggle. \nA: Oh, speaking of her generosity, did they mention anything about her recent projects in the article? \nB: Yes, actually! She's not only building a school for underprivileged girls in Africa, but is also using her own money for the upkeep of the school and to pay the teachers a fair salary. \nA: That's really commendable. I think more celebrities should use their money to help people like Oprah has. \nB: I agree. So many celebrities waste their money on sports cars, expensive clothing, and luxurious hotels. \nA: It's amazing how much money they can spend. By the way, you were saying something about Oprah being poor when she was young? \nB: Right, I think her difficult upbringing is what drives her to give back so much now.", + "cleaned_text": "A: Have you read the feature article about Oprah Winfrey in this magazine? \nB: No, what's it about? \nA:Apparently, she's being given an award for donating so much money to charity and for her lifelong commitment to philanthropy that has inspired millions of people around the world to give back to their communities.\nB: She's very generous with her money. I think that's because she was poor when she was young and knows what it's like to struggle. \nA: Oh, speaking of her generosity, did they mention anything about her recent projects in the article? \nB: Yes, actually! She's not only building a school for underprivileged girls in Africa, but is also using her own money for the upkeep of the school and to pay the teachers a fair salary. \nA: That's really commendable. I think more celebrities should use their money to help people like Oprah has. \nB: I agree. So many celebrities waste their money on sports cars, expensive clothing, and luxurious hotels. \nA: It's amazing how much money they can spend. By the way, you were saying something about Oprah being poor when she was young? \nB: Right, I think her difficult upbringing is what drives her to give back so much now.", + "total_duration": 58.444263038548755, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you read the feature article about Oprah Winfrey in this magazine?", + "original_text": "Have you read the feature article about Oprah Winfrey in this magazine?", + "start_time": 0, + "end_time": 3.5294331065759637, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, what's it about?", + "original_text": "No, what's it about?", + "start_time": 3.871507692906359, + "end_time": 5.125385243926767, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_1_B.wav", + "silence_duration": 0.3420745863303957, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Apparently, she's being given an award for donating so much money to charity and", + "original_text": "Apparently, she's being given an award for donating so much money to charity and [interrupt] for her lifelong commitment to philanthropy that has inspired millions of people around the world to give back to their communities.", + "start_time": 5.4371338160961695, + "end_time": 17.34897055079005, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_2_A.wav", + "silence_duration": 0.31174857216940255, + "is_interrupted": true, + "text_after_interrupt": "for her lifelong commitment to philanthropy that has inspired millions of people around the world to give back to their communities." + }, + { + "speaker": "B", + "text": "She's very generous with her money. I think that's because she was poor when she was young and knows what it's like to struggle.", + "original_text": "She's very generous with her money. I think that's because she was poor when she was young and knows what it's like to struggle.", + "start_time": 10.011464881855806, + "end_time": 15.770013634690272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_3_B.wav", + "silence_duration": 0.389517306394859, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, speaking of her generosity, did they mention anything about her recent projects in the article?", + "original_text": "Oh, speaking of her generosity, did they mention anything about her recent projects in the article?", + "start_time": 17.84198649745461, + "end_time": 23.321895794506766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_4_A.wav", + "silence_duration": 0.4930159466645599, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, actually! She's not only building a school for underprivileged girls in Africa, but is also using her own money for the upkeep of the school and to pay the teachers a fair salary.", + "original_text": "Yes, actually! She's not only building a school for underprivileged girls in Africa, but is also using her own money for the upkeep of the school and to pay the teachers a fair salary.", + "start_time": 23.739378124000268, + "end_time": 33.09701984735628, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_5_B.wav", + "silence_duration": 0.41748232949350356, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's really commendable. I think more celebrities should use their money to help people like Oprah has.", + "original_text": "That's really commendable. I think more celebrities should use their money to help people like Oprah has.", + "start_time": 33.47811572324224, + "end_time": 39.735893501020016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_6_A.wav", + "silence_duration": 0.38109587588595933, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I agree. So many celebrities waste their money on sports cars, expensive clothing, and luxurious hotels.", + "original_text": "I agree. So many celebrities waste their money on sports cars, expensive clothing, and luxurious hotels.", + "start_time": 40.04807691225183, + "end_time": 46.096875098192875, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_7_B.wav", + "silence_duration": 0.3121834112318176, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's amazing how much money they can spend. By the way, you were saying something about Oprah being poor when she was young?", + "original_text": "It's amazing how much money they can spend. By the way, you were saying something about Oprah being poor when she was young?", + "start_time": 46.531005319219986, + "end_time": 53.48538173645355, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_8_A.wav", + "silence_duration": 0.4341302210271094, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right, I think her difficult upbringing is what drives her to give back so much now.", + "original_text": "Right, I think her difficult upbringing is what drives her to give back so much now.", + "start_time": 54.009291247075005, + "end_time": 58.444302584943486, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--123/temp/line_9_B.wav", + "silence_duration": 0.523909510621458, + "is_interrupted": false + } + ] + }, + "DialogSum--val--124": { + "original_text": "A: Thank you for your interest in this job. You'll be hearing from us. Send the next applicant in on your way out, please.\nB: Thank you very much for offering me this opportunity. It has been pleasant talking with [interrupt] you and learning more about the company's culture, values, and future growth plans which align perfectly with my career aspirations.\nA: Sorry to jump in, but before you go, may I call you at your home about our final decision?\nB: Yes, please. My telephone number is 367 - 1314. You can call me between four and six in the afternoon.\nA: Great, we'll get in touch with you by next Wednesday. By the way, I didn't catch the rest of what you were saying earlier. You mentioned it was pleasant talking with...?\nB: Oh, right! I was just saying it has been pleasant talking with you too. Thank you.\nA: Thank you for your interview.", + "cleaned_text": "A: Thank you for your interest in this job. You'll be hearing from us. Send the next applicant in on your way out, please.\nB:Thank you very much for offering me this opportunity. It has been pleasant talking with you and learning more about the company's culture, values, and future growth plans which align perfectly with my career aspirations.\nA: Sorry to jump in, but before you go, may I call you at your home about our final decision?\nB: Yes, please. My telephone number is 367 - 1314. You can call me between four and six in the afternoon.\nA: Great, we'll get in touch with you by next Wednesday. By the way, I didn't catch the rest of what you were saying earlier. You mentioned it was pleasant talking with...?\nB: Oh, right! I was just saying it has been pleasant talking with you too. Thank you.\nA: Thank you for your interview.", + "total_duration": 42.739501133786845, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Thank you for your interest in this job. You'll be hearing from us. Send the next applicant in on your way out, please.", + "original_text": "Thank you for your interest in this job. You'll be hearing from us. Send the next applicant in on your way out, please.", + "start_time": 0, + "end_time": 7.151746031746032, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you very much for offering me this opportunity. It has been pleasant talking with", + "original_text": "Thank you very much for offering me this opportunity. It has been pleasant talking with [interrupt] you and learning more about the company's culture, values, and future growth plans which align perfectly with my career aspirations.", + "start_time": 7.494375778810392, + "end_time": 18.38453450896912, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/temp/line_1_B.wav", + "silence_duration": 0.3426297470643601, + "is_interrupted": true, + "text_after_interrupt": "you and learning more about the company's culture, values, and future growth plans which align perfectly with my career aspirations." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but before you go, may I call you at your home about our final decision?", + "original_text": "Sorry to jump in, but before you go, may I call you at your home about our final decision?", + "start_time": 11.790067388787715, + "end_time": 17.664715914864814, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/temp/line_2_A.wav", + "silence_duration": 0.3945883096632385, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, please. My telephone number is 367 - 1314. You can call me between four and six in the afternoon.", + "original_text": "Yes, please. My telephone number is 367 - 1314. You can call me between four and six in the afternoon.", + "start_time": 18.687813344750012, + "end_time": 26.698697698491507, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/temp/line_3_B.wav", + "silence_duration": 0.30327883578089077, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Great, we'll get in touch with you by next Wednesday. By the way, I didn't catch the rest of what you were saying earlier. You mentioned it was pleasant talking with...?", + "original_text": "Great, we'll get in touch with you by next Wednesday. By the way, I didn't catch the rest of what you were saying earlier. You mentioned it was pleasant talking with...?", + "start_time": 27.13030799878865, + "end_time": 36.104820470443975, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/temp/line_4_A.wav", + "silence_duration": 0.4316103002971401, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! I was just saying it has been pleasant talking with you too. Thank you.", + "original_text": "Oh, right! I was just saying it has been pleasant talking with you too. Thank you.", + "start_time": 36.4343407869363, + "end_time": 40.764862328886416, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/temp/line_5_B.wav", + "silence_duration": 0.3295203164923261, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you for your interview.", + "original_text": "Thank you for your interview.", + "start_time": 41.206994555333466, + "end_time": 42.73951156213619, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--124/temp/line_6_A.wav", + "silence_duration": 0.44213222644704714, + "is_interrupted": false + } + ] + }, + "DialogSum--val--125": { + "original_text": "A: Dental clinic. This is Mr. Adams. \nB: Hi. My name's David Johnson. I'd like to make an appointment. \nA: All right, David. Is this for a checkup or a [interrupt] cleaning? We have availability for both procedures, but the scheduling might differ depending on which service you require and the severity of your dental concerns. \nB: Sorry to cut in, but I have a really bad cavity. Half the side of my head hurts. \nA: Oh, that sounds painful. We'll definitely need to check that out. Which tooth is giving you the most pain? \nB: One of the back ones. But you were asking if it was for a checkup or a cleaning? \nA: Yes, I was. So, it's for a checkup then, right?", + "cleaned_text": "A: Dental clinic. This is Mr. Adams. \nB: Hi. My name's David Johnson. I'd like to make an appointment. \nA:All right, David. Is this for a checkup or a cleaning? We have availability for both procedures, but the scheduling might differ depending on which service you require and the severity of your dental concerns.\nB: Sorry to cut in, but I have a really bad cavity. Half the side of my head hurts. \nA: Oh, that sounds painful. We'll definitely need to check that out. Which tooth is giving you the most pain? \nB: One of the back ones. But you were asking if it was for a checkup or a cleaning? \nA: Yes, I was. So, it's for a checkup then, right?", + "total_duration": 35.582630385487526, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Dental clinic. This is Mr. Adams.", + "original_text": "Dental clinic. This is Mr. Adams.", + "start_time": 0, + "end_time": 3.111473922902494, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hi. My name's David Johnson. I'd like to make an appointment.", + "original_text": "Hi. My name's David Johnson. I'd like to make an appointment.", + "start_time": 3.454511112795135, + "end_time": 7.06521406064094, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/temp/line_1_B.wav", + "silence_duration": 0.34303718989264115, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "All right, David. Is this for a checkup or a", + "original_text": "All right, David. Is this for a checkup or a [interrupt] cleaning? We have availability for both procedures, but the scheduling might differ depending on which service you require and the severity of your dental concerns.", + "start_time": 7.63116872808864, + "end_time": 20.065454442374353, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/temp/line_2_A.wav", + "silence_duration": 0.5659546674476997, + "is_interrupted": true, + "text_after_interrupt": "cleaning? We have availability for both procedures, but the scheduling might differ depending on which service you require and the severity of your dental concerns." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but I have a really bad cavity. Half the side of my head hurts.", + "original_text": "Sorry to cut in, but I have a really bad cavity. Half the side of my head hurts.", + "start_time": 11.090941970719026, + "end_time": 15.560783240560296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/temp/line_3_B.wav", + "silence_duration": 0.3574883979480218, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that sounds painful. We'll definitely need to check that out. Which tooth is giving you the most pain?", + "original_text": "Oh, that sounds painful. We'll definitely need to check that out. Which tooth is giving you the most pain?", + "start_time": 20.482633148931424, + "end_time": 27.019050382491514, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/temp/line_4_A.wav", + "silence_duration": 0.4171787065570718, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "One of the back ones. But you were asking if it was for a checkup or a cleaning?", + "original_text": "One of the back ones. But you were asking if it was for a checkup or a cleaning?", + "start_time": 27.47279573050383, + "end_time": 31.30408824751063, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/temp/line_5_B.wav", + "silence_duration": 0.4537453480123148, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I was. So, it's for a checkup then, right?", + "original_text": "Yes, I was. So, it's for a checkup then, right?", + "start_time": 31.809417300642917, + "end_time": 35.5826599310284, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--125/temp/line_6_A.wav", + "silence_duration": 0.5053290531322859, + "is_interrupted": false + } + ] + }, + "DialogSum--val--126": { + "original_text": "A: Have you moved into your new house yet, Michael? \nB: We just moved in yesterday, actually. \nA: So, what do you think about the place? Are you glad that you [interrupt] finally settled in after all the moving chaos? It must be such a relief to have everything unpacked and organized after weeks of preparation. \nB: Sorry to jump in, but I wanted to ask—how old is the house? \nA: It's about 200 years old. It has a lot of history! But I was going to say, yes, we're glad we moved in, though we're going to spend a fortune doing everything up. \nB: Sounds fascinating. Where is your new house located? \nA: It's just off of the ring road. \nB: Do you have a big yard? \nA: It's bigger than our last one. I've got flowers in the front, and fruits, vegetables, and a [interrupt] small herb garden that I'm really excited about because I've always wanted to grow my own fresh herbs for cooking and medicinal purposes. \nB: Oh, I forgot to ask earlier—does your house get enough natural light? \nA: Yes, it does! Our windows let plenty of natural light in. I was just about to mention that we also have a fish pond in the back, along with the fruits and vegetables. Plus, the windows have wonderful views of the park behind our house.", + "cleaned_text": "A: Have you moved into your new house yet, Michael? \nB: We just moved in yesterday, actually. \nA:So, what do you think about the place? Are you glad that you finally settled in after all the moving chaos? It must be such a relief to have everything unpacked and organized after weeks of preparation.\nB: Sorry to jump in, but I wanted to ask—how old is the house? \nA: It's about 200 years old. It has a lot of history! But I was going to say, yes, we're glad we moved in, though we're going to spend a fortune doing everything up. \nB: Sounds fascinating. Where is your new house located? \nA: It's just off of the ring road. \nB: Do you have a big yard? \nA:It's bigger than our last one. I've got flowers in the front, and fruits, vegetables, and a small herb garden that I'm really excited about because I've always wanted to grow my own fresh herbs for cooking and medicinal purposes.\nB: Oh, I forgot to ask earlier—does your house get enough natural light? \nA: Yes, it does! Our windows let plenty of natural light in. I was just about to mention that we also have a fish pond in the back, along with the fruits and vegetables. Plus, the windows have wonderful views of the park behind our house.", + "total_duration": 64.27301587301588, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you moved into your new house yet, Michael?", + "original_text": "Have you moved into your new house yet, Michael?", + "start_time": 0, + "end_time": 2.414875283446712, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We just moved in yesterday, actually.", + "original_text": "We just moved in yesterday, actually.", + "start_time": 2.7281114771314687, + "end_time": 4.678587667607659, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_1_B.wav", + "silence_duration": 0.31323619368475675, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So, what do you think about the place? Are you glad that you", + "original_text": "So, what do you think about the place? Are you glad that you [interrupt] finally settled in after all the moving chaos? It must be such a relief to have everything unpacked and organized after weeks of preparation.", + "start_time": 5.229735651784598, + "end_time": 17.002252658587317, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_2_A.wav", + "silence_duration": 0.551147984176938, + "is_interrupted": true, + "text_after_interrupt": "finally settled in after all the moving chaos? It must be such a relief to have everything unpacked and organized after weeks of preparation." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but I wanted to ask—how old is the house?", + "original_text": "Sorry to jump in, but I wanted to ask—how old is the house?", + "start_time": 9.002978282170085, + "end_time": 12.660121139312942, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_3_B.wav", + "silence_duration": 0.3069361077866654, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's about 200 years old. It has a lot of history! But I was going to say, yes, we're glad we moved in, though we're going to spend a fortune doing everything up.", + "original_text": "It's about 200 years old. It has a lot of history! But I was going to say, yes, we're glad we moved in, though we're going to spend a fortune doing everything up.", + "start_time": 17.458027526686944, + "end_time": 27.698027526686943, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_4_A.wav", + "silence_duration": 0.45577486809962897, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sounds fascinating. Where is your new house located?", + "original_text": "Sounds fascinating. Where is your new house located?", + "start_time": 28.002638956430726, + "end_time": 31.021233060739117, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_5_B.wav", + "silence_duration": 0.3046114297437835, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's just off of the ring road.", + "original_text": "It's just off of the ring road.", + "start_time": 31.491644093627507, + "end_time": 33.50017017072501, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_6_A.wav", + "silence_duration": 0.47041103288838826, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you have a big yard?", + "original_text": "Do you have a big yard?", + "start_time": 34.034248221160155, + "end_time": 35.20685593091072, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_7_B.wav", + "silence_duration": 0.5340780504351388, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's bigger than our last one. I've got flowers in the front, and fruits, vegetables, and a", + "original_text": "It's bigger than our last one. I've got flowers in the front, and fruits, vegetables, and a [interrupt] small herb garden that I'm really excited about because I've always wanted to grow my own fresh herbs for cooking and medicinal purposes.", + "start_time": 35.7645280151184, + "end_time": 50.335049557068515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_8_A.wav", + "silence_duration": 0.5576720842076791, + "is_interrupted": true, + "text_after_interrupt": "small herb garden that I'm really excited about because I've always wanted to grow my own fresh herbs for cooking and medicinal purposes." + }, + { + "speaker": "B", + "text": "Oh, I forgot to ask earlier—does your house get enough natural light?", + "original_text": "Oh, I forgot to ask earlier—does your house get enough natural light?", + "start_time": 45.51393759039357, + "end_time": 49.34523010740037, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_9_B.wav", + "silence_duration": 0.45364577030240816, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it does! Our windows let plenty of natural light in. I was just about to mention that we also have a fish pond in the back, along with the fruits and vegetables. Plus, the windows have wonderful views of the park behind our house.", + "original_text": "Yes, it does! Our windows let plenty of natural light in. I was just about to mention that we also have a fish pond in the back, along with the fruits and vegetables. Plus, the windows have wonderful views of the park behind our house.", + "start_time": 50.93315549888695, + "end_time": 64.27301944446518, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--126/temp/line_10_A.wav", + "silence_duration": 0.5981059418184309, + "is_interrupted": false + } + ] + }, + "DialogSum--val--127": { + "original_text": "A: Good afternoon. \nB: Good afternoon. Can I help you? \nA: I've got this important letter to send to Hainan. Can I send it by registered [interrupt] mail with tracking and insurance? I want to make sure it is properly tracked throughout its journey and arrives safely at its destination without any issues. \nB: Sorry to interrupt, but do you need it to arrive by a specific date? We have options for faster delivery if it's urgent. \nA: No, regular registered mail is fine. How much will I have to pay? \nB: Two yuan, please. \nA: Here are the letter and the money. \nB: Wait a moment. It seems that your letter is overweight. Let me [interrupt] carefully check the exact weight on our precision scale and calculate the additional postage required based on the current postal rates for overweight items. \nA: Overweight? Does that mean I need to pay more? \nB: Yes, I'm afraid it is. So you will have to pay two yuan extra. The total charge is four yuan. \nA: All right. Here is the money. \nB: Here are the stamps and your receipt.", + "cleaned_text": "A: Good afternoon. \nB: Good afternoon. Can I help you? \nA:I've got this important letter to send to Hainan. Can I send it by registered mail with tracking and insurance? I want to make sure it is properly tracked throughout its journey and arrives safely at its destination without any issues.\nB: Sorry to interrupt, but do you need it to arrive by a specific date? We have options for faster delivery if it's urgent. \nA: No, regular registered mail is fine. How much will I have to pay? \nB: Two yuan, please. \nA: Here are the letter and the money. \nB:Wait a moment. It seems that your letter is overweight. Let me carefully check the exact weight on our precision scale and calculate the additional postage required based on the current postal rates for overweight items.\nA: Overweight? Does that mean I need to pay more? \nB: Yes, I'm afraid it is. So you will have to pay two yuan extra. The total charge is four yuan. \nA: All right. Here is the money. \nB: Here are the stamps and your receipt.", + "total_duration": 50.33986394557823, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good afternoon.", + "original_text": "Good afternoon.", + "start_time": 0, + "end_time": 0.9984580498866213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good afternoon. Can I help you?", + "original_text": "Good afternoon. Can I help you?", + "start_time": 1.5338582076120166, + "end_time": 3.124425101036053, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_1_B.wav", + "silence_duration": 0.5354001577253953, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I've got this important letter to send to Hainan. Can I send it by registered", + "original_text": "I've got this important letter to send to Hainan. Can I send it by registered [interrupt] mail with tracking and insurance? I want to make sure it is properly tracked throughout its journey and arrives safely at its destination without any issues.", + "start_time": 3.708932207369429, + "end_time": 17.524805223242446, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_2_A.wav", + "silence_duration": 0.584507106333376, + "is_interrupted": true, + "text_after_interrupt": "mail with tracking and insurance? I want to make sure it is properly tracked throughout its journey and arrives safely at its destination without any issues." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but do you need it to arrive by a specific date? We have options for faster delivery if it's urgent.", + "original_text": "Sorry to interrupt, but do you need it to arrive by a specific date? We have options for faster delivery if it's urgent.", + "start_time": 8.387753069047434, + "end_time": 14.924170302607525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_3_B.wav", + "silence_duration": 0.40268372852641254, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, regular registered mail is fine. How much will I have to pay?", + "original_text": "No, regular registered mail is fine. How much will I have to pay?", + "start_time": 17.868751181644488, + "end_time": 22.04834301837918, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_4_A.wav", + "silence_duration": 0.3439459584020403, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Two yuan, please.", + "original_text": "Two yuan, please.", + "start_time": 22.480186243574185, + "end_time": 23.652793953324753, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_5_B.wav", + "silence_duration": 0.4318432251950026, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Here are the letter and the money.", + "original_text": "Here are the letter and the money.", + "start_time": 24.242403133430244, + "end_time": 25.774920140232965, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_6_A.wav", + "silence_duration": 0.5896091801054908, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait a moment. It seems that your letter is overweight. Let me", + "original_text": "Wait a moment. It seems that your letter is overweight. Let me [interrupt] carefully check the exact weight on our precision scale and calculate the additional postage required based on the current postal rates for overweight items.", + "start_time": 26.369422823463548, + "end_time": 37.08543189375833, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_7_B.wav", + "silence_duration": 0.5945026832305838, + "is_interrupted": true, + "text_after_interrupt": "carefully check the exact weight on our precision scale and calculate the additional postage required based on the current postal rates for overweight items." + }, + { + "speaker": "A", + "text": "Overweight? Does that mean I need to pay more?", + "original_text": "Overweight? Does that mean I need to pay more?", + "start_time": 36.51221984813608, + "end_time": 39.786233453578255, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_8_A.wav", + "silence_duration": 0.5029309081377347, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'm afraid it is. So you will have to pay two yuan extra. The total charge is four yuan.", + "original_text": "Yes, I'm afraid it is. So you will have to pay two yuan extra. The total charge is four yuan.", + "start_time": 40.281756544689514, + "end_time": 45.970645433578404, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_9_B.wav", + "silence_duration": 0.49552309111126147, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "All right. Here is the money.", + "original_text": "All right. Here is the money.", + "start_time": 46.3177162922848, + "end_time": 48.03599293627573, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_10_A.wav", + "silence_duration": 0.34707085870639487, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here are the stamps and your receipt.", + "original_text": "Here are the stamps and your receipt.", + "start_time": 48.56356955668884, + "end_time": 50.339896087301085, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--127/temp/line_11_B.wav", + "silence_duration": 0.5275766204131056, + "is_interrupted": false + } + ] + }, + "DialogSum--val--129": { + "original_text": "A: I have a good feeling about this house. \nB: Yes, I liked it the first moment I pulled up to it. \nA: I love the paint job! \nB: If you like the outside, you are going to really love the [interrupt] interior design; it has a modern yet cozy feel to it with beautiful hardwood floors, an open floor plan, and plenty of natural light streaming through the large windows. \nA: Oh, before we go inside, do you know if the roof has been recently inspected? I always worry about potential issues like that. \nB: That's a great question. Yes, the roof was inspected last year, and it's in excellent condition. Now, as I was saying, the inside is really something special. What a beautiful home! \nA: You'll notice that the window treatments, carpeting, and drapes are all new. \nB: I like the way the blinds give you privacy from the street. \nA: Follow me into the kitchen. You will love it. \nB: I love that they put a wine storage area in the kitchen. \nA: The best part is the bedroom and attached bathroom. \nB: I love the relaxing colors in the tile and floor covering! \nA: Oh, we didn't take any pictures of the kitchen yet, did we? Let's take a few pictures so that we can remember what we like about this home.", + "cleaned_text": "A: I have a good feeling about this house. \nB: Yes, I liked it the first moment I pulled up to it. \nA: I love the paint job! \nB:If you like the outside, you are going to really love the interior design; it has a modern yet cozy feel to it with beautiful hardwood floors, an open floor plan, and plenty of natural light streaming through the large windows.\nA: Oh, before we go inside, do you know if the roof has been recently inspected? I always worry about potential issues like that. \nB: That's a great question. Yes, the roof was inspected last year, and it's in excellent condition. Now, as I was saying, the inside is really something special. What a beautiful home! \nA: You'll notice that the window treatments, carpeting, and drapes are all new. \nB: I like the way the blinds give you privacy from the street. \nA: Follow me into the kitchen. You will love it. \nB: I love that they put a wine storage area in the kitchen. \nA: The best part is the bedroom and attached bathroom. \nB: I love the relaxing colors in the tile and floor covering! \nA: Oh, we didn't take any pictures of the kitchen yet, did we? Let's take a few pictures so that we can remember what we like about this home.", + "total_duration": 58.50621315192744, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I have a good feeling about this house.", + "original_text": "I have a good feeling about this house.", + "start_time": 0, + "end_time": 2.159455782312925, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I liked it the first moment I pulled up to it.", + "original_text": "Yes, I liked it the first moment I pulled up to it.", + "start_time": 2.5331576691946567, + "end_time": 5.482091909557468, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_1_B.wav", + "silence_duration": 0.3737018868817316, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I love the paint job!", + "original_text": "I love the paint job!", + "start_time": 6.064701647783414, + "end_time": 7.481118881343504, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_2_A.wav", + "silence_duration": 0.5826097382259456, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If you like the outside, you are going to really love the", + "original_text": "If you like the outside, you are going to really love the [interrupt] interior design; it has a modern yet cozy feel to it with beautiful hardwood floors, an open floor plan, and plenty of natural light streaming through the large windows.", + "start_time": 7.861210059128695, + "end_time": 19.819486703119622, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_3_B.wav", + "silence_duration": 0.38009117778519025, + "is_interrupted": true, + "text_after_interrupt": "interior design; it has a modern yet cozy feel to it with beautiful hardwood floors, an open floor plan, and plenty of natural light streaming through the large windows." + }, + { + "speaker": "A", + "text": "Oh, before we go inside, do you know if the roof has been recently inspected? I always worry about potential issues like that.", + "original_text": "Oh, before we go inside, do you know if the roof has been recently inspected? I always worry about potential issues like that.", + "start_time": 11.158443619219398, + "end_time": 19.215767882257946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_4_A.wav", + "silence_duration": 0.55643880718499, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a great question. Yes, the roof was inspected last year, and it's in excellent condition. Now, as I was saying, the inside is really something special. What a beautiful home!", + "original_text": "That's a great question. Yes, the roof was inspected last year, and it's in excellent condition. Now, as I was saying, the inside is really something special. What a beautiful home!", + "start_time": 20.21883005183577, + "end_time": 30.156970641404932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_5_B.wav", + "silence_duration": 0.3993433487161465, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You'll notice that the window treatments, carpeting, and drapes are all new.", + "original_text": "You'll notice that the window treatments, carpeting, and drapes are all new.", + "start_time": 30.648604459037838, + "end_time": 34.47989697604464, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_6_A.wav", + "silence_duration": 0.49163381763290437, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like the way the blinds give you privacy from the street.", + "original_text": "I like the way the blinds give you privacy from the street.", + "start_time": 34.99863757000475, + "end_time": 37.73859221853083, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_7_B.wav", + "silence_duration": 0.5187405939601086, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Follow me into the kitchen. You will love it.", + "original_text": "Follow me into the kitchen. You will love it.", + "start_time": 38.22717184444797, + "end_time": 40.421457558733685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_8_A.wav", + "silence_duration": 0.48857962591713777, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I love that they put a wine storage area in the kitchen.", + "original_text": "I love that they put a wine storage area in the kitchen.", + "start_time": 40.930140777238485, + "end_time": 43.762975244358664, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_9_B.wav", + "silence_duration": 0.5086832185048005, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The best part is the bedroom and attached bathroom.", + "original_text": "The best part is the bedroom and attached bathroom.", + "start_time": 44.186581100537985, + "end_time": 47.15873529554932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_10_A.wav", + "silence_duration": 0.42360585617932167, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I love the relaxing colors in the tile and floor covering!", + "original_text": "I love the relaxing colors in the tile and floor covering!", + "start_time": 47.55255776634591, + "end_time": 50.48988202938446, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_11_B.wav", + "silence_duration": 0.39382247079659016, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, we didn't take any pictures of the kitchen yet, did we? Let's take a few pictures so that we can remember what we like about this home.", + "original_text": "Oh, we didn't take any pictures of the kitchen yet, did we? Let's take a few pictures so that we can remember what we like about this home.", + "start_time": 51.07584767508425, + "end_time": 58.506233162612595, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--129/temp/line_12_A.wav", + "silence_duration": 0.5859656456997852, + "is_interrupted": false + } + ] + }, + "DialogSum--val--130": { + "original_text": "A: What is your favorite kind of music?\nB: I listen to various types of music.\nA: What genres?\nB: I enjoy listening to both Rock and R & [interrupt] B, particularly the way these genres blend soulful melodies with powerful rhythms and often incorporate meaningful lyrics that resonate with personal experiences.\nA: Sorry to jump in, but I'm curious—when you say Rock, are you more into classic rock or modern rock bands?\nB: I'm more into classic rock, but I also appreciate some modern bands. By the way, I was about to mention that I also listen to R & B.\nA: Oh, got it. What interests you in that type of music?\nB: I enjoy the different types of instruments that they use.\nA: That is a perfect reason to like a certain kind of music.\nB: That's exactly what I think too.", + "cleaned_text": "A: What is your favorite kind of music?\nB: I listen to various types of music.\nA: What genres?\nB:I enjoy listening to both Rock and R & B, particularly the way these genres blend soulful melodies with powerful rhythms and often incorporate meaningful lyrics that resonate with personal experiences.\nA: Sorry to jump in, but I'm curious—when you say Rock, are you more into classic rock or modern rock bands?\nB: I'm more into classic rock, but I also appreciate some modern bands. By the way, I was about to mention that I also listen to R & B.\nA: Oh, got it. What interests you in that type of music?\nB: I enjoy the different types of instruments that they use.\nA: That is a perfect reason to like a certain kind of music.\nB: That's exactly what I think too.", + "total_duration": 36.824126984126984, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What is your favorite kind of music?", + "original_text": "What is your favorite kind of music?", + "start_time": 0, + "end_time": 2.0085260770975055, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I listen to various types of music.", + "original_text": "I listen to various types of music.", + "start_time": 2.4182176438361696, + "end_time": 4.357083856988097, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_1_B.wav", + "silence_duration": 0.4096915667386639, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What genres?", + "original_text": "What genres?", + "start_time": 4.722922100610206, + "end_time": 5.593670399929934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_2_A.wav", + "silence_duration": 0.36583824362210904, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I enjoy listening to both Rock and R &", + "original_text": "I enjoy listening to both Rock and R & [interrupt] B, particularly the way these genres blend soulful melodies with powerful rhythms and often incorporate meaningful lyrics that resonate with personal experiences.", + "start_time": 5.898863460918122, + "end_time": 16.614872531212907, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_3_B.wav", + "silence_duration": 0.3051930609881875, + "is_interrupted": true, + "text_after_interrupt": "B, particularly the way these genres blend soulful melodies with powerful rhythms and often incorporate meaningful lyrics that resonate with personal experiences." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I'm curious—when you say Rock, are you more into classic rock or modern rock bands?", + "original_text": "Sorry to jump in, but I'm curious—when you say Rock, are you more into classic rock or modern rock bands?", + "start_time": 8.56915824549862, + "end_time": 15.662854390623338, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_4_A.wav", + "silence_duration": 0.33984288930581863, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm more into classic rock, but I also appreciate some modern bands. By the way, I was about to mention that I also listen to R & B.", + "original_text": "I'm more into classic rock, but I also appreciate some modern bands. By the way, I was about to mention that I also listen to R & B.", + "start_time": 17.16068843277106, + "end_time": 24.010575054086253, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_5_B.wav", + "silence_duration": 0.5458159015581521, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, got it. What interests you in that type of music?", + "original_text": "Oh, got it. What interests you in that type of music?", + "start_time": 24.355711241003036, + "end_time": 27.745824619687845, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_6_A.wav", + "silence_duration": 0.3451361869167835, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I enjoy the different types of instruments that they use.", + "original_text": "I enjoy the different types of instruments that they use.", + "start_time": 28.309718970675178, + "end_time": 30.94518382328289, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_7_B.wav", + "silence_duration": 0.5638943509873346, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That is a perfect reason to like a certain kind of music.", + "original_text": "That is a perfect reason to like a certain kind of music.", + "start_time": 31.452933911022768, + "end_time": 34.75016747111347, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_8_A.wav", + "silence_duration": 0.5077500877398808, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's exactly what I think too.", + "original_text": "That's exactly what I think too.", + "start_time": 35.09426760843166, + "end_time": 36.82415422974685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--130/temp/line_9_B.wav", + "silence_duration": 0.344100137318185, + "is_interrupted": false + } + ] + }, + "DialogSum--val--132": { + "original_text": "A: What seems to be the problem? \nB: I have a really bad toothache! My cheek is swollen and I can't eat [interrupt] anything without feeling a sharp pain that radiates all the way to my ear and makes it difficult to even drink water comfortably. \nA: Swollen? That sounds serious. Let's have a look. Mmmm. This doesn't look too good. I think we may have to pull out your wisdom tooth. It's pressing against your molars and that's one of the reasons you are experiencing so much pain. \nB: When you pull my tooth will you also have to extract the nerve and the root? I'm really worried about the pain afterwards. \nA: Before we get into that, we should take some x-rays to see exactly what we're dealing with. I also noticed a small cavity up front here, so you're going to need a filling as well. \nB: Oh, I see. I guess that's what I get for not flossing or brushing my teeth three times a day. But about the nerve and root, will you have to extract them too?", + "cleaned_text": "A: What seems to be the problem? \nB:I have a really bad toothache! My cheek is swollen and I can't eat anything without feeling a sharp pain that radiates all the way to my ear and makes it difficult to even drink water comfortably.\nA: Swollen? That sounds serious. Let's have a look. Mmmm. This doesn't look too good. I think we may have to pull out your wisdom tooth. It's pressing against your molars and that's one of the reasons you are experiencing so much pain. \nB: When you pull my tooth will you also have to extract the nerve and the root? I'm really worried about the pain afterwards. \nA: Before we get into that, we should take some x-rays to see exactly what we're dealing with. I also noticed a small cavity up front here, so you're going to need a filling as well. \nB: Oh, I see. I guess that's what I get for not flossing or brushing my teeth three times a day. But about the nerve and root, will you have to extract them too?", + "total_duration": 46.25927437641723, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What seems to be the problem?", + "original_text": "What seems to be the problem?", + "start_time": 0, + "end_time": 1.5325170068027212, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have a really bad toothache! My cheek is swollen and I can't eat", + "original_text": "I have a really bad toothache! My cheek is swollen and I can't eat [interrupt] anything without feeling a sharp pain that radiates all the way to my ear and makes it difficult to even drink water comfortably.", + "start_time": 2.017326701385192, + "end_time": 11.909027381657301, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/temp/line_1_B.wav", + "silence_duration": 0.4848096945824708, + "is_interrupted": true, + "text_after_interrupt": "anything without feeling a sharp pain that radiates all the way to my ear and makes it difficult to even drink water comfortably." + }, + { + "speaker": "A", + "text": "Swollen? That sounds serious. Let's have a look. Mmmm. This doesn't look too good. I think we may have to pull out your wisdom tooth. It's pressing against your molars and that's one of the reasons you are experiencing so much pain.", + "original_text": "Swollen? That sounds serious. Let's have a look. Mmmm. This doesn't look too good. I think we may have to pull out your wisdom tooth. It's pressing against your molars and that's one of the reasons you are experiencing so much pain.", + "start_time": 5.477099944015578, + "end_time": 20.175331236532585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/temp/line_2_A.wav", + "silence_duration": 0.491011052094094, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "When you pull my tooth will you also have to extract the nerve and the root? I'm really worried about the pain afterwards.", + "original_text": "When you pull my tooth will you also have to extract the nerve and the root? I'm really worried about the pain afterwards.", + "start_time": 20.502569635093092, + "end_time": 26.737127458222343, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/temp/line_3_B.wav", + "silence_duration": 0.3272383985605062, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Before we get into that, we should take some x-rays to see exactly what we're dealing with. I also noticed a small cavity up front here, so you're going to need a filling as well.", + "original_text": "Before we get into that, we should take some x-rays to see exactly what we're dealing with. I also noticed a small cavity up front here, so you're going to need a filling as well.", + "start_time": 27.253131671115177, + "end_time": 37.748551172248966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/temp/line_4_A.wav", + "silence_duration": 0.5160042128928362, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I see. I guess that's what I get for not flossing or brushing my teeth three times a day. But about the nerve and root, will you have to extract them too?", + "original_text": "Oh, I see. I guess that's what I get for not flossing or brushing my teeth three times a day. But about the nerve and root, will you have to extract them too?", + "start_time": 38.16716072774325, + "end_time": 46.25931492275459, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--132/temp/line_5_B.wav", + "silence_duration": 0.4186095554942861, + "is_interrupted": false + } + ] + }, + "DialogSum--val--134": { + "original_text": "A: My hand still hurts from the fall on the ice yesterday. I wonder if I broke [interrupt] a bone or just sprained it because the pain seems to be concentrated around my wrist joint and gets worse when I try to move it in certain directions.\nB: Sorry to jump in, but did you notice any swelling or unusual stiffness? That could be a sign of something more serious. \nA: There is some swelling, but it's not black and blue or anything. I was going to say earlier, I might just need to rest it for a few days, but if the swelling doesn't go down, I should probably see a doctor.", + "cleaned_text": "A:My hand still hurts from the fall on the ice yesterday. I wonder if I broke a bone or just sprained it because the pain seems to be concentrated around my wrist joint and gets worse when I try to move it in certain directions.\nB: Sorry to jump in, but did you notice any swelling or unusual stiffness? That could be a sign of something more serious. \nA: There is some swelling, but it's not black and blue or anything. I was going to say earlier, I might just need to rest it for a few days, but if the swelling doesn't go down, I should probably see a doctor.", + "total_duration": 26.542267573696144, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--134/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--134/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--134/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "My hand still hurts from the fall on the ice yesterday. I wonder if I broke", + "original_text": "My hand still hurts from the fall on the ice yesterday. I wonder if I broke [interrupt] a bone or just sprained it because the pain seems to be concentrated around my wrist joint and gets worse when I try to move it in certain directions.", + "start_time": 0, + "end_time": 14.489251700680272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--134/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "a bone or just sprained it because the pain seems to be concentrated around my wrist joint and gets worse when I try to move it in certain directions." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but did you notice any swelling or unusual stiffness? That could be a sign of something more serious.", + "original_text": "Sorry to jump in, but did you notice any swelling or unusual stiffness? That could be a sign of something more serious.", + "start_time": 4.748480725623582, + "end_time": 11.017868480725623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--134/temp/line_1_B.wav", + "silence_duration": 0.5919336156432857, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There is some swelling, but it's not black and blue or anything. I was going to say earlier, I might just need to rest it for a few days, but if the swelling doesn't go down, I should probably see a doctor.", + "original_text": "There is some swelling, but it's not black and blue or anything. I was going to say earlier, I might just need to rest it for a few days, but if the swelling doesn't go down, I should probably see a doctor.", + "start_time": 14.827809646556947, + "end_time": 26.542276766738354, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--134/temp/line_2_A.wav", + "silence_duration": 0.3385579458766745, + "is_interrupted": false + } + ] + }, + "DialogSum--val--135": { + "original_text": "A: Good morning. May I help you? \nB: I'd like to rent a car, please. \nA: Okay. Full-size, mid-size, or compact, madam? \nB: Compact is OK. What's the rate? \nA: 78 dollars a day. \nB: And I'd like to have insurance just in [interrupt] case something unexpected happens during the rental period, especially since I'll be driving in unfamiliar areas where road conditions might be challenging. \nA: Sorry to interrupt, but I just realized—do you have any preference for automatic or manual transmission? \nB: Oh, automatic would be better for me. But as I was saying, I'd like to have insurance just in case. \nA: If you want full coverage insurance, it will be 8 dollars per day. \nB: All right, I'll take that, too. \nA: Here is our brochure, madam. Er... compact... OK. Please choose a model in this section. \nB: How about this one? \nA: All right. How many days would you like to use it? \nB: Just one day. \nA: Oh, and I forgot to ask earlier—did you need any additional equipment, like a GPS or a child seat?", + "cleaned_text": "A: Good morning. May I help you? \nB: I'd like to rent a car, please. \nA: Okay. Full-size, mid-size, or compact, madam? \nB: Compact is OK. What's the rate? \nA: 78 dollars a day. \nB:And I'd like to have insurance just in case something unexpected happens during the rental period, especially since I'll be driving in unfamiliar areas where road conditions might be challenging.\nA: Sorry to interrupt, but I just realized—do you have any preference for automatic or manual transmission? \nB: Oh, automatic would be better for me. But as I was saying, I'd like to have insurance just in case. \nA: If you want full coverage insurance, it will be 8 dollars per day. \nB: All right, I'll take that, too. \nA: Here is our brochure, madam. Er... compact... OK. Please choose a model in this section. \nB: How about this one? \nA: All right. How many days would you like to use it? \nB: Just one day. \nA: Oh, and I forgot to ask earlier—did you need any additional equipment, like a GPS or a child seat?", + "total_duration": 55.3756462585034, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good morning. May I help you?", + "original_text": "Good morning. May I help you?", + "start_time": 0, + "end_time": 1.5789569160997732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like to rent a car, please.", + "original_text": "I'd like to rent a car, please.", + "start_time": 2.0105416094670456, + "end_time": 3.5662785709182927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_1_B.wav", + "silence_duration": 0.4315846933672727, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Okay. Full-size, mid-size, or compact, madam?", + "original_text": "Okay. Full-size, mid-size, or compact, madam?", + "start_time": 4.019380049998345, + "end_time": 8.071262136166146, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_2_A.wav", + "silence_duration": 0.4531014790800518, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Compact is OK. What's the rate?", + "original_text": "Compact is OK. What's the rate?", + "start_time": 8.668263441020141, + "end_time": 10.827719223333066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_3_B.wav", + "silence_duration": 0.5970013048539942, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "78 dollars a day.", + "original_text": "78 dollars a day.", + "start_time": 11.37989568851001, + "end_time": 13.109782309825203, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_4_A.wav", + "silence_duration": 0.5521764651769439, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "And I'd like to have insurance just in", + "original_text": "And I'd like to have insurance just in [interrupt] case something unexpected happens during the rental period, especially since I'll be driving in unfamiliar areas where road conditions might be challenging.", + "start_time": 13.439746590036657, + "end_time": 22.936708041283822, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_5_B.wav", + "silence_duration": 0.329964280211454, + "is_interrupted": true, + "text_after_interrupt": "case something unexpected happens during the rental period, especially since I'll be driving in unfamiliar areas where road conditions might be challenging." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but I just realized—do you have any preference for automatic or manual transmission?", + "original_text": "Sorry to interrupt, but I just realized—do you have any preference for automatic or manual transmission?", + "start_time": 15.4366626898099, + "end_time": 21.69444046758768, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_6_A.wav", + "silence_duration": 0.3686332838705165, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, automatic would be better for me. But as I was saying, I'd like to have insurance just in case.", + "original_text": "Oh, automatic would be better for me. But as I was saying, I'd like to have insurance just in case.", + "start_time": 23.29034385493621, + "end_time": 28.28263410436932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_7_B.wav", + "silence_duration": 0.35363581365238866, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "If you want full coverage insurance, it will be 8 dollars per day.", + "original_text": "If you want full coverage insurance, it will be 8 dollars per day.", + "start_time": 28.733171887403063, + "end_time": 33.028863497380385, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_8_A.wav", + "silence_duration": 0.4505377830337461, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right, I'll take that, too.", + "original_text": "All right, I'll take that, too.", + "start_time": 33.44510286988963, + "end_time": 35.0240597859894, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_9_B.wav", + "silence_duration": 0.4162393725092443, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Here is our brochure, madam. Er... compact... OK. Please choose a model in this section.", + "original_text": "Here is our brochure, madam. Er... compact... OK. Please choose a model in this section.", + "start_time": 35.45503062740188, + "end_time": 41.07425965234519, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_10_A.wav", + "silence_duration": 0.43097084141247977, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How about this one?", + "original_text": "How about this one?", + "start_time": 41.488446089549306, + "end_time": 42.521734071408716, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_11_B.wav", + "silence_duration": 0.41418643720411513, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "All right. How many days would you like to use it?", + "original_text": "All right. How many days would you like to use it?", + "start_time": 43.0579128508204, + "end_time": 46.413196297532416, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_12_A.wav", + "silence_duration": 0.5361787794116855, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just one day.", + "original_text": "Just one day.", + "start_time": 47.009301503493745, + "end_time": 47.96131964408332, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_13_B.wav", + "silence_duration": 0.5961052059613312, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, and I forgot to ask earlier—did you need any additional equipment, like a GPS or a child seat?", + "original_text": "Oh, and I forgot to ask earlier—did you need any additional equipment, like a GPS or a child seat?", + "start_time": 48.316815881472664, + "end_time": 55.375682094624594, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--135/temp/line_14_A.wav", + "silence_duration": 0.35549623738934477, + "is_interrupted": false + } + ] + }, + "DialogSum--val--136": { + "original_text": "A: Maria, I know you've arrived here only recently. Can you tell me if there is anything that has surprised you about British people? \nB: People here are more serious than that in Spain. Spanish people are lazy but fun to be with. Also, before I came to England, people told me that the English are very polite. It is known internationally. But I don't think it is always as genuine as people might expect. Sometimes, it feels more like a formality rather than true kindness, [interrupt] especially when compared to the spontaneous warmth and hospitality I've experienced in Mediterranean cultures where people seem to genuinely care about your wellbeing without any pretense or social obligation. \nA: Sorry to jump in, but could you explain what you mean by \"real politeness\"? I'm curious about how it's different from what you've experienced here. \nB: Sure, what I meant is that real politeness goes beyond just using words like please, thank you, sorry, and excuse me. It's more about genuine consideration and warmth. By the way, I didn't get to finish earlier—what I was going to say is that I don't think it is true that all British people are as polite as their reputation suggests.", + "cleaned_text": "A: Maria, I know you've arrived here only recently. Can you tell me if there is anything that has surprised you about British people? \nB:People here are more serious than that in Spain. Spanish people are lazy but fun to be with. Also, before I came to England, people told me that the English are very polite. It is known internationally. But I don't think it is always as genuine as people might expect. Sometimes, it feels more like a formality rather than true kindness, especially when compared to the spontaneous warmth and hospitality I've experienced in Mediterranean cultures where people seem to genuinely care about your wellbeing without any pretense or social obligation.\nA: Sorry to jump in, but could you explain what you mean by \"real politeness\"? I'm curious about how it's different from what you've experienced here. \nB: Sure, what I meant is that real politeness goes beyond just using words like please, thank you, sorry, and excuse me. It's more about genuine consideration and warmth. By the way, I didn't get to finish earlier—what I was going to say is that I don't think it is true that all British people are as polite as their reputation suggests.", + "total_duration": 53.83954648526077, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--136/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--136/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--136/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Maria, I know you've arrived here only recently. Can you tell me if there is anything that has surprised you about British people?", + "original_text": "Maria, I know you've arrived here only recently. Can you tell me if there is anything that has surprised you about British people?", + "start_time": 0, + "end_time": 6.977596371882086, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--136/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "People here are more serious than that in Spain. Spanish people are lazy but fun to be with. Also, before I came to England, people told me that the English are very polite. It is known internationally. But I don't think it is always as genuine as people might expect. Sometimes, it feels more like a formality rather than true kindness,", + "original_text": "People here are more serious than that in Spain. Spanish people are lazy but fun to be with. Also, before I came to England, people told me that the English are very polite. It is known internationally. But I don't think it is always as genuine as people might expect. Sometimes, it feels more like a formality rather than true kindness, [interrupt] especially when compared to the spontaneous warmth and hospitality I've experienced in Mediterranean cultures where people seem to genuinely care about your wellbeing without any pretense or social obligation.", + "start_time": 7.3075534793680115, + "end_time": 35.56623828662425, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--136/temp/line_1_B.wav", + "silence_duration": 0.3299571074859252, + "is_interrupted": true, + "text_after_interrupt": "especially when compared to the spontaneous warmth and hospitality I've experienced in Mediterranean cultures where people seem to genuinely care about your wellbeing without any pretense or social obligation." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but could you explain what you mean by \"real politeness\"? I'm curious about how it's different from what you've experienced here.", + "original_text": "Sorry to jump in, but could you explain what you mean by \"real politeness\"? I'm curious about how it's different from what you've experienced here.", + "start_time": 25.279798377327193, + "end_time": 33.731861869390684, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--136/temp/line_2_A.wav", + "silence_duration": 0.44663854862556485, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, what I meant is that real politeness goes beyond just using words like please, thank you, sorry, and excuse me. It's more about genuine consideration and warmth. By the way, I didn't get to finish earlier—what I was going to say is that I don't think it is true that all British people are as polite as their reputation suggests.", + "original_text": "Sure, what I meant is that real politeness goes beyond just using words like please, thank you, sorry, and excuse me. It's more about genuine consideration and warmth. By the way, I didn't get to finish earlier—what I was going to say is that I don't think it is true that all British people are as polite as their reputation suggests.", + "start_time": 36.11111178912789, + "end_time": 53.839547163277544, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--136/temp/line_3_B.wav", + "silence_duration": 0.544873502503638, + "is_interrupted": false + } + ] + }, + "DialogSum--val--138": { + "original_text": "A: Did you see today's newspaper? That building over there in Centerville was just struck by lightning for the fourth [interrupt] time this year, which is statistically extremely unusual given the average lightning strike frequency in our region. It's becoming a bit of a mystery.\nB: Wow, for the fourth time? That sounds like a real hotspot for lightning strikes. Do they know why it keeps happening?\nA: I'm not surprised. If the conditions for lightning to strike are right one time, they might be as good another time. But I was about to mention that I don't take any chances. If I'm caught in a thunderstorm, I will look for a building or a closed car. Also, I was told that if you're stuck outdoors, the best thing you can do is to keep yourself close to the ground and avoid bodies of water.\nB: That's good advice. You know, I actually avoid using any electrical devices during a storm. I don't even take baths or showers. Maybe I'm a bit too [interrupt] cautious, but I'd rather be overly careful than risk it, especially after hearing about all these documented cases of people getting injured through household appliances during thunderstorms.\nA: Anxious? No, I totally get it. It's better to be safe than sorry. But I was curious, do you also avoid using your phone during a storm?", + "cleaned_text": "A:Did you see today's newspaper? That building over there in Centerville was just struck by lightning for the fourth time this year, which is statistically extremely unusual given the average lightning strike frequency in our region. It's becoming a bit of a mystery.\nB: Wow, for the fourth time? That sounds like a real hotspot for lightning strikes. Do they know why it keeps happening?\nA: I'm not surprised. If the conditions for lightning to strike are right one time, they might be as good another time. But I was about to mention that I don't take any chances. If I'm caught in a thunderstorm, I will look for a building or a closed car. Also, I was told that if you're stuck outdoors, the best thing you can do is to keep yourself close to the ground and avoid bodies of water.\nB:That's good advice. You know, I actually avoid using any electrical devices during a storm. I don't even take baths or showers. Maybe I'm a bit too cautious, but I'd rather be overly careful than risk it, especially after hearing about all these documented cases of people getting injured through household appliances during thunderstorms.\nA: Anxious? No, I totally get it. It's better to be safe than sorry. But I was curious, do you also avoid using your phone during a storm?", + "total_duration": 62.436780045351476, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Did you see today's newspaper? That building over there in Centerville was just struck by lightning for the fourth", + "original_text": "Did you see today's newspaper? That building over there in Centerville was just struck by lightning for the fourth [interrupt] time this year, which is statistically extremely unusual given the average lightning strike frequency in our region. It's becoming a bit of a mystery.", + "start_time": 0, + "end_time": 15.011700680272108, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "time this year, which is statistically extremely unusual given the average lightning strike frequency in our region. It's becoming a bit of a mystery." + }, + { + "speaker": "B", + "text": "Wow, for the fourth time? That sounds like a real hotspot for lightning strikes. Do they know why it keeps happening?", + "original_text": "Wow, for the fourth time? That sounds like a real hotspot for lightning strikes. Do they know why it keeps happening?", + "start_time": 6.629297052154195, + "end_time": 12.620045351473923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/temp/line_1_B.wav", + "silence_duration": 0.3936384304381987, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm not surprised. If the conditions for lightning to strike are right one time, they might be as good another time. But I was about to mention that I don't take any chances. If I'm caught in a thunderstorm, I will look for a building or a closed car. Also, I was told that if you're stuck outdoors, the best thing you can do is to keep yourself close to the ground and avoid bodies of water.", + "original_text": "I'm not surprised. If the conditions for lightning to strike are right one time, they might be as good another time. But I was about to mention that I don't take any chances. If I'm caught in a thunderstorm, I will look for a building or a closed car. Also, I was told that if you're stuck outdoors, the best thing you can do is to keep yourself close to the ground and avoid bodies of water.", + "start_time": 15.48713464035514, + "end_time": 37.76668112561591, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/temp/line_2_A.wav", + "silence_duration": 0.47543396008303296, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's good advice. You know, I actually avoid using any electrical devices during a storm. I don't even take baths or showers. Maybe I'm a bit too", + "original_text": "That's good advice. You know, I actually avoid using any electrical devices during a storm. I don't even take baths or showers. Maybe I'm a bit too [interrupt] cautious, but I'd rather be overly careful than risk it, especially after hearing about all these documented cases of people getting injured through household appliances during thunderstorms.", + "start_time": 38.27873142358377, + "end_time": 55.415057954196016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/temp/line_3_B.wav", + "silence_duration": 0.512050297967861, + "is_interrupted": true, + "text_after_interrupt": "cautious, but I'd rather be overly careful than risk it, especially after hearing about all these documented cases of people getting injured through household appliances during thunderstorms." + }, + { + "speaker": "A", + "text": "Anxious? No, I totally get it. It's better to be safe than sorry. But I was curious, do you also avoid using your phone during a storm?", + "original_text": "Anxious? No, I totally get it. It's better to be safe than sorry. But I was curious, do you also avoid using your phone during a storm?", + "start_time": 52.9282306546987, + "end_time": 62.43680208327013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--138/temp/line_4_A.wav", + "silence_duration": 0.5325514605902028, + "is_interrupted": false + } + ] + }, + "DialogSum--val--140": { + "original_text": "A: Hi. I think I'm sitting next to you. Seat 35B. \nB: Oh, sorry. I'll just move my things. Hold on a minute. \nA: Thanks. Phwoo...I've been waiting in departure for ages. \nB: Mmm...The flight was delayed leaving Beijing. Security checks, you [interrupt] really have to be patient with them, but they were extra strict today because of some heightened security alerts about potential threats on international flights. \nA: Sorry to cut in, but those security checks were a nightmare, weren't they? I almost missed the flight because of them. \nB: Yeah, they were really thorough. So, are you going to London, then? \nA: Yes. I'm going to the LSE to do a master's degree in International Relations. \nB: Really? That sounds interesting. You must be really clever. \nA: So are you going to London too? \nB: Well actually, I'm going to the University of Middlesex to do Business Studies. \nA: That sounds interesting. \nB: Well actually, it's my parents who want me to do Business Studies. I'd rather study Philosophy, but my dad [interrupt] thinks it's not practical and won't lead to a stable career despite the fact that many philosophy graduates go on to have successful careers in law, politics, and even business consulting. \nA: Philosophy? That's fascinating! What draws you to Philosophy over Business Studies? \nB: I just find it more fulfilling, you know? But my dad wants me to take over the family business. He thinks Business Studies will make me rich.", + "cleaned_text": "A: Hi. I think I'm sitting next to you. Seat 35B. \nB: Oh, sorry. I'll just move my things. Hold on a minute. \nA: Thanks. Phwoo...I've been waiting in departure for ages. \nB:Mmm...The flight was delayed leaving Beijing. Security checks, you really have to be patient with them, but they were extra strict today because of some heightened security alerts about potential threats on international flights.\nA: Sorry to cut in, but those security checks were a nightmare, weren't they? I almost missed the flight because of them. \nB: Yeah, they were really thorough. So, are you going to London, then? \nA: Yes. I'm going to the LSE to do a master's degree in International Relations. \nB: Really? That sounds interesting. You must be really clever. \nA: So are you going to London too? \nB: Well actually, I'm going to the University of Middlesex to do Business Studies. \nA: That sounds interesting. \nB:Well actually, it's my parents who want me to do Business Studies. I'd rather study Philosophy, but my dad thinks it's not practical and won't lead to a stable career despite the fact that many philosophy graduates go on to have successful careers in law, politics, and even business consulting.\nA: Philosophy? That's fascinating! What draws you to Philosophy over Business Studies? \nB: I just find it more fulfilling, you know? But my dad wants me to take over the family business. He thinks Business Studies will make me rich.", + "total_duration": 71.52748299319728, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi. I think I'm sitting next to you. Seat 35B.", + "original_text": "Hi. I think I'm sitting next to you. Seat 35B.", + "start_time": 0, + "end_time": 3.93578231292517, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, sorry. I'll just move my things. Hold on a minute.", + "original_text": "Oh, sorry. I'll just move my things. Hold on a minute.", + "start_time": 4.312073252254335, + "end_time": 6.924318150213518, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_1_B.wav", + "silence_duration": 0.3762909393291648, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks. Phwoo...I've been waiting in departure for ages.", + "original_text": "Thanks. Phwoo...I've been waiting in departure for ages.", + "start_time": 7.370691223643924, + "end_time": 11.085883967408096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_2_A.wav", + "silence_duration": 0.44637307343040566, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Mmm...The flight was delayed leaving Beijing. Security checks, you", + "original_text": "Mmm...The flight was delayed leaving Beijing. Security checks, you [interrupt] really have to be patient with them, but they were extra strict today because of some heightened security alerts about potential threats on international flights.", + "start_time": 11.508882030214163, + "end_time": 23.38588883293525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_3_B.wav", + "silence_duration": 0.42299806280606767, + "is_interrupted": true, + "text_after_interrupt": "really have to be patient with them, but they were extra strict today because of some heightened security alerts about potential threats on international flights." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but those security checks were a nightmare, weren't they? I almost missed the flight because of them.", + "original_text": "Sorry to cut in, but those security checks were a nightmare, weren't they? I almost missed the flight because of them.", + "start_time": 15.583984071030489, + "end_time": 22.259721032481735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_4_A.wav", + "silence_duration": 0.32280626002545515, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, they were really thorough. So, are you going to London, then?", + "original_text": "Yeah, they were really thorough. So, are you going to London, then?", + "start_time": 23.95436536593227, + "end_time": 27.367698699265603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_5_B.wav", + "silence_duration": 0.5684765329970161, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes. I'm going to the LSE to do a master's degree in International Relations.", + "original_text": "Yes. I'm going to the LSE to do a master's degree in International Relations.", + "start_time": 27.796414330992334, + "end_time": 33.47369324255696, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_6_A.wav", + "silence_duration": 0.428715631726731, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Really? That sounds interesting. You must be really clever.", + "original_text": "Really? That sounds interesting. You must be really clever.", + "start_time": 33.77394977265675, + "end_time": 37.29177290190845, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_7_B.wav", + "silence_duration": 0.3002565300997882, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So are you going to London too?", + "original_text": "So are you going to London too?", + "start_time": 37.66365012700703, + "end_time": 39.39353674832223, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_8_A.wav", + "silence_duration": 0.37187722509857774, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well actually, I'm going to the University of Middlesex to do Business Studies.", + "original_text": "Well actually, I'm going to the University of Middlesex to do Business Studies.", + "start_time": 39.915606415814054, + "end_time": 43.967488501981855, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_9_B.wav", + "silence_duration": 0.5220696674918298, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds interesting.", + "original_text": "That sounds interesting.", + "start_time": 44.453970262082706, + "end_time": 46.00970722353395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_10_A.wav", + "silence_duration": 0.48648176010085126, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well actually, it's my parents who want me to do Business Studies. I'd rather study Philosophy, but my dad", + "original_text": "Well actually, it's my parents who want me to do Business Studies. I'd rather study Philosophy, but my dad [interrupt] thinks it's not practical and won't lead to a stable career despite the fact that many philosophy graduates go on to have successful careers in law, politics, and even business consulting.", + "start_time": 46.54549631893995, + "end_time": 61.35982738469959, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_11_B.wav", + "silence_duration": 0.5357890954060056, + "is_interrupted": true, + "text_after_interrupt": "thinks it's not practical and won't lead to a stable career despite the fact that many philosophy graduates go on to have successful careers in law, politics, and even business consulting." + }, + { + "speaker": "A", + "text": "Philosophy? That's fascinating! What draws you to Philosophy over Business Studies?", + "original_text": "Philosophy? That's fascinating! What draws you to Philosophy over Business Studies?", + "start_time": 58.70347178194109, + "end_time": 63.93957155518372, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_12_A.wav", + "silence_duration": 0.5757989961211427, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I just find it more fulfilling, you know? But my dad wants me to take over the family business. He thinks Business Studies will make me rich.", + "original_text": "I just find it more fulfilling, you know? But my dad wants me to take over the family business. He thinks Business Studies will make me rich.", + "start_time": 64.46863186771019, + "end_time": 71.52749808086212, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--140/temp/line_13_B.wav", + "silence_duration": 0.5290603125264688, + "is_interrupted": false + } + ] + }, + "DialogSum--val--141": { + "original_text": "A: I'm sure it will be wet when we arrive. \nB: Yes. I dare say it will be. \nA: It will be Sunday so I expected everything will be [interrupt] closed, especially the smaller shops and local businesses, which typically observe the day of rest more strictly than larger chain stores and supermarkets. \nB: Sorry, but are you sure everything will be closed? I mean, some places are sure to be open, right? \nA: No. I don't think that's possible. But the bank should be closed, so we shouldn't be able to get any money. \nB: Mmm, you may be right. Do you think we'll need our overcoats? \nA: No. We couldn't possibly. \nB: Why not? \nA: It will be summer. So it will be [interrupt] warm enough to not need them, though we might want to bring a light jacket just in case the evenings turn unexpectedly chilly or if we encounter some rain showers. \nB: Wait, did you mean it's unlikely to be hot in England during summer? \nA: Oh, I was just about to say it will be hot. But yes, in England, it could happen.", + "cleaned_text": "A: I'm sure it will be wet when we arrive. \nB: Yes. I dare say it will be. \nA:It will be Sunday so I expected everything will be closed, especially the smaller shops and local businesses, which typically observe the day of rest more strictly than larger chain stores and supermarkets.\nB: Sorry, but are you sure everything will be closed? I mean, some places are sure to be open, right? \nA: No. I don't think that's possible. But the bank should be closed, so we shouldn't be able to get any money. \nB: Mmm, you may be right. Do you think we'll need our overcoats? \nA: No. We couldn't possibly. \nB: Why not? \nA:It will be summer. So it will be warm enough to not need them, though we might want to bring a light jacket just in case the evenings turn unexpectedly chilly or if we encounter some rain showers.\nB: Wait, did you mean it's unlikely to be hot in England during summer? \nA: Oh, I was just about to say it will be hot. But yes, in England, it could happen.", + "total_duration": 49.53297052154195, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm sure it will be wet when we arrive.", + "original_text": "I'm sure it will be wet when we arrive.", + "start_time": 0, + "end_time": 2.2755555555555556, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. I dare say it will be.", + "original_text": "Yes. I dare say it will be.", + "start_time": 2.731052021561026, + "end_time": 4.368058824282114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_1_B.wav", + "silence_duration": 0.4554964660054702, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It will be Sunday so I expected everything will be", + "original_text": "It will be Sunday so I expected everything will be [interrupt] closed, especially the smaller shops and local businesses, which typically observe the day of rest more strictly than larger chain stores and supermarkets.", + "start_time": 4.929522350615214, + "end_time": 17.72371736195308, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_2_A.wav", + "silence_duration": 0.5614635263330998, + "is_interrupted": true, + "text_after_interrupt": "closed, especially the smaller shops and local businesses, which typically observe the day of rest more strictly than larger chain stores and supermarkets." + }, + { + "speaker": "B", + "text": "Sorry, but are you sure everything will be closed? I mean, some places are sure to be open, right?", + "original_text": "Sorry, but are you sure everything will be closed? I mean, some places are sure to be open, right?", + "start_time": 7.58820715787145, + "end_time": 13.35836588803018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_3_B.wav", + "silence_duration": 0.38978002750622076, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No. I don't think that's possible. But the bank should be closed, so we shouldn't be able to get any money.", + "original_text": "No. I don't think that's possible. But the bank should be closed, so we shouldn't be able to get any money.", + "start_time": 18.290527044379996, + "end_time": 24.18839552510562, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_4_A.wav", + "silence_duration": 0.5668096824269133, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Mmm, you may be right. Do you think we'll need our overcoats?", + "original_text": "Mmm, you may be right. Do you think we'll need our overcoats?", + "start_time": 24.681733838038546, + "end_time": 27.87447760221088, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_5_B.wav", + "silence_duration": 0.4933383129329262, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No. We couldn't possibly.", + "original_text": "No. We couldn't possibly.", + "start_time": 28.275322500965206, + "end_time": 30.086478963550242, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_6_A.wav", + "silence_duration": 0.4008448987543258, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why not?", + "original_text": "Why not?", + "start_time": 30.617482366891366, + "end_time": 31.337300960995673, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_7_B.wav", + "silence_duration": 0.5310034033411236, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It will be summer. So it will be", + "original_text": "It will be summer. So it will be [interrupt] warm enough to not need them, though we might want to bring a light jacket just in case the evenings turn unexpectedly chilly or if we encounter some rain showers.", + "start_time": 31.904941391637905, + "end_time": 43.36398901068552, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_8_A.wav", + "silence_duration": 0.5676404306422322, + "is_interrupted": true, + "text_after_interrupt": "warm enough to not need them, though we might want to bring a light jacket just in case the evenings turn unexpectedly chilly or if we encounter some rain showers." + }, + { + "speaker": "B", + "text": "Wait, did you mean it's unlikely to be hot in England during summer?", + "original_text": "Wait, did you mean it's unlikely to be hot in England during summer?", + "start_time": 40.07179644183188, + "end_time": 43.70571934432621, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_9_B.wav", + "silence_duration": 0.46127943630328544, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was just about to say it will be hot. But yes, in England, it could happen.", + "original_text": "Oh, I was just about to say it will be hot. But yes, in England, it could happen.", + "start_time": 44.05307119573612, + "end_time": 49.532980492788276, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--141/temp/line_10_A.wav", + "silence_duration": 0.3473518514099111, + "is_interrupted": false + } + ] + }, + "DialogSum--val--142": { + "original_text": "A: Are you an art aficionado? \nB: Not really. I like going to an art exhibition once or twice a year. I hardly know anything about art or sculpture. You are a true art lover, aren't [interrupt] you? You seem to have a deep appreciation for different art forms and can probably discuss the nuances of various artistic movements with great insight. \nA: Sorry to jump in, but I just remembered—do you usually visit exhibitions alone, or do you go with friends? \nB: I usually go alone, but sometimes I go with friends who share the same interest. I love going to art galleries, particularly when one is holding an exhibition of abstract art. \nA: I never understand the meaning of those paintings. They are too abstract for me. I didn't pay much attention in art class at school. \nB: Art isn't for everyone. I'm going to an exhibition tomorrow at the national gallery. It's an exhibition of Greek and Roman sculpture. \nA: I like sculpture, especially that from ancient Rome or Greece. What time are you thinking of going? I'd love to go with you. \nB: I thought I'd have an early lunch and go immediately afterwards. Does that sound ok to you? Bus 51 goes directly [interrupt] to the gallery from the central station, and it has a special route that avoids most of the downtown traffic during midday hours. \nA: Oh, speaking of the bus, do you know if it's usually crowded around that time? \nB: Good point, it can be. But I was saying that Bus 51 goes directly there. What time shall we meet at the bus stop?", + "cleaned_text": "A: Are you an art aficionado? \nB:Not really. I like going to an art exhibition once or twice a year. I hardly know anything about art or sculpture. You are a true art lover, aren't you? You seem to have a deep appreciation for different art forms and can probably discuss the nuances of various artistic movements with great insight.\nA: Sorry to jump in, but I just remembered—do you usually visit exhibitions alone, or do you go with friends? \nB: I usually go alone, but sometimes I go with friends who share the same interest. I love going to art galleries, particularly when one is holding an exhibition of abstract art. \nA: I never understand the meaning of those paintings. They are too abstract for me. I didn't pay much attention in art class at school. \nB: Art isn't for everyone. I'm going to an exhibition tomorrow at the national gallery. It's an exhibition of Greek and Roman sculpture. \nA: I like sculpture, especially that from ancient Rome or Greece. What time are you thinking of going? I'd love to go with you. \nB:I thought I'd have an early lunch and go immediately afterwards. Does that sound ok to you? Bus 51 goes directly to the gallery from the central station, and it has a special route that avoids most of the downtown traffic during midday hours.\nA: Oh, speaking of the bus, do you know if it's usually crowded around that time? \nB: Good point, it can be. But I was saying that Bus 51 goes directly there. What time shall we meet at the bus stop?", + "total_duration": 76.03687074829932, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you an art aficionado?", + "original_text": "Are you an art aficionado?", + "start_time": 0, + "end_time": 1.7298866213151927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not really. I like going to an art exhibition once or twice a year. I hardly know anything about art or sculpture. You are a true art lover, aren't", + "original_text": "Not really. I like going to an art exhibition once or twice a year. I hardly know anything about art or sculpture. You are a true art lover, aren't [interrupt] you? You seem to have a deep appreciation for different art forms and can probably discuss the nuances of various artistic movements with great insight.", + "start_time": 2.163099315453045, + "end_time": 18.219697954908828, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_1_B.wav", + "silence_duration": 0.43321269413785246, + "is_interrupted": true, + "text_after_interrupt": "you? You seem to have a deep appreciation for different art forms and can probably discuss the nuances of various artistic movements with great insight." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I just remembered—do you usually visit exhibitions alone, or do you go with friends?", + "original_text": "Sorry to jump in, but I just remembered—do you usually visit exhibitions alone, or do you go with friends?", + "start_time": 10.05788389595191, + "end_time": 16.62913106148479, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_2_A.wav", + "silence_duration": 0.545215828417374, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I usually go alone, but sometimes I go with friends who share the same interest. I love going to art galleries, particularly when one is holding an exhibition of abstract art.", + "original_text": "I usually go alone, but sometimes I go with friends who share the same interest. I love going to art galleries, particularly when one is holding an exhibition of abstract art.", + "start_time": 18.68504977273139, + "end_time": 27.404142743252933, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_3_B.wav", + "silence_duration": 0.4653518178225618, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I never understand the meaning of those paintings. They are too abstract for me. I didn't pay much attention in art class at school.", + "original_text": "I never understand the meaning of those paintings. They are too abstract for me. I didn't pay much attention in art class at school.", + "start_time": 27.907432867317397, + "end_time": 35.63967776527658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_4_A.wav", + "silence_duration": 0.5032901240644645, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Art isn't for everyone. I'm going to an exhibition tomorrow at the national gallery. It's an exhibition of Greek and Roman sculpture.", + "original_text": "Art isn't for everyone. I'm going to an exhibition tomorrow at the national gallery. It's an exhibition of Greek and Roman sculpture.", + "start_time": 35.988151353346716, + "end_time": 42.9657477252288, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_5_B.wav", + "silence_duration": 0.3484735880701369, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I like sculpture, especially that from ancient Rome or Greece. What time are you thinking of going? I'd love to go with you.", + "original_text": "I like sculpture, especially that from ancient Rome or Greece. What time are you thinking of going? I'd love to go with you.", + "start_time": 43.514949091424256, + "end_time": 50.91050464697981, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_6_A.wav", + "silence_duration": 0.5492013661954565, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I thought I'd have an early lunch and go immediately afterwards. Does that sound ok to you? Bus 51 goes directly", + "original_text": "I thought I'd have an early lunch and go immediately afterwards. Does that sound ok to you? Bus 51 goes directly [interrupt] to the gallery from the central station, and it has a special route that avoids most of the downtown traffic during midday hours.", + "start_time": 51.38607602104491, + "end_time": 64.14544110040998, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_7_B.wav", + "silence_duration": 0.47557137406509487, + "is_interrupted": true, + "text_after_interrupt": "to the gallery from the central station, and it has a special route that avoids most of the downtown traffic during midday hours." + }, + { + "speaker": "A", + "text": "Oh, speaking of the bus, do you know if it's usually crowded around that time?", + "original_text": "Oh, speaking of the bus, do you know if it's usually crowded around that time?", + "start_time": 64.36649911944622, + "end_time": 69.57937893804032, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_8_A.wav", + "silence_duration": 0.46202780923221815, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good point, it can be. But I was saying that Bus 51 goes directly there. What time shall we meet at the bus stop?", + "original_text": "Good point, it can be. But I was saying that Bus 51 goes directly there. What time shall we meet at the bus stop?", + "start_time": 70.057769465333, + "end_time": 76.03690778732846, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--142/temp/line_9_B.wav", + "silence_duration": 0.4783905272926682, + "is_interrupted": false + } + ] + }, + "DialogSum--val--143": { + "original_text": "A: Let's call it a day. \nB: It's nice to go home earlier once in a while. But it's the evening [interrupt] rush hour and I was hoping to catch up on some reading before it gets too late, though I might need to adjust my plans depending on how long the commute takes tonight. \nA: Sorry to interrupt, but did you check the traffic app? We might want to avoid any major delays. \nB: Oh, good point. I was just about to mention that it's the evening rush, and it's hard to find a clear route home without getting stuck in traffic [interrupt] for at least an hour or more, especially with all the road closures and detours happening downtown this week. \nA: Yeah, commuting a long way can be such a pain, especially with all the construction going on lately.", + "cleaned_text": "A: Let's call it a day. \nB:It's nice to go home earlier once in a while. But it's the evening rush hour and I was hoping to catch up on some reading before it gets too late, though I might need to adjust my plans depending on how long the commute takes tonight.\nA: Sorry to interrupt, but did you check the traffic app? We might want to avoid any major delays. \nB:Oh, good point. I was just about to mention that it's the evening rush, and it's hard to find a clear route home without getting stuck in traffic for at least an hour or more, especially with all the road closures and detours happening downtown this week.\nA: Yeah, commuting a long way can be such a pain, especially with all the construction going on lately.", + "total_duration": 33.45192743764172, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Let's call it a day.", + "original_text": "Let's call it a day.", + "start_time": 0, + "end_time": 1.3583673469387756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's nice to go home earlier once in a while. But it's the evening", + "original_text": "It's nice to go home earlier once in a while. But it's the evening [interrupt] rush hour and I was hoping to catch up on some reading before it gets too late, though I might need to adjust my plans depending on how long the commute takes tonight.", + "start_time": 1.7370346982586806, + "end_time": 12.569143541796096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/temp/line_1_B.wav", + "silence_duration": 0.378667351319905, + "is_interrupted": true, + "text_after_interrupt": "rush hour and I was hoping to catch up on some reading before it gets too late, though I might need to adjust my plans depending on how long the commute takes tonight." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but did you check the traffic app? We might want to avoid any major delays.", + "original_text": "Sorry to interrupt, but did you check the traffic app? We might want to avoid any major delays.", + "start_time": 5.196807940889066, + "end_time": 11.512635605288159, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/temp/line_2_A.wav", + "silence_duration": 0.4770660363454462, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, good point. I was just about to mention that it's the evening rush, and it's hard to find a clear route home without getting stuck in traffic", + "original_text": "Oh, good point. I was just about to mention that it's the evening rush, and it's hard to find a clear route home without getting stuck in traffic [interrupt] for at least an hour or more, especially with all the road closures and detours happening downtown this week.", + "start_time": 13.108434330724096, + "end_time": 24.74163160963566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/temp/line_3_B.wav", + "silence_duration": 0.5392907889279989, + "is_interrupted": true, + "text_after_interrupt": "for at least an hour or more, especially with all the road closures and detours happening downtown this week." + }, + { + "speaker": "A", + "text": "Yeah, commuting a long way can be such a pain, especially with all the construction going on lately.", + "original_text": "Yeah, commuting a long way can be such a pain, especially with all the construction going on lately.", + "start_time": 27.217378634755534, + "end_time": 33.451936457884784, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--143/temp/line_4_A.wav", + "silence_duration": 0.5634956928290551, + "is_interrupted": false + } + ] + }, + "DialogSum--val--144": { + "original_text": "A: Can anyone tell me where I can buy the ingredients to make Chinese food? \nB: There is a supermarket in Kensington High Street. I'll come and give you a [interrupt] hand with finding everything you need since I'm quite familiar with their Asian food section and know exactly where to find all the specialty ingredients you're looking for. \nA: Sorry, before you finish—do they stock all the essentials there? I need specific ingredients like Chinese cabbage and pork. \nB: Yes, they do. I was just saying I'll give you a hand. Here, take one of these trolleys. What do you want exactly? \nA: I'm after things to stuff dumplings with, like Chinese cabbage—oh, and pork too. Where's the meat counter? \nB: The fruit and vegetables are over there. The meat counter is just around the corner to the left.", + "cleaned_text": "A: Can anyone tell me where I can buy the ingredients to make Chinese food? \nB:There is a supermarket in Kensington High Street. I'll come and give you a hand with finding everything you need since I'm quite familiar with their Asian food section and know exactly where to find all the specialty ingredients you're looking for.\nA: Sorry, before you finish—do they stock all the essentials there? I need specific ingredients like Chinese cabbage and pork. \nB: Yes, they do. I was just saying I'll give you a hand. Here, take one of these trolleys. What do you want exactly? \nA: I'm after things to stuff dumplings with, like Chinese cabbage—oh, and pork too. Where's the meat counter? \nB: The fruit and vegetables are over there. The meat counter is just around the corner to the left.", + "total_duration": 35.009024943310656, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can anyone tell me where I can buy the ingredients to make Chinese food?", + "original_text": "Can anyone tell me where I can buy the ingredients to make Chinese food?", + "start_time": 0, + "end_time": 3.912562358276644, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There is a supermarket in Kensington High Street. I'll come and give you a", + "original_text": "There is a supermarket in Kensington High Street. I'll come and give you a [interrupt] hand with finding everything you need since I'm quite familiar with their Asian food section and know exactly where to find all the specialty ingredients you're looking for.", + "start_time": 4.490977948335877, + "end_time": 16.12417522724744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/temp/line_1_B.wav", + "silence_duration": 0.5784155900592336, + "is_interrupted": true, + "text_after_interrupt": "hand with finding everything you need since I'm quite familiar with their Asian food section and know exactly where to find all the specialty ingredients you're looking for." + }, + { + "speaker": "A", + "text": "Sorry, before you finish—do they stock all the essentials there? I need specific ingredients like Chinese cabbage and pork.", + "original_text": "Sorry, before you finish—do they stock all the essentials there? I need specific ingredients like Chinese cabbage and pork.", + "start_time": 8.647349830422044, + "end_time": 16.135785204571704, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/temp/line_2_A.wav", + "silence_duration": 0.3627298838508233, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, they do. I was just saying I'll give you a hand. Here, take one of these trolleys. What do you want exactly?", + "original_text": "Yes, they do. I was just saying I'll give you a hand. Here, take one of these trolleys. What do you want exactly?", + "start_time": 16.4608397743367, + "end_time": 22.056848844631485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/temp/line_3_B.wav", + "silence_duration": 0.3250545697649959, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm after things to stuff dumplings with, like Chinese cabbage—oh, and pork too. Where's the meat counter?", + "original_text": "I'm after things to stuff dumplings with, like Chinese cabbage—oh, and pork too. Where's the meat counter?", + "start_time": 22.527481483309483, + "end_time": 29.59795767378567, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/temp/line_4_A.wav", + "silence_duration": 0.47063263867799904, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The fruit and vegetables are over there. The meat counter is just around the corner to the left.", + "original_text": "The fruit and vegetables are over there. The meat counter is just around the corner to the left.", + "start_time": 30.098009940536592, + "end_time": 35.00903034869986, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--144/temp/line_5_B.wav", + "silence_duration": 0.5000522667509215, + "is_interrupted": false + } + ] + }, + "DialogSum--val--145": { + "original_text": "A: Excuse me. Do you think I can get there in time to catch the 11:30 train? \nB: Well, let me see. Now it's 11:00 sharp. It's a long way to go. If I take the shortest route, we may come across a traffic jam. If I take a less heavy route, it will save us 10 or more minutes, but you'll have to pay more. Which do you [interrupt] think would be better for you considering both time efficiency and cost effectiveness in this particular situation? \nA: Are you sure that I can get there in time if we take the less heavy route? \nB: Generally speaking, we can if we go at this speed and nothing unexpected happens. But as I was saying, which do you prefer? \nA: Oh, I think I prefer the less heavy route. How much more do I have to pay? \nB: Compared to the shortest route, you may pay around 5 Euro more. \nA: That's acceptable. No one wants to miss a train. \nB: OK. . . Here we are. We'll turn left at this cross. To go straight ahead is the shortest [interrupt] route, but it might be slower due to traffic congestion during this peak hour, especially with all the construction work happening downtown. \nA: Sorry, just to clarify, the left turn is the less heavy route, right? \nB: Exactly. The straight route is the shortest, but it might be risky with the traffic.", + "cleaned_text": "A: Excuse me. Do you think I can get there in time to catch the 11:30 train? \nB:Well, let me see. Now it's 11:00 sharp. It's a long way to go. If I take the shortest route, we may come across a traffic jam. If I take a less heavy route, it will save us 10 or more minutes, but you'll have to pay more. Which do you think would be better for you considering both time efficiency and cost effectiveness in this particular situation?\nA: Are you sure that I can get there in time if we take the less heavy route? \nB: Generally speaking, we can if we go at this speed and nothing unexpected happens. But as I was saying, which do you prefer? \nA: Oh, I think I prefer the less heavy route. How much more do I have to pay? \nB: Compared to the shortest route, you may pay around 5 Euro more. \nA: That's acceptable. No one wants to miss a train. \nB:OK. . . Here we are. We'll turn left at this cross. To go straight ahead is the shortest route, but it might be slower due to traffic congestion during this peak hour, especially with all the construction work happening downtown.\nA: Sorry, just to clarify, the left turn is the less heavy route, right? \nB: Exactly. The straight route is the shortest, but it might be risky with the traffic.", + "total_duration": 62.49641723356009, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. Do you think I can get there in time to catch the 11:30 train?", + "original_text": "Excuse me. Do you think I can get there in time to catch the 11:30 train?", + "start_time": 0, + "end_time": 4.597551020408163, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, let me see. Now it's 11:00 sharp. It's a long way to go. If I take the shortest route, we may come across a traffic jam. If I take a less heavy route, it will save us 10 or more minutes, but you'll have to pay more. Which do you", + "original_text": "Well, let me see. Now it's 11:00 sharp. It's a long way to go. If I take the shortest route, we may come across a traffic jam. If I take a less heavy route, it will save us 10 or more minutes, but you'll have to pay more. Which do you [interrupt] think would be better for you considering both time efficiency and cost effectiveness in this particular situation?", + "start_time": 5.029981363723378, + "end_time": 23.6175550598685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_1_B.wav", + "silence_duration": 0.4324303433152142, + "is_interrupted": true, + "text_after_interrupt": "think would be better for you considering both time efficiency and cost effectiveness in this particular situation?" + }, + { + "speaker": "A", + "text": "Are you sure that I can get there in time if we take the less heavy route?", + "original_text": "Are you sure that I can get there in time if we take the less heavy route?", + "start_time": 17.580366851251725, + "end_time": 21.550979096149685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_2_A.wav", + "silence_duration": 0.3105066031565129, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Generally speaking, we can if we go at this speed and nothing unexpected happens. But as I was saying, which do you prefer?", + "original_text": "Generally speaking, we can if we go at this speed and nothing unexpected happens. But as I was saying, which do you prefer?", + "start_time": 24.043649219837324, + "end_time": 30.60328640804594, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_3_B.wav", + "silence_duration": 0.4260941599688236, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I think I prefer the less heavy route. How much more do I have to pay?", + "original_text": "Oh, I think I prefer the less heavy route. How much more do I have to pay?", + "start_time": 30.942349043535756, + "end_time": 35.35414042675571, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_4_A.wav", + "silence_duration": 0.3390626354898182, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Compared to the shortest route, you may pay around 5 Euro more.", + "original_text": "Compared to the shortest route, you may pay around 5 Euro more.", + "start_time": 35.9516004049163, + "end_time": 39.864162763192944, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_5_B.wav", + "silence_duration": 0.5974599781605865, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's acceptable. No one wants to miss a train.", + "original_text": "That's acceptable. No one wants to miss a train.", + "start_time": 40.34851261687727, + "end_time": 43.599306267670926, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_6_A.wav", + "silence_duration": 0.4843498536843304, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. . . Here we are. We'll turn left at this cross. To go straight ahead is the shortest", + "original_text": "OK. . . Here we are. We'll turn left at this cross. To go straight ahead is the shortest [interrupt] route, but it might be slower due to traffic congestion during this peak hour, especially with all the construction work happening downtown.", + "start_time": 43.926140438147804, + "end_time": 56.46491594835189, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_7_B.wav", + "silence_duration": 0.32683417047687585, + "is_interrupted": true, + "text_after_interrupt": "route, but it might be slower due to traffic congestion during this peak hour, especially with all the construction work happening downtown." + }, + { + "speaker": "A", + "text": "Sorry, just to clarify, the left turn is the less heavy route, right?", + "original_text": "Sorry, just to clarify, the left turn is the less heavy route, right?", + "start_time": 53.42127604862483, + "end_time": 57.61247786268379, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_8_A.wav", + "silence_duration": 0.3179184129913707, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Exactly. The straight route is the shortest, but it might be risky with the traffic.", + "original_text": "Exactly. The straight route is the shortest, but it might be risky with the traffic.", + "start_time": 58.1659030406875, + "end_time": 62.496424582637616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--145/temp/line_9_B.wav", + "silence_duration": 0.5534251780037116, + "is_interrupted": false + } + ] + }, + "DialogSum--val--146": { + "original_text": "A: Nice to see you again, Mike. How was your trip to China? \nB: It was great. I flew to Beijing with my wife last month and I stayed there for 3 days. There were so many things to see and so many places of interest to visit in Beijing that we really couldn't decide whether to [interrupt] explore more of the city or take a day trip to the nearby Great Wall, especially since both options offered such unique cultural experiences and breathtaking views. \nA: Oh, I've heard Beijing can be overwhelming with so much to do! Did you manage to visit the Great Wall? \nB: Yes, we did! And after Beijing, we also visited Shanghai and Nanjing, each city for 2 days. Finally, we paid a visit to Guilin, where we spent 3 days. They were so beautiful that we were deeply impressed by these cities. \nA: Guilin sounds amazing! But I'm curious, you mentioned you couldn't decide whether to stay in Beijing or... what was the other option?", + "cleaned_text": "A: Nice to see you again, Mike. How was your trip to China? \nB:It was great. I flew to Beijing with my wife last month and I stayed there for 3 days. There were so many things to see and so many places of interest to visit in Beijing that we really couldn't decide whether to explore more of the city or take a day trip to the nearby Great Wall, especially since both options offered such unique cultural experiences and breathtaking views.\nA: Oh, I've heard Beijing can be overwhelming with so much to do! Did you manage to visit the Great Wall? \nB: Yes, we did! And after Beijing, we also visited Shanghai and Nanjing, each city for 2 days. Finally, we paid a visit to Guilin, where we spent 3 days. They were so beautiful that we were deeply impressed by these cities. \nA: Guilin sounds amazing! But I'm curious, you mentioned you couldn't decide whether to stay in Beijing or... what was the other option?", + "total_duration": 44.32371882086168, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Nice to see you again, Mike. How was your trip to China?", + "original_text": "Nice to see you again, Mike. How was your trip to China?", + "start_time": 0, + "end_time": 3.6919727891156464, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It was great. I flew to Beijing with my wife last month and I stayed there for 3 days. There were so many things to see and so many places of interest to visit in Beijing that we really couldn't decide whether to", + "original_text": "It was great. I flew to Beijing with my wife last month and I stayed there for 3 days. There were so many things to see and so many places of interest to visit in Beijing that we really couldn't decide whether to [interrupt] explore more of the city or take a day trip to the nearby Great Wall, especially since both options offered such unique cultural experiences and breathtaking views.", + "start_time": 4.131345260971364, + "end_time": 23.067218276844383, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/temp/line_1_B.wav", + "silence_duration": 0.4393724718557181, + "is_interrupted": true, + "text_after_interrupt": "explore more of the city or take a day trip to the nearby Great Wall, especially since both options offered such unique cultural experiences and breathtaking views." + }, + { + "speaker": "A", + "text": "Oh, I've heard Beijing can be overwhelming with so much to do! Did you manage to visit the Great Wall?", + "original_text": "Oh, I've heard Beijing can be overwhelming with so much to do! Did you manage to visit the Great Wall?", + "start_time": 15.648442766640297, + "end_time": 21.824950703148232, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/temp/line_2_A.wav", + "silence_duration": 0.3930033494468438, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, we did! And after Beijing, we also visited Shanghai and Nanjing, each city for 2 days. Finally, we paid a visit to Guilin, where we spent 3 days. They were so beautiful that we were deeply impressed by these cities.", + "original_text": "Yes, we did! And after Beijing, we also visited Shanghai and Nanjing, each city for 2 days. Finally, we paid a visit to Guilin, where we spent 3 days. They were so beautiful that we were deeply impressed by these cities.", + "start_time": 23.56371029986793, + "end_time": 35.313007352022126, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/temp/line_3_B.wav", + "silence_duration": 0.49649202302355067, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Guilin sounds amazing! But I'm curious, you mentioned you couldn't decide whether to stay in Beijing or... what was the other option?", + "original_text": "Guilin sounds amazing! But I'm curious, you mentioned you couldn't decide whether to stay in Beijing or... what was the other option?", + "start_time": 35.651098382769746, + "end_time": 44.32375144399423, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--146/temp/line_4_A.wav", + "silence_duration": 0.33809103074761976, + "is_interrupted": false + } + ] + }, + "DialogSum--val--147": { + "original_text": "A: That concludes the Consumer Report for tonight. Let's go over now to Jerry Ryan and find out what's happening in the world of sports. Jerry?\nB: Thanks, Sarah. And good evening, sports fans. It was an exciting day in world soccer. Mexico defeated France 7 to 6 in the close game that offered spectators plenty of [interrupt] thrilling moments, especially during the last few minutes when both teams were pushing hard for victory and the crowd was on their feet cheering wildly throughout the entire overtime period.\nA: Sorry to jump in, Jerry, but that Mexico-France score is incredible! Do you think this result could shake up the rankings significantly?\nB: Absolutely, Sarah. This win could definitely impact the rankings. But I was just about to mention the excitement in the Canada-Argentina match, which ended in a tie, 3 to 3. And in a game that's still in progress [interrupt] we might see another upset as Haiti has been showing remarkable defensive skills against Italy's aggressive offense, making this one of the most unpredictable matches of the tournament so far.\nA: Oh, right! You were saying something about another ongoing match—what's the latest on that?\nB: Yes, Italy is leading Haiti 2 to 1, with 30 minutes left to go. It's shaping up to be another thrilling finish!", + "cleaned_text": "A: That concludes the Consumer Report for tonight. Let's go over now to Jerry Ryan and find out what's happening in the world of sports. Jerry?\nB:Thanks, Sarah. And good evening, sports fans. It was an exciting day in world soccer. Mexico defeated France 7 to 6 in the close game that offered spectators plenty of thrilling moments, especially during the last few minutes when both teams were pushing hard for victory and the crowd was on their feet cheering wildly throughout the entire overtime period.\nA: Sorry to jump in, Jerry, but that Mexico-France score is incredible! Do you think this result could shake up the rankings significantly?\nB:Absolutely, Sarah. This win could definitely impact the rankings. But I was just about to mention the excitement in the Canada-Argentina match, which ended in a tie, 3 to 3. And in a game that's still in progress we might see another upset as Haiti has been showing remarkable defensive skills against Italy's aggressive offense, making this one of the most unpredictable matches of the tournament so far.\nA: Oh, right! You were saying something about another ongoing match—what's the latest on that?\nB: Yes, Italy is leading Haiti 2 to 1, with 30 minutes left to go. It's shaping up to be another thrilling finish!", + "total_duration": 62.225804988662134, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "That concludes the Consumer Report for tonight. Let's go over now to Jerry Ryan and find out what's happening in the world of sports. Jerry?", + "original_text": "That concludes the Consumer Report for tonight. Let's go over now to Jerry Ryan and find out what's happening in the world of sports. Jerry?", + "start_time": 0, + "end_time": 8.777142857142858, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks, Sarah. And good evening, sports fans. It was an exciting day in world soccer. Mexico defeated France 7 to 6 in the close game that offered spectators plenty of", + "original_text": "Thanks, Sarah. And good evening, sports fans. It was an exciting day in world soccer. Mexico defeated France 7 to 6 in the close game that offered spectators plenty of [interrupt] thrilling moments, especially during the last few minutes when both teams were pushing hard for victory and the crowd was on their feet cheering wildly throughout the entire overtime period.", + "start_time": 9.309879060144235, + "end_time": 28.408291758556935, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/temp/line_1_B.wav", + "silence_duration": 0.5327362030013767, + "is_interrupted": true, + "text_after_interrupt": "thrilling moments, especially during the last few minutes when both teams were pushing hard for victory and the crowd was on their feet cheering wildly throughout the entire overtime period." + }, + { + "speaker": "A", + "text": "Sorry to jump in, Jerry, but that Mexico-France score is incredible! Do you think this result could shake up the rankings significantly?", + "original_text": "Sorry to jump in, Jerry, but that Mexico-France score is incredible! Do you think this result could shake up the rankings significantly?", + "start_time": 18.980990171255346, + "end_time": 26.933824638375526, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/temp/line_2_A.wav", + "silence_duration": 0.5544553253162495, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Absolutely, Sarah. This win could definitely impact the rankings. But I was just about to mention the excitement in the Canada-Argentina match, which ended in a tie, 3 to 3. And in a game that's still in progress", + "original_text": "Absolutely, Sarah. This win could definitely impact the rankings. But I was just about to mention the excitement in the Canada-Argentina match, which ended in a tie, 3 to 3. And in a game that's still in progress [interrupt] we might see another upset as Haiti has been showing remarkable defensive skills against Italy's aggressive offense, making this one of the most unpredictable matches of the tournament so far.", + "start_time": 28.728703187085436, + "end_time": 50.24199116894485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/temp/line_3_B.wav", + "silence_duration": 0.3204114285284999, + "is_interrupted": true, + "text_after_interrupt": "we might see another upset as Haiti has been showing remarkable defensive skills against Italy's aggressive offense, making this one of the most unpredictable matches of the tournament so far." + }, + { + "speaker": "A", + "text": "Oh, right! You were saying something about another ongoing match—what's the latest on that?", + "original_text": "Oh, right! You were saying something about another ongoing match—what's the latest on that?", + "start_time": 49.92438838187882, + "end_time": 55.3346378149854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/temp/line_4_A.wav", + "silence_duration": 0.5080782092019016, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, Italy is leading Haiti 2 to 1, with 30 minutes left to go. It's shaping up to be another thrilling finish!", + "original_text": "Yes, Italy is leading Haiti 2 to 1, with 30 minutes left to go. It's shaping up to be another thrilling finish!", + "start_time": 55.81711101145916, + "end_time": 62.225818494452355, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--147/temp/line_5_B.wav", + "silence_duration": 0.48247319647375986, + "is_interrupted": false + } + ] + }, + "DialogSum--val--150": { + "original_text": "A: Good afternoon, sir. \nB: Good afternoon. We want a table for 4. \nA: This way, please. It's near the window, so you'll have a good view of the garden and the fountain outside while you enjoy your meal. Sit down, please. \nB: Thank you. Do you serve good Chinese [interrupt] cuisine with authentic flavors and a wide variety of regional specialties that would satisfy our diverse tastes? \nA: Yes, sir. We serve Chinese food of various styles, such as Hunan food, Sichuan food and Zhejiang food. The first two are a bit hot. Do you want to [interrupt] start with some appetizers while you browse through our extensive menu that features both traditional and modern interpretations of these regional cuisines? \nB: Actually, before we decide, could you tell me more about the Zhejiang food? Is it sweet enough for our taste? \nA: Certainly! Zhejiang food is known for its fresh and delicate flavors, often leaning towards a slightly sweet taste with subtle vinegary notes that create a perfect balance in every dish. Would you like to try some signature dishes from that style? \nB: Yes, that sounds perfect. We like food that tastes a bit sweet.", + "cleaned_text": "A: Good afternoon, sir. \nB: Good afternoon. We want a table for 4. \nA: This way, please. It's near the window, so you'll have a good view of the garden and the fountain outside while you enjoy your meal. Sit down, please. \nB:Thank you. Do you serve good Chinese cuisine with authentic flavors and a wide variety of regional specialties that would satisfy our diverse tastes?\nA:Yes, sir. We serve Chinese food of various styles, such as Hunan food, Sichuan food and Zhejiang food. The first two are a bit hot. Do you want to start with some appetizers while you browse through our extensive menu that features both traditional and modern interpretations of these regional cuisines?\nB: Actually, before we decide, could you tell me more about the Zhejiang food? Is it sweet enough for our taste? \nA: Certainly! Zhejiang food is known for its fresh and delicate flavors, often leaning towards a slightly sweet taste with subtle vinegary notes that create a perfect balance in every dish. Would you like to try some signature dishes from that style? \nB: Yes, that sounds perfect. We like food that tastes a bit sweet.", + "total_duration": 58.20467120181406, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good afternoon, sir.", + "original_text": "Good afternoon, sir.", + "start_time": 0, + "end_time": 1.253877551020408, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good afternoon. We want a table for 4.", + "original_text": "Good afternoon. We want a table for 4.", + "start_time": 1.8083858699007098, + "end_time": 4.141991312077581, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_1_B.wav", + "silence_duration": 0.5545083188803017, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "This way, please. It's near the window, so you'll have a good view of the garden and the fountain outside while you enjoy your meal. Sit down, please.", + "original_text": "This way, please. It's near the window, so you'll have a good view of the garden and the fountain outside while you enjoy your meal. Sit down, please.", + "start_time": 4.580875179252634, + "end_time": 13.47411780963812, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_2_A.wav", + "silence_duration": 0.43888386717505357, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you. Do you serve good Chinese", + "original_text": "Thank you. Do you serve good Chinese [interrupt] cuisine with authentic flavors and a wide variety of regional specialties that would satisfy our diverse tastes?", + "start_time": 14.009044669017781, + "end_time": 21.021470972872656, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_3_B.wav", + "silence_duration": 0.534926859379661, + "is_interrupted": true, + "text_after_interrupt": "cuisine with authentic flavors and a wide variety of regional specialties that would satisfy our diverse tastes?" + }, + { + "speaker": "A", + "text": "Yes, sir. We serve Chinese food of various styles, such as Hunan food, Sichuan food and Zhejiang food. The first two are a bit hot. Do you want to", + "original_text": "Yes, sir. We serve Chinese food of various styles, such as Hunan food, Sichuan food and Zhejiang food. The first two are a bit hot. Do you want to [interrupt] start with some appetizers while you browse through our extensive menu that features both traditional and modern interpretations of these regional cuisines?", + "start_time": 15.785371199630026, + "end_time": 33.73439614294068, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_4_A.wav", + "silence_duration": 0.333962512564991, + "is_interrupted": true, + "text_after_interrupt": "start with some appetizers while you browse through our extensive menu that features both traditional and modern interpretations of these regional cuisines?" + }, + { + "speaker": "B", + "text": "Actually, before we decide, could you tell me more about the Zhejiang food? Is it sweet enough for our taste?", + "original_text": "Actually, before we decide, could you tell me more about the Zhejiang food? Is it sweet enough for our taste?", + "start_time": 32.744821240539686, + "end_time": 38.87488926775057, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_5_B.wav", + "silence_duration": 0.30564477370757115, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Certainly! Zhejiang food is known for its fresh and delicate flavors, often leaning towards a slightly sweet taste with subtle vinegary notes that create a perfect balance in every dish. Would you like to try some signature dishes from that style?", + "original_text": "Certainly! Zhejiang food is known for its fresh and delicate flavors, often leaning towards a slightly sweet taste with subtle vinegary notes that create a perfect balance in every dish. Would you like to try some signature dishes from that style?", + "start_time": 39.32401177546145, + "end_time": 54.1963927278424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_6_A.wav", + "silence_duration": 0.44912250771088036, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that sounds perfect. We like food that tastes a bit sweet.", + "original_text": "Yes, that sounds perfect. We like food that tastes a bit sweet.", + "start_time": 54.76811812030833, + "end_time": 58.20467140829019, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--150/temp/line_7_B.wav", + "silence_duration": 0.5717253924659272, + "is_interrupted": false + } + ] + }, + "DialogSum--val--151": { + "original_text": "A: May I come in, Mr. Sun? \nB: I'd rather you didn't, Miss Yang. I'm very busy now. \nA: Can I try later then? \nB: Yes, of course. \nA: Is it all right for me to come in now, Mr. Sun? \nB: Well, uh... I'm still pretty busy, but... all right. Come in. What can I do for you? \nA: Do you mind if I sit down? \nB: Not at all. Take a seat. Now what can I do for you? \nA: I want to leave the department. Do you think I could put in for a transfer? \nB: Yes. But why should you want to [interrupt] leave when you've been doing so well here and have shown such great potential for advancement within this department? \nA: Sorry to interrupt, Mr. Sun, but I just want to clarify—would this transfer have any impact on my current projects? \nB: Your current projects? Well, it might, but I was actually asking about your reasons for wanting the transfer. \nA: Right, about that—do you mind if I speak frankly? \nB: Not at all. Go ahead.", + "cleaned_text": "A: May I come in, Mr. Sun? \nB: I'd rather you didn't, Miss Yang. I'm very busy now. \nA: Can I try later then? \nB: Yes, of course. \nA: Is it all right for me to come in now, Mr. Sun? \nB: Well, uh... I'm still pretty busy, but... all right. Come in. What can I do for you? \nA: Do you mind if I sit down? \nB: Not at all. Take a seat. Now what can I do for you? \nA: I want to leave the department. Do you think I could put in for a transfer? \nB:Yes. But why should you want to leave when you've been doing so well here and have shown such great potential for advancement within this department?\nA: Sorry to interrupt, Mr. Sun, but I just want to clarify—would this transfer have any impact on my current projects? \nB: Your current projects? Well, it might, but I was actually asking about your reasons for wanting the transfer. \nA: Right, about that—do you mind if I speak frankly? \nB: Not at all. Go ahead.", + "total_duration": 47.22240362811792, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I come in, Mr. Sun?", + "original_text": "May I come in, Mr. Sun?", + "start_time": 0, + "end_time": 1.6370068027210884, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd rather you didn't, Miss Yang. I'm very busy now.", + "original_text": "I'd rather you didn't, Miss Yang. I'm very busy now.", + "start_time": 2.111735239351503, + "end_time": 4.631100318716582, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_1_B.wav", + "silence_duration": 0.47472843663041453, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can I try later then?", + "original_text": "Can I try later then?", + "start_time": 4.971171204692334, + "end_time": 6.3063185969825835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_2_A.wav", + "silence_duration": 0.34007088597575214, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, of course.", + "original_text": "Yes, of course.", + "start_time": 6.709311780015164, + "end_time": 7.684549875253259, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_3_B.wav", + "silence_duration": 0.4029931830325802, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is it all right for me to come in now, Mr. Sun?", + "original_text": "Is it all right for me to come in now, Mr. Sun?", + "start_time": 8.277662566288276, + "end_time": 11.110497033408457, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_4_A.wav", + "silence_duration": 0.5931126910350176, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, uh... I'm still pretty busy, but... all right. Come in. What can I do for you?", + "original_text": "Well, uh... I'm still pretty busy, but... all right. Come in. What can I do for you?", + "start_time": 11.693282654763742, + "end_time": 16.244393765874854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_5_B.wav", + "silence_duration": 0.5827856213552856, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you mind if I sit down?", + "original_text": "Do you mind if I sit down?", + "start_time": 16.57258758277393, + "end_time": 18.070274657603864, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_6_A.wav", + "silence_duration": 0.32819381689907856, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not at all. Take a seat. Now what can I do for you?", + "original_text": "Not at all. Take a seat. Now what can I do for you?", + "start_time": 18.416982908980156, + "end_time": 21.72582644639512, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_7_B.wav", + "silence_duration": 0.346708251376292, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I want to leave the department. Do you think I could put in for a transfer?", + "original_text": "I want to leave the department. Do you think I could put in for a transfer?", + "start_time": 22.242487974765815, + "end_time": 26.712329244607083, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_8_A.wav", + "silence_duration": 0.516661528370695, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. But why should you want to", + "original_text": "Yes. But why should you want to [interrupt] leave when you've been doing so well here and have shown such great potential for advancement within this department?", + "start_time": 27.048034431770592, + "end_time": 33.816651211815945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_9_B.wav", + "silence_duration": 0.335705187163508, + "is_interrupted": true, + "text_after_interrupt": "leave when you've been doing so well here and have shown such great potential for advancement within this department?" + }, + { + "speaker": "A", + "text": "Sorry to interrupt, Mr. Sun, but I just want to clarify—would this transfer have any impact on my current projects?", + "original_text": "Sorry to interrupt, Mr. Sun, but I just want to clarify—would this transfer have any impact on my current projects?", + "start_time": 29.323589987326148, + "end_time": 36.52177592836923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_10_A.wav", + "silence_duration": 0.41474789730857897, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Your current projects? Well, it might, but I was actually asking about your reasons for wanting the transfer.", + "original_text": "Your current projects? Well, it might, but I was actually asking about your reasons for wanting the transfer.", + "start_time": 36.83677902770809, + "end_time": 42.51405793927272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_11_B.wav", + "silence_duration": 0.3150030993388616, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Right, about that—do you mind if I speak frankly?", + "original_text": "Right, about that—do you mind if I speak frankly?", + "start_time": 42.8430372311841, + "end_time": 45.559771925061646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_12_A.wav", + "silence_duration": 0.32897929191137826, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not at all. Go ahead.", + "original_text": "Not at all. Go ahead.", + "start_time": 45.991773418464746, + "end_time": 47.22243101483663, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--151/temp/line_13_B.wav", + "silence_duration": 0.43200149340309923, + "is_interrupted": false + } + ] + }, + "DialogSum--val--153": { + "original_text": "A: Hello, Sir. So, you are back? \nB: Yes, hello again. I would like to know the exact difference between Dividend Deposit and Dividend Participated Deposit. \nA: That's pretty easy to explain. With the Deposit, the interest is fixed, but the Dividend of each policy will be transferred automatically into your bank account by the end of each year. The longer the term, the higher the Dividend you [interrupt] can expect to accumulate over time, which can significantly impact your overall returns and provide a steady stream of passive income for your financial planning needs.\nB: Sorry to cut in, but when you say \"the longer the term,\" do you mean there's a significant difference in the Dividend if I opt for, say, a 10-year term versus a 5-year term? \nA: Yes, exactly. The compound interest effect becomes more pronounced over longer terms. But I was also going to mention that the Dividend is calculated at the Compound Interest Rate which means your returns will grow faster as time goes on.\nB: Got it. And I can purchase that here? \nA: Yes, you can purchase it here directly.", + "cleaned_text": "A: Hello, Sir. So, you are back? \nB: Yes, hello again. I would like to know the exact difference between Dividend Deposit and Dividend Participated Deposit. \nA:That's pretty easy to explain. With the Deposit, the interest is fixed, but the Dividend of each policy will be transferred automatically into your bank account by the end of each year. The longer the term, the higher the Dividend you can expect to accumulate over time, which can significantly impact your overall returns and provide a steady stream of passive income for your financial planning needs.\nB: Sorry to cut in, but when you say \"the longer the term,\" do you mean there's a significant difference in the Dividend if I opt for, say, a 10-year term versus a 5-year term? \nA: Yes, exactly. The compound interest effect becomes more pronounced over longer terms. But I was also going to mention that the Dividend is calculated at the Compound Interest Rate which means your returns will grow faster as time goes on.\nB: Got it. And I can purchase that here? \nA: Yes, you can purchase it here directly.", + "total_duration": 55.126938775510204, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, Sir. So, you are back?", + "original_text": "Hello, Sir. So, you are back?", + "start_time": 0, + "end_time": 2.0317460317460316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, hello again. I would like to know the exact difference between Dividend Deposit and Dividend Participated Deposit.", + "original_text": "Yes, hello again. I would like to know the exact difference between Dividend Deposit and Dividend Participated Deposit.", + "start_time": 2.425744190497618, + "end_time": 9.298850766461337, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/temp/line_1_B.wav", + "silence_duration": 0.3939981587515864, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's pretty easy to explain. With the Deposit, the interest is fixed, but the Dividend of each policy will be transferred automatically into your bank account by the end of each year. The longer the term, the higher the Dividend you", + "original_text": "That's pretty easy to explain. With the Deposit, the interest is fixed, but the Dividend of each policy will be transferred automatically into your bank account by the end of each year. The longer the term, the higher the Dividend you [interrupt] can expect to accumulate over time, which can significantly impact your overall returns and provide a steady stream of passive income for your financial planning needs.", + "start_time": 9.801468858805261, + "end_time": 33.95022169327238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/temp/line_2_A.wav", + "silence_duration": 0.5026180923439244, + "is_interrupted": true, + "text_after_interrupt": "can expect to accumulate over time, which can significantly impact your overall returns and provide a steady stream of passive income for your financial planning needs." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but when you say \"the longer the term,\" do you mean there's a significant difference in the Dividend if I opt for, say, a 10-year term versus a 5-year term?", + "original_text": "Sorry to cut in, but when you say \"the longer the term,\" do you mean there's a significant difference in the Dividend if I opt for, say, a 10-year term versus a 5-year term?", + "start_time": 24.232670672864216, + "end_time": 35.111219425698685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/temp/line_3_B.wav", + "silence_duration": 0.40742076177013303, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, exactly. The compound interest effect becomes more pronounced over longer terms. But I was also going to mention that the Dividend is calculated at the Compound Interest Rate which means your returns will grow faster as time goes on.", + "original_text": "Yes, exactly. The compound interest effect becomes more pronounced over longer terms. But I was also going to mention that the Dividend is calculated at the Compound Interest Rate which means your returns will grow faster as time goes on.", + "start_time": 35.70982435853599, + "end_time": 50.14102617259495, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/temp/line_4_A.wav", + "silence_duration": 0.5986049328373055, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. And I can purchase that here?", + "original_text": "Got it. And I can purchase that here?", + "start_time": 50.614535281387184, + "end_time": 52.425691743972216, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/temp/line_5_B.wav", + "silence_duration": 0.4735091087922355, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, you can purchase it here directly.", + "original_text": "Yes, you can purchase it here directly.", + "start_time": 52.8978542670376, + "end_time": 55.12696991329611, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--153/temp/line_6_A.wav", + "silence_duration": 0.4721625230653847, + "is_interrupted": false + } + ] + }, + "DialogSum--val--154": { + "original_text": "A: I think I may rent this apartment from you. \nB: That's great to hear. How much are you looking to offer for the rent? \nA: Sorry to cut in, but before we talk about the price, can you tell me if the utilities are included in the rent? \nB: No, utilities are separate. For each month you would have to pay $1050. \nA: That is too expensive. \nB: I don't think that is too much for [interrupt] an apartment in this location with all the amenities provided, including high-speed internet, a fully equipped gym, and 24/7 security services that ensure your safety at all times. \nA: I understand your point, but I was hoping we could negotiate a bit. How does $850 a month sound to you? \nB: That's not enough. \nA: Would you please reconsider? \nB: That's my final offer. Take it or leave it.", + "cleaned_text": "A: I think I may rent this apartment from you. \nB: That's great to hear. How much are you looking to offer for the rent? \nA: Sorry to cut in, but before we talk about the price, can you tell me if the utilities are included in the rent? \nB: No, utilities are separate. For each month you would have to pay $1050. \nA: That is too expensive. \nB:I don't think that is too much for an apartment in this location with all the amenities provided, including high-speed internet, a fully equipped gym, and 24/7 security services that ensure your safety at all times.\nA: I understand your point, but I was hoping we could negotiate a bit. How does $850 a month sound to you? \nB: That's not enough. \nA: Would you please reconsider? \nB: That's my final offer. Take it or leave it.", + "total_duration": 37.7928798185941, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I think I may rent this apartment from you.", + "original_text": "I think I may rent this apartment from you.", + "start_time": 0, + "end_time": 2.4380952380952383, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's great to hear. How much are you looking to offer for the rent?", + "original_text": "That's great to hear. How much are you looking to offer for the rent?", + "start_time": 2.761370931246943, + "end_time": 6.012164582040594, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_1_B.wav", + "silence_duration": 0.3232756931517045, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry to cut in, but before we talk about the price, can you tell me if the utilities are included in the rent?", + "original_text": "Sorry to cut in, but before we talk about the price, can you tell me if the utilities are included in the rent?", + "start_time": 6.377499543476445, + "end_time": 13.297046028737217, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_2_A.wav", + "silence_duration": 0.3653349614358518, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, utilities are separate. For each month you would have to pay $1050.", + "original_text": "No, utilities are separate. For each month you would have to pay $1050.", + "start_time": 13.72299775584796, + "end_time": 18.018689365825285, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_3_B.wav", + "silence_duration": 0.42595172711074203, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That is too expensive.", + "original_text": "That is too expensive.", + "start_time": 18.596661254630323, + "end_time": 19.989858533541888, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_4_A.wav", + "silence_duration": 0.5779718888050394, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't think that is too much for", + "original_text": "I don't think that is too much for [interrupt] an apartment in this location with all the amenities provided, including high-speed internet, a fully equipped gym, and 24/7 security services that ensure your safety at all times.", + "start_time": 20.34397045654206, + "end_time": 32.05843757672346, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_5_B.wav", + "silence_duration": 0.3541119230001733, + "is_interrupted": true, + "text_after_interrupt": "an apartment in this location with all the amenities provided, including high-speed internet, a fully equipped gym, and 24/7 security services that ensure your safety at all times." + }, + { + "speaker": "A", + "text": "I understand your point, but I was hoping we could negotiate a bit. How does $850 a month sound to you?", + "original_text": "I understand your point, but I was hoping we could negotiate a bit. How does $850 a month sound to you?", + "start_time": 21.87648746334478, + "end_time": 29.434582701440018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_6_A.wav", + "silence_duration": 0.39869460535117085, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's not enough.", + "original_text": "That's not enough.", + "start_time": 32.465017729040255, + "end_time": 33.44025582427835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_7_B.wav", + "silence_duration": 0.4065801523167922, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Would you please reconsider?", + "original_text": "Would you please reconsider?", + "start_time": 33.747295999283715, + "end_time": 35.22176311946512, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_8_A.wav", + "silence_duration": 0.30704017500535863, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's my final offer. Take it or leave it.", + "original_text": "That's my final offer. Take it or leave it.", + "start_time": 35.76116139145378, + "end_time": 37.792907423199814, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--154/temp/line_9_B.wav", + "silence_duration": 0.5393982719886582, + "is_interrupted": false + } + ] + }, + "DialogSum--val--155": { + "original_text": "A: So the company decided to cancel your trip to Hong Kong? \nB: Yes, The SARS epidemic is not under effective control yet. So I'd better not [interrupt] go, even though I was really looking forward to the trip and had already made some exciting plans to visit local markets and try authentic Cantonese cuisine. \nA: Sorry to hear that, but do you think this might affect any of your upcoming projects? \nB: It could, but I think we can manage remotely. However, I was about to say that I shouldn't risk it. Maybe it's a good thing. If you don't have to go to Hong Kong, you can take a break and take things easy for a while. \nA: You are right. Maybe we should work out a fitness plan and start to do more exercise. Sitting around in the office all day is no way of keeping fit.", + "cleaned_text": "A: So the company decided to cancel your trip to Hong Kong? \nB:Yes, The SARS epidemic is not under effective control yet. So I'd better not go, even though I was really looking forward to the trip and had already made some exciting plans to visit local markets and try authentic Cantonese cuisine.\nA: Sorry to hear that, but do you think this might affect any of your upcoming projects? \nB: It could, but I think we can manage remotely. However, I was about to say that I shouldn't risk it. Maybe it's a good thing. If you don't have to go to Hong Kong, you can take a break and take things easy for a while. \nA: You are right. Maybe we should work out a fitness plan and start to do more exercise. Sitting around in the office all day is no way of keeping fit.", + "total_duration": 37.39424036281179, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So the company decided to cancel your trip to Hong Kong?", + "original_text": "So the company decided to cancel your trip to Hong Kong?", + "start_time": 0, + "end_time": 3.1927437641723357, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, The SARS epidemic is not under effective control yet. So I'd better not", + "original_text": "Yes, The SARS epidemic is not under effective control yet. So I'd better not [interrupt] go, even though I was really looking forward to the trip and had already made some exciting plans to visit local markets and try authentic Cantonese cuisine.", + "start_time": 3.501970712561393, + "end_time": 15.611177061767743, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/temp/line_1_B.wav", + "silence_duration": 0.3092269483890571, + "is_interrupted": true, + "text_after_interrupt": "go, even though I was really looking forward to the trip and had already made some exciting plans to visit local markets and try authentic Cantonese cuisine." + }, + { + "speaker": "A", + "text": "Sorry to hear that, but do you think this might affect any of your upcoming projects?", + "original_text": "Sorry to hear that, but do you think this might affect any of your upcoming projects?", + "start_time": 8.215621506212187, + "end_time": 13.486551211427606, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/temp/line_2_A.wav", + "silence_duration": 0.3881130586676246, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It could, but I think we can manage remotely. However, I was about to say that I shouldn't risk it. Maybe it's a good thing. If you don't have to go to Hong Kong, you can take a break and take things easy for a while.", + "original_text": "It could, but I think we can manage remotely. However, I was about to say that I shouldn't risk it. Maybe it's a good thing. If you don't have to go to Hong Kong, you can take a break and take things easy for a while.", + "start_time": 16.09022445818726, + "end_time": 27.36351244004667, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/temp/line_3_B.wav", + "silence_duration": 0.47904739641952043, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You are right. Maybe we should work out a fitness plan and start to do more exercise. Sitting around in the office all day is no way of keeping fit.", + "original_text": "You are right. Maybe we should work out a fitness plan and start to do more exercise. Sitting around in the office all day is no way of keeping fit.", + "start_time": 27.757965380908427, + "end_time": 37.39424656004675, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--155/temp/line_4_A.wav", + "silence_duration": 0.3944529408617588, + "is_interrupted": false + } + ] + }, + "DialogSum--val--156": { + "original_text": "A: I want to get on the bus already. \nB: It just isn't on time today. \nA: It was supposed to be here thirty minutes [interrupt] ago according to the schedule, and I'm starting to get really frustrated because this happens way too often with this particular route. \nB: Thirty minutes? That's way too long. Do you think there's a chance it got delayed by traffic or something? \nA: Possibly, but I think it'll be here pretty soon. I need to get to work, so it better. \nB: Yeah, I really do hate public transportation. \nA: I agree, it's just never on time. And I was saying earlier, it was supposed to be here thirty minutes ago. \nB: That's right. I also hate having to stand at a bus stop in all kinds of [interrupt] weather conditions for extended periods, especially when it's really bad like during heavy snowstorms or torrential downpours. \nA: Weather, exactly! Especially when it's raining or freezing cold. We need to get a car. \nB: I completely agree with that.", + "cleaned_text": "A: I want to get on the bus already. \nB: It just isn't on time today. \nA:It was supposed to be here thirty minutes ago according to the schedule, and I'm starting to get really frustrated because this happens way too often with this particular route.\nB: Thirty minutes? That's way too long. Do you think there's a chance it got delayed by traffic or something? \nA: Possibly, but I think it'll be here pretty soon. I need to get to work, so it better. \nB: Yeah, I really do hate public transportation. \nA: I agree, it's just never on time. And I was saying earlier, it was supposed to be here thirty minutes ago. \nB:That's right. I also hate having to stand at a bus stop in all kinds of weather conditions for extended periods, especially when it's really bad like during heavy snowstorms or torrential downpours.\nA: Weather, exactly! Especially when it's raining or freezing cold. We need to get a car. \nB: I completely agree with that.", + "total_duration": 49.3827664399093, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I want to get on the bus already.", + "original_text": "I want to get on the bus already.", + "start_time": 0, + "end_time": 2.2175056689342405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It just isn't on time today.", + "original_text": "It just isn't on time today.", + "start_time": 2.625199664618265, + "end_time": 4.436356127203299, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_1_B.wav", + "silence_duration": 0.40769399568402476, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It was supposed to be here thirty minutes", + "original_text": "It was supposed to be here thirty minutes [interrupt] ago according to the schedule, and I'm starting to get really frustrated because this happens way too often with this particular route.", + "start_time": 4.756323756345823, + "end_time": 14.973103801697297, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_2_A.wav", + "silence_duration": 0.3199676291425236, + "is_interrupted": true, + "text_after_interrupt": "ago according to the schedule, and I'm starting to get really frustrated because this happens way too often with this particular route." + }, + { + "speaker": "B", + "text": "Thirty minutes? That's way too long. Do you think there's a chance it got delayed by traffic or something?", + "original_text": "Thirty minutes? That's way too long. Do you think there's a chance it got delayed by traffic or something?", + "start_time": 7.031879311901379, + "end_time": 12.442128745007956, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_3_B.wav", + "silence_duration": 0.4323177008384066, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Possibly, but I think it'll be here pretty soon. I need to get to work, so it better.", + "original_text": "Possibly, but I think it'll be here pretty soon. I need to get to work, so it better.", + "start_time": 15.437593496846207, + "end_time": 20.83623295262852, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_4_A.wav", + "silence_duration": 0.46448969514891025, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I really do hate public transportation.", + "original_text": "Yeah, I really do hate public transportation.", + "start_time": 21.39365177968571, + "end_time": 24.28453613342721, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_5_B.wav", + "silence_duration": 0.5574188270571918, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I agree, it's just never on time. And I was saying earlier, it was supposed to be here thirty minutes ago.", + "original_text": "I agree, it's just never on time. And I was saying earlier, it was supposed to be here thirty minutes ago.", + "start_time": 24.84188358681763, + "end_time": 31.40152077502625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_6_A.wav", + "silence_duration": 0.5573474533904208, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's right. I also hate having to stand at a bus stop in all kinds of", + "original_text": "That's right. I also hate having to stand at a bus stop in all kinds of [interrupt] weather conditions for extended periods, especially when it's really bad like during heavy snowstorms or torrential downpours.", + "start_time": 31.800080832653965, + "end_time": 41.9355910367356, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_7_B.wav", + "silence_duration": 0.398560057627714, + "is_interrupted": true, + "text_after_interrupt": "weather conditions for extended periods, especially when it's really bad like during heavy snowstorms or torrential downpours." + }, + { + "speaker": "A", + "text": "Weather, exactly! Especially when it's raining or freezing cold. We need to get a car.", + "original_text": "Weather, exactly! Especially when it's raining or freezing cold. We need to get a car.", + "start_time": 41.89632485809977, + "end_time": 47.515553883043076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_8_A.wav", + "silence_duration": 0.31544970059774496, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I completely agree with that.", + "original_text": "I completely agree with that.", + "start_time": 47.850294119768236, + "end_time": 49.38281112657096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--156/temp/line_9_B.wav", + "silence_duration": 0.334740236725163, + "is_interrupted": false + } + ] + }, + "DialogSum--val--157": { + "original_text": "A: You have been here for how long? Four months now? \nB: Yeah, about. \nA: Do you know Chinese better now? \nB: Oh, definitely. I remember, when I first arrived in Guangzhou, my girlfriend was haggling with a sales clerk over the price of a mobile [interrupt] phone case, and I was completely lost in the conversation because they were using so many local slang terms and bargaining tactics that I'd never heard before. \nA: Oh, yeah. Many Chinese like to bargain. It happens almost everywhere. \nB: Right, but what surprised me was the speed of the conversation—it kept getting faster, and I honestly thought they were about to start fighting. It sounded like a shouting match to me, even though it was just a normal negotiation process, but I couldn't understand a word back then. \nA: A shouting match? You're so funny. You must be exaggerating. I don't believe it. \nB: I swear, that's how it felt at the time! But, oh, I didn't finish earlier—my girlfriend was haggling over a mobile phone, and the whole thing just escalated so quickly. \nA: Yes, perhaps. Chinese usually don't notice that sort of thing. Maybe it's quite natural to us. \nB: Yes, absolutely true.", + "cleaned_text": "A: You have been here for how long? Four months now? \nB: Yeah, about. \nA: Do you know Chinese better now? \nB:Oh, definitely. I remember, when I first arrived in Guangzhou, my girlfriend was haggling with a sales clerk over the price of a mobile phone case, and I was completely lost in the conversation because they were using so many local slang terms and bargaining tactics that I'd never heard before.\nA: Oh, yeah. Many Chinese like to bargain. It happens almost everywhere. \nB: Right, but what surprised me was the speed of the conversation—it kept getting faster, and I honestly thought they were about to start fighting. It sounded like a shouting match to me, even though it was just a normal negotiation process, but I couldn't understand a word back then. \nA: A shouting match? You're so funny. You must be exaggerating. I don't believe it. \nB: I swear, that's how it felt at the time! But, oh, I didn't finish earlier—my girlfriend was haggling over a mobile phone, and the whole thing just escalated so quickly. \nA: Yes, perhaps. Chinese usually don't notice that sort of thing. Maybe it's quite natural to us. \nB: Yes, absolutely true.", + "total_duration": 59.61573696145125, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You have been here for how long? Four months now?", + "original_text": "You have been here for how long? Four months now?", + "start_time": 0, + "end_time": 3.076643990929705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, about.", + "original_text": "Yeah, about.", + "start_time": 3.4474247407382297, + "end_time": 4.306563062733694, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_1_B.wav", + "silence_duration": 0.3707807498085244, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you know Chinese better now?", + "original_text": "Do you know Chinese better now?", + "start_time": 4.849960095101958, + "end_time": 6.568236739092887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_2_A.wav", + "silence_duration": 0.5433970323682638, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, definitely. I remember, when I first arrived in Guangzhou, my girlfriend was haggling with a sales clerk over the price of a mobile", + "original_text": "Oh, definitely. I remember, when I first arrived in Guangzhou, my girlfriend was haggling with a sales clerk over the price of a mobile [interrupt] phone case, and I was completely lost in the conversation because they were using so many local slang terms and bargaining tactics that I'd never heard before.", + "start_time": 6.9983894843693575, + "end_time": 22.56736907620609, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_3_B.wav", + "silence_duration": 0.43015274527647046, + "is_interrupted": true, + "text_after_interrupt": "phone case, and I was completely lost in the conversation because they were using so many local slang terms and bargaining tactics that I'd never heard before." + }, + { + "speaker": "A", + "text": "Oh, yeah. Many Chinese like to bargain. It happens almost everywhere.", + "original_text": "Oh, yeah. Many Chinese like to bargain. It happens almost everywhere.", + "start_time": 14.707414427680014, + "end_time": 19.11920581089997, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_4_A.wav", + "silence_duration": 0.5889818686877968, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right, but what surprised me was the speed of the conversation—it kept getting faster, and I honestly thought they were about to start fighting. It sounded like a shouting match to me, even though it was just a normal negotiation process, but I couldn't understand a word back then.", + "original_text": "Right, but what surprised me was the speed of the conversation—it kept getting faster, and I honestly thought they were about to start fighting. It sounded like a shouting match to me, even though it was just a normal negotiation process, but I couldn't understand a word back then.", + "start_time": 22.969417857465608, + "end_time": 36.7620709186901, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_5_B.wav", + "silence_duration": 0.4020487812595167, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "A shouting match? You're so funny. You must be exaggerating. I don't believe it.", + "original_text": "A shouting match? You're so funny. You must be exaggerating. I don't believe it.", + "start_time": 37.24078445565311, + "end_time": 42.07053502254654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_6_A.wav", + "silence_duration": 0.4787135369630161, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I swear, that's how it felt at the time! But, oh, I didn't finish earlier—my girlfriend was haggling over a mobile phone, and the whole thing just escalated so quickly.", + "original_text": "I swear, that's how it felt at the time! But, oh, I didn't finish earlier—my girlfriend was haggling over a mobile phone, and the whole thing just escalated so quickly.", + "start_time": 42.649449003242786, + "end_time": 51.3453220191158, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_7_B.wav", + "silence_duration": 0.5789139806962496, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, perhaps. Chinese usually don't notice that sort of thing. Maybe it's quite natural to us.", + "original_text": "Yes, perhaps. Chinese usually don't notice that sort of thing. Maybe it's quite natural to us.", + "start_time": 51.77890278957931, + "end_time": 57.71160120227773, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_8_A.wav", + "silence_duration": 0.4335807704635164, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, absolutely true.", + "original_text": "Yes, absolutely true.", + "start_time": 58.11807670505384, + "end_time": 59.61576377988377, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--157/temp/line_9_B.wav", + "silence_duration": 0.40647550277610733, + "is_interrupted": false + } + ] + }, + "DialogSum--val--158": { + "original_text": "A: Hmm, what should I wear today? \nB: Come on, you think about what to wear almost every day. There are thousands of clothes in your wardrobe. \nA: Well, haven't you ever heard people say that there is always one piece of clothes missing from a woman's wardrobe? \nB: I have and I can prove that is 100% true for you. \nA: Loving to look beautiful is women's nature. In fact, I am thinking about going to my favorite clothing shop today because they just got [interrupt] a new collection of summer dresses that would perfectly complement the shoes I need to exchange. \nB: No kidding! Again?! You just went shopping yesterday. You really are a dedicated fashion enthusiast, always on the lookout for the latest trends. \nA: Oh, it's not just about shopping. I need to change the shoes I bought from Nasi. They are too small. I want to ask them whether they come in a larger size. \nB: OK. Do you have the receipt with you? I think they will ask you to show them the receipt first. \nA: Oh, I forgot to mention—before you interrupted—what were you saying about me being a shopaholic? \nB: I was just saying you really have a knack for shopping, but I guess it's justified if you need to exchange something.", + "cleaned_text": "A: Hmm, what should I wear today? \nB: Come on, you think about what to wear almost every day. There are thousands of clothes in your wardrobe. \nA: Well, haven't you ever heard people say that there is always one piece of clothes missing from a woman's wardrobe? \nB: I have and I can prove that is 100% true for you. \nA:Loving to look beautiful is women's nature. In fact, I am thinking about going to my favorite clothing shop today because they just got a new collection of summer dresses that would perfectly complement the shoes I need to exchange.\nB: No kidding! Again?! You just went shopping yesterday. You really are a dedicated fashion enthusiast, always on the lookout for the latest trends. \nA: Oh, it's not just about shopping. I need to change the shoes I bought from Nasi. They are too small. I want to ask them whether they come in a larger size. \nB: OK. Do you have the receipt with you? I think they will ask you to show them the receipt first. \nA: Oh, I forgot to mention—before you interrupted—what were you saying about me being a shopaholic? \nB: I was just saying you really have a knack for shopping, but I guess it's justified if you need to exchange something.", + "total_duration": 62.514648526077096, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hmm, what should I wear today?", + "original_text": "Hmm, what should I wear today?", + "start_time": 0, + "end_time": 1.7182766439909296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Come on, you think about what to wear almost every day. There are thousands of clothes in your wardrobe.", + "original_text": "Come on, you think about what to wear almost every day. There are thousands of clothes in your wardrobe.", + "start_time": 2.1469786771200847, + "end_time": 7.406298405011242, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_1_B.wav", + "silence_duration": 0.4287020331291552, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, haven't you ever heard people say that there is always one piece of clothes missing from a woman's wardrobe?", + "original_text": "Well, haven't you ever heard people say that there is always one piece of clothes missing from a woman's wardrobe?", + "start_time": 7.879504640559794, + "end_time": 14.39270191947136, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_2_A.wav", + "silence_duration": 0.47320623554855257, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have and I can prove that is 100% true for you.", + "original_text": "I have and I can prove that is 100% true for you.", + "start_time": 14.984654095361478, + "end_time": 18.038078131642656, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_3_B.wav", + "silence_duration": 0.5919521758901183, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Loving to look beautiful is women's nature. In fact, I am thinking about going to my favorite clothing shop today because they just got", + "original_text": "Loving to look beautiful is women's nature. In fact, I am thinking about going to my favorite clothing shop today because they just got [interrupt] a new collection of summer dresses that would perfectly complement the shoes I need to exchange.", + "start_time": 18.47377454794612, + "end_time": 32.06905799465814, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_4_A.wav", + "silence_duration": 0.435696416303464, + "is_interrupted": true, + "text_after_interrupt": "a new collection of summer dresses that would perfectly complement the shoes I need to exchange." + }, + { + "speaker": "B", + "text": "No kidding! Again?! You just went shopping yesterday. You really are a dedicated fashion enthusiast, always on the lookout for the latest trends.", + "original_text": "No kidding! Again?! You just went shopping yesterday. You really are a dedicated fashion enthusiast, always on the lookout for the latest trends.", + "start_time": 27.227697450440452, + "end_time": 35.08765209896653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_5_B.wav", + "silence_duration": 0.38291126120548075, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, it's not just about shopping. I need to change the shoes I bought from Nasi. They are too small. I want to ask them whether they come in a larger size.", + "original_text": "Oh, it's not just about shopping. I need to change the shoes I bought from Nasi. They are too small. I want to ask them whether they come in a larger size.", + "start_time": 35.5494258914935, + "end_time": 45.208927025280346, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_6_A.wav", + "silence_duration": 0.46177379252696943, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. Do you have the receipt with you? I think they will ask you to show them the receipt first.", + "original_text": "OK. Do you have the receipt with you? I think they will ask you to show them the receipt first.", + "start_time": 45.7158457149922, + "end_time": 50.893895601613515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_7_B.wav", + "silence_duration": 0.5069186897118552, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I forgot to mention—before you interrupted—what were you saying about me being a shopaholic?", + "original_text": "Oh, I forgot to mention—before you interrupted—what were you saying about me being a shopaholic?", + "start_time": 51.47418187003142, + "end_time": 57.16307075892031, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_8_A.wav", + "silence_duration": 0.5802862684179088, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was just saying you really have a knack for shopping, but I guess it's justified if you need to exchange something.", + "original_text": "I was just saying you really have a knack for shopping, but I guess it's justified if you need to exchange something.", + "start_time": 57.49917870224439, + "end_time": 62.51468890632603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--158/temp/line_9_B.wav", + "silence_duration": 0.3361079433240824, + "is_interrupted": false + } + ] + }, + "DialogSum--val--159": { + "original_text": "A: Good morning. Phyllis Seymour speaking.\nB: Hi, Ms. Seymour? It's Allan Parker. I've been waiting to call you and thank you for all your help last week.\nA: Thank you very much, Mr. Parker. But, that is my [interrupt] pleasure and I truly mean it. Helping clients like you navigate through complex situations is what makes my job so rewarding and fulfilling in the first place.\nB: Sorry to jump in, but I just wanted to ask—did everything go smoothly after we made those final adjustments?\nA: Yes, everything went well. I was going to say that it's my job to assist, but I appreciate your kind words. By the way, you mentioned wanting to let my boss know something?\nB: Oh, right! I was saying that she'd better hold on to you! You're a hard worker!", + "cleaned_text": "A: Good morning. Phyllis Seymour speaking.\nB: Hi, Ms. Seymour? It's Allan Parker. I've been waiting to call you and thank you for all your help last week.\nA:Thank you very much, Mr. Parker. But, that is my pleasure and I truly mean it. Helping clients like you navigate through complex situations is what makes my job so rewarding and fulfilling in the first place.\nB: Sorry to jump in, but I just wanted to ask—did everything go smoothly after we made those final adjustments?\nA: Yes, everything went well. I was going to say that it's my job to assist, but I appreciate your kind words. By the way, you mentioned wanting to let my boss know something?\nB: Oh, right! I was saying that she'd better hold on to you! You're a hard worker!", + "total_duration": 36.087755102040816, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good morning. Phyllis Seymour speaking.", + "original_text": "Good morning. Phyllis Seymour speaking.", + "start_time": 0, + "end_time": 2.2175056689342405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hi, Ms. Seymour? It's Allan Parker. I've been waiting to call you and thank you for all your help last week.", + "original_text": "Hi, Ms. Seymour? It's Allan Parker. I've been waiting to call you and thank you for all your help last week.", + "start_time": 2.5671811065730354, + "end_time": 8.302509904758978, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/temp/line_1_B.wav", + "silence_duration": 0.34967543763879516, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you very much, Mr. Parker. But, that is my", + "original_text": "Thank you very much, Mr. Parker. But, that is my [interrupt] pleasure and I truly mean it. Helping clients like you navigate through complex situations is what makes my job so rewarding and fulfilling in the first place.", + "start_time": 8.68857893090681, + "end_time": 21.006764871949894, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/temp/line_2_A.wav", + "silence_duration": 0.38606902614783284, + "is_interrupted": true, + "text_after_interrupt": "pleasure and I truly mean it. Helping clients like you navigate through complex situations is what makes my job so rewarding and fulfilling in the first place." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but I just wanted to ask—did everything go smoothly after we made those final adjustments?", + "original_text": "Sorry to jump in, but I just wanted to ask—did everything go smoothly after we made those final adjustments?", + "start_time": 12.54309140256214, + "end_time": 18.1158805182084, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/temp/line_3_B.wav", + "silence_duration": 0.3707359130446497, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, everything went well. I was going to say that it's my job to assist, but I appreciate your kind words. By the way, you mentioned wanting to let my boss know something?", + "original_text": "Yes, everything went well. I was going to say that it's my job to assist, but I appreciate your kind words. By the way, you mentioned wanting to let my boss know something?", + "start_time": 21.40883362284319, + "end_time": 31.428244053682192, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/temp/line_4_A.wav", + "silence_duration": 0.4020687508932962, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! I was saying that she'd better hold on to you! You're a hard worker!", + "original_text": "Oh, right! I was saying that she'd better hold on to you! You're a hard worker!", + "start_time": 31.896593093987487, + "end_time": 36.08779490804645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--159/temp/line_5_B.wav", + "silence_duration": 0.46834904030529567, + "is_interrupted": false + } + ] + }, + "DialogSum--val--160": { + "original_text": "A: Well, Mike, nowadays there's much talk about nanometer. But what on earth is it? \nB: Nanometer is a length scale. It's one billionth of a meter, roughly ten times the size of an individual [interrupt] atoms, which are the building blocks of matter and understanding their scale is crucial for nanotechnology applications in medicine and electronics. \nA: Sorry to interrupt, but when you say \"ten times the size,\" do you mean it's ten times larger or smaller than an atom? \nB: It's ten times larger than an individual atom. But as I was saying, it's still extremely small. For comparison, 10 NM is 1000 times smaller than the diameter of a human hair. There are as many nanometers in an inch as there are inches in [interrupt] a long distance, which makes it a very tiny unit of measurement that's essential for working with materials at the atomic and molecular level. \nA: Wait, could you clarify that part about nanometers and inches again? I want to make sure I got that right. \nB: Sure, I was just saying that there are as many nanometers in an inch as there are inches in 400 miles.", + "cleaned_text": "A: Well, Mike, nowadays there's much talk about nanometer. But what on earth is it? \nB:Nanometer is a length scale. It's one billionth of a meter, roughly ten times the size of an individual atoms, which are the building blocks of matter and understanding their scale is crucial for nanotechnology applications in medicine and electronics.\nA: Sorry to interrupt, but when you say \"ten times the size,\" do you mean it's ten times larger or smaller than an atom? \nB:It's ten times larger than an individual atom. But as I was saying, it's still extremely small. For comparison, 10 NM is 1000 times smaller than the diameter of a human hair. There are as many nanometers in an inch as there are inches in a long distance, which makes it a very tiny unit of measurement that's essential for working with materials at the atomic and molecular level.\nA: Wait, could you clarify that part about nanometers and inches again? I want to make sure I got that right. \nB: Sure, I was just saying that there are as many nanometers in an inch as there are inches in 400 miles.", + "total_duration": 56.8390022675737, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, Mike, nowadays there's much talk about nanometer. But what on earth is it?", + "original_text": "Well, Mike, nowadays there's much talk about nanometer. But what on earth is it?", + "start_time": 0, + "end_time": 5.979138321995465, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Nanometer is a length scale. It's one billionth of a meter, roughly ten times the size of an individual", + "original_text": "Nanometer is a length scale. It's one billionth of a meter, roughly ten times the size of an individual [interrupt] atoms, which are the building blocks of matter and understanding their scale is crucial for nanotechnology applications in medicine and electronics.", + "start_time": 6.524616435496629, + "end_time": 20.235999655451277, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/temp/line_1_B.wav", + "silence_duration": 0.5454781135011644, + "is_interrupted": true, + "text_after_interrupt": "atoms, which are the building blocks of matter and understanding their scale is crucial for nanotechnology applications in medicine and electronics." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but when you say \"ten times the size,\" do you mean it's ten times larger or smaller than an atom?", + "original_text": "Sorry to interrupt, but when you say \"ten times the size,\" do you mean it's ten times larger or smaller than an atom?", + "start_time": 12.480534802843568, + "end_time": 20.677178793773273, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/temp/line_2_A.wav", + "silence_duration": 0.5995395098160606, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's ten times larger than an individual atom. But as I was saying, it's still extremely small. For comparison, 10 NM is 1000 times smaller than the diameter of a human hair. There are as many nanometers in an inch as there are inches in", + "original_text": "It's ten times larger than an individual atom. But as I was saying, it's still extremely small. For comparison, 10 NM is 1000 times smaller than the diameter of a human hair. There are as many nanometers in an inch as there are inches in [interrupt] a long distance, which makes it a very tiny unit of measurement that's essential for working with materials at the atomic and molecular level.", + "start_time": 21.10039241923296, + "end_time": 42.23055114939169, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/temp/line_3_B.wav", + "silence_duration": 0.42321362545968944, + "is_interrupted": true, + "text_after_interrupt": "a long distance, which makes it a very tiny unit of measurement that's essential for working with materials at the atomic and molecular level." + }, + { + "speaker": "A", + "text": "Wait, could you clarify that part about nanometers and inches again? I want to make sure I got that right.", + "original_text": "Wait, could you clarify that part about nanometers and inches again? I want to make sure I got that right.", + "start_time": 43.788738016318334, + "end_time": 50.627014660309264, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/temp/line_4_A.wav", + "silence_duration": 0.3758603680226678, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, I was just saying that there are as many nanometers in an inch as there are inches in 400 miles.", + "original_text": "Sure, I was just saying that there are as many nanometers in an inch as there are inches in 400 miles.", + "start_time": 51.21980852099551, + "end_time": 56.839037545938815, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--160/temp/line_5_B.wav", + "silence_duration": 0.5927938606862406, + "is_interrupted": false + } + ] + }, + "DialogSum--val--161": { + "original_text": "A: I heard that Ben is forming his own band. \nB: It will be a rock and roll band probably. He's a very good guitarist. \nA: Can you play a musical instrument? If you can, he might ask you to [interrupt] join his band as a drummer, especially since he's looking for a good rhythm section to complement his guitar skills and complete the band's lineup. \nB: I can play drums, but I haven't played for a while. I'm not sure I'd be good enough to play in a band. \nA: I wish I could play a musical instrument. I love music. \nB: Nowadays, you can be a DJ. You can mix dance music. You don't need to be able to play a musical instrument or [interrupt] spend years learning music theory like traditional musicians do because modern DJ software comes with intuitive interfaces and built-in tutorials that make the learning process much easier. \nA: I love to try it, but the instrument is expensive and it still needs a lot of practice. By the way, you mentioned Ben might ask me to join the band? \nB: Oh, right! If you get back into drumming, Ben might consider asking you to join. You should give it some thought! \nA: Maybe I will. And about that DJ idea, I could try using a computer program to mix music.", + "cleaned_text": "A: I heard that Ben is forming his own band. \nB: It will be a rock and roll band probably. He's a very good guitarist. \nA:Can you play a musical instrument? If you can, he might ask you to join his band as a drummer, especially since he's looking for a good rhythm section to complement his guitar skills and complete the band's lineup.\nB: I can play drums, but I haven't played for a while. I'm not sure I'd be good enough to play in a band. \nA: I wish I could play a musical instrument. I love music. \nB:Nowadays, you can be a DJ. You can mix dance music. You don't need to be able to play a musical instrument or spend years learning music theory like traditional musicians do because modern DJ software comes with intuitive interfaces and built-in tutorials that make the learning process much easier.\nA: I love to try it, but the instrument is expensive and it still needs a lot of practice. By the way, you mentioned Ben might ask me to join the band? \nB: Oh, right! If you get back into drumming, Ben might consider asking you to join. You should give it some thought! \nA: Maybe I will. And about that DJ idea, I could try using a computer program to mix music.", + "total_duration": 58.9340589569161, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I heard that Ben is forming his own band.", + "original_text": "I heard that Ben is forming his own band.", + "start_time": 0, + "end_time": 2.5309750566893423, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It will be a rock and roll band probably. He's a very good guitarist.", + "original_text": "It will be a rock and roll band probably. He's a very good guitarist.", + "start_time": 3.0010240475071632, + "end_time": 6.751046723244125, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_1_B.wav", + "silence_duration": 0.4700489908178209, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can you play a musical instrument? If you can, he might ask you to", + "original_text": "Can you play a musical instrument? If you can, he might ask you to [interrupt] join his band as a drummer, especially since he's looking for a good rhythm section to complement his guitar skills and complete the band's lineup.", + "start_time": 7.227892806712864, + "end_time": 20.184627500590416, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_2_A.wav", + "silence_duration": 0.4768460834687396, + "is_interrupted": true, + "text_after_interrupt": "join his band as a drummer, especially since he's looking for a good rhythm section to complement his guitar skills and complete the band's lineup." + }, + { + "speaker": "B", + "text": "I can play drums, but I haven't played for a while. I'm not sure I'd be good enough to play in a band.", + "original_text": "I can play drums, but I haven't played for a while. I'm not sure I'd be good enough to play in a band.", + "start_time": 11.802223872472501, + "end_time": 17.34018305614597, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_3_B.wav", + "silence_duration": 0.36799529004950987, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I wish I could play a musical instrument. I love music.", + "original_text": "I wish I could play a musical instrument. I love music.", + "start_time": 20.77450030517049, + "end_time": 24.32715336639498, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_4_A.wav", + "silence_duration": 0.5898728045800768, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Nowadays, you can be a DJ. You can mix dance music. You don't need to be able to play a musical instrument or", + "original_text": "Nowadays, you can be a DJ. You can mix dance music. You don't need to be able to play a musical instrument or [interrupt] spend years learning music theory like traditional musicians do because modern DJ software comes with intuitive interfaces and built-in tutorials that make the learning process much easier.", + "start_time": 24.726426637471246, + "end_time": 41.259034347221814, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_5_B.wav", + "silence_duration": 0.39927327107626503, + "is_interrupted": true, + "text_after_interrupt": "spend years learning music theory like traditional musicians do because modern DJ software comes with intuitive interfaces and built-in tutorials that make the learning process much easier." + }, + { + "speaker": "A", + "text": "I love to try it, but the instrument is expensive and it still needs a lot of practice. By the way, you mentioned Ben might ask me to join the band?", + "original_text": "I love to try it, but the instrument is expensive and it still needs a lot of practice. By the way, you mentioned Ben might ask me to join the band?", + "start_time": 36.71881004703491, + "end_time": 45.67010256404171, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_6_A.wav", + "silence_duration": 0.5364096910459999, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! If you get back into drumming, Ben might consider asking you to join. You should give it some thought!", + "original_text": "Oh, right! If you get back into drumming, Ben might consider asking you to join. You should give it some thought!", + "start_time": 46.01838701110571, + "end_time": 52.067185197046754, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_7_B.wav", + "silence_duration": 0.3482844470639978, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Maybe I will. And about that DJ idea, I could try using a computer program to mix music.", + "original_text": "Maybe I will. And about that DJ idea, I could try using a computer program to mix music.", + "start_time": 52.664679607435474, + "end_time": 58.93406736253751, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--161/temp/line_8_A.wav", + "silence_duration": 0.5974944103887193, + "is_interrupted": false + } + ] + }, + "DialogSum--val--162": { + "original_text": "A: Where can I buy textbooks? \nB: First, you need to have the list of books for your class. Do you have [interrupt] the list with you right now or do you need to get it from your professor's office first? \nA: Yes, I have that. \nB: Well, when you have that, you can take it over to the bookstore. Can you find it? \nA: No, I don't know where the bookstore is. \nB: Just pass the gym and it's the first door on your left. Were you aware that you can also turn in your old textbooks for [interrupt] some extra cash if they're in good condition? The bookstore usually offers about 30-50% of the original price depending on demand and book condition. \nA: Really? How can I do that? \nB: Take your used textbooks with you and give them to the representative near the entrance. He will pay you for them. Are you going today? \nA: No, I can't make it today. \nB: I could help you with buying your books if you meet me there at 1. \nA: No, thanks. I'm good. \nB: I'll see you later then. Have a great day!", + "cleaned_text": "A: Where can I buy textbooks? \nB:First, you need to have the list of books for your class. Do you have the list with you right now or do you need to get it from your professor's office first?\nA: Yes, I have that. \nB: Well, when you have that, you can take it over to the bookstore. Can you find it? \nA: No, I don't know where the bookstore is. \nB:Just pass the gym and it's the first door on your left. Were you aware that you can also turn in your old textbooks for some extra cash if they're in good condition? The bookstore usually offers about 30-50% of the original price depending on demand and book condition.\nA: Really? How can I do that? \nB: Take your used textbooks with you and give them to the representative near the entrance. He will pay you for them. Are you going today? \nA: No, I can't make it today. \nB: I could help you with buying your books if you meet me there at 1. \nA: No, thanks. I'm good. \nB: I'll see you later then. Have a great day!", + "total_duration": 47.3459410430839, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Where can I buy textbooks?", + "original_text": "Where can I buy textbooks?", + "start_time": 0, + "end_time": 1.7182766439909296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "First, you need to have the list of books for your class. Do you have", + "original_text": "First, you need to have the list of books for your class. Do you have [interrupt] the list with you right now or do you need to get it from your professor's office first?", + "start_time": 2.097178847388994, + "end_time": 9.52756433491734, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_1_B.wav", + "silence_duration": 0.3789022033980646, + "is_interrupted": true, + "text_after_interrupt": "the list with you right now or do you need to get it from your professor's office first?" + }, + { + "speaker": "A", + "text": "Yes, I have that.", + "original_text": "Yes, I have that.", + "start_time": 5.951691319044323, + "end_time": 7.402938484577202, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_2_A.wav", + "silence_duration": 0.3072705874439552, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, when you have that, you can take it over to the bookstore. Can you find it?", + "original_text": "Well, when you have that, you can take it over to the bookstore. Can you find it?", + "start_time": 10.088746092492233, + "end_time": 13.583349267095407, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_3_B.wav", + "silence_duration": 0.5611817575748934, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, I don't know where the bookstore is.", + "original_text": "No, I don't know where the bookstore is.", + "start_time": 14.112736524298509, + "end_time": 16.481171898448167, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_4_A.wav", + "silence_duration": 0.5293872572031022, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just pass the gym and it's the first door on your left. Were you aware that you can also turn in your old textbooks for", + "original_text": "Just pass the gym and it's the first door on your left. Were you aware that you can also turn in your old textbooks for [interrupt] some extra cash if they're in good condition? The bookstore usually offers about 30-50% of the original price depending on demand and book condition.", + "start_time": 16.905676208159747, + "end_time": 30.222320199089452, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_5_B.wav", + "silence_duration": 0.42450430971158115, + "is_interrupted": true, + "text_after_interrupt": "some extra cash if they're in good condition? The bookstore usually offers about 30-50% of the original price depending on demand and book condition." + }, + { + "speaker": "A", + "text": "Really? How can I do that?", + "original_text": "Really? How can I do that?", + "start_time": 23.32191607159863, + "end_time": 25.713571400396816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_6_A.wav", + "silence_duration": 0.42336510926955767, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Take your used textbooks with you and give them to the representative near the entrance. He will pay you for them. Are you going today?", + "original_text": "Take your used textbooks with you and give them to the representative near the entrance. He will pay you for them. Are you going today?", + "start_time": 30.790892813469476, + "end_time": 37.2228202511112, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_7_B.wav", + "silence_duration": 0.5685726143800243, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, I can't make it today.", + "original_text": "No, I can't make it today.", + "start_time": 37.66393835661171, + "end_time": 39.498314773845266, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_8_A.wav", + "silence_duration": 0.44111810550050823, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I could help you with buying your books if you meet me there at 1.", + "original_text": "I could help you with buying your books if you meet me there at 1.", + "start_time": 39.92495977644225, + "end_time": 42.804234152859486, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_9_B.wav", + "silence_duration": 0.4266450025969833, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, thanks. I'm good.", + "original_text": "No, thanks. I'm good.", + "start_time": 43.18388889295793, + "end_time": 44.7628458090577, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_10_A.wav", + "silence_duration": 0.3796547400984477, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll see you later then. Have a great day!", + "original_text": "I'll see you later then. Have a great day!", + "start_time": 45.33745094161327, + "end_time": 47.34597701871078, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--162/temp/line_11_B.wav", + "silence_duration": 0.5746051325555712, + "is_interrupted": false + } + ] + }, + "DialogSum--val--163": { + "original_text": "A: I'm going to try sky diving this weekend. \nB: I wouldn't do it if I were you. \nA: It sounds like [interrupt] a thrilling experience, something I've always wanted to try ever since I saw those breathtaking videos of people freefalling through the clouds with the most spectacular views imaginable. \nB: Sorry to jump in, but have you thought about the safety measures? It's very dangerous, you know. \nA: I want to try something exciting. \nB: It's an easy way to get hurt, let me tell you. \nA: I'll tell you all about it next Monday. By the way, you mentioned safety measures earlier—what exactly did you mean? \nB: Well, take care of yourself, and don't say I didn't warn you.", + "cleaned_text": "A: I'm going to try sky diving this weekend. \nB: I wouldn't do it if I were you. \nA:It sounds like a thrilling experience, something I've always wanted to try ever since I saw those breathtaking videos of people freefalling through the clouds with the most spectacular views imaginable.\nB: Sorry to jump in, but have you thought about the safety measures? It's very dangerous, you know. \nA: I want to try something exciting. \nB: It's an easy way to get hurt, let me tell you. \nA: I'll tell you all about it next Monday. By the way, you mentioned safety measures earlier—what exactly did you mean? \nB: Well, take care of yourself, and don't say I didn't warn you.", + "total_duration": 32.39569160997733, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm going to try sky diving this weekend.", + "original_text": "I'm going to try sky diving this weekend.", + "start_time": 0, + "end_time": 2.5193650793650795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I wouldn't do it if I were you.", + "original_text": "I wouldn't do it if I were you.", + "start_time": 2.962575210738239, + "end_time": 4.576362058810801, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_1_B.wav", + "silence_duration": 0.4432101313731596, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It sounds like", + "original_text": "It sounds like [interrupt] a thrilling experience, something I've always wanted to try ever since I saw those breathtaking videos of people freefalling through the clouds with the most spectacular views imaginable.", + "start_time": 4.957527339501261, + "end_time": 17.473082895056816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_2_A.wav", + "silence_duration": 0.38116528069045935, + "is_interrupted": true, + "text_after_interrupt": "a thrilling experience, something I've always wanted to try ever since I saw those breathtaking videos of people freefalling through the clouds with the most spectacular views imaginable." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but have you thought about the safety measures? It's very dangerous, you know.", + "original_text": "Sorry to jump in, but have you thought about the safety measures? It's very dangerous, you know.", + "start_time": 6.0488652079819865, + "end_time": 11.14564525333346, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_3_B.wav", + "silence_duration": 0.5047903300738846, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I want to try something exciting.", + "original_text": "I want to try something exciting.", + "start_time": 17.90844371656658, + "end_time": 19.77765006577293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_4_A.wav", + "silence_duration": 0.4353608215097645, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's an easy way to get hurt, let me tell you.", + "original_text": "It's an easy way to get hurt, let me tell you.", + "start_time": 20.21331060282799, + "end_time": 22.34954643049239, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_5_B.wav", + "silence_duration": 0.4356605370550572, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'll tell you all about it next Monday. By the way, you mentioned safety measures earlier—what exactly did you mean?", + "original_text": "I'll tell you all about it next Monday. By the way, you mentioned safety measures earlier—what exactly did you mean?", + "start_time": 22.829470590467817, + "end_time": 29.226568096136752, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_6_A.wav", + "silence_duration": 0.47992415997543003, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, take care of yourself, and don't say I didn't warn you.", + "original_text": "Well, take care of yourself, and don't say I didn't warn you.", + "start_time": 29.562863940694758, + "end_time": 32.39569840781494, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--163/temp/line_7_B.wav", + "silence_duration": 0.33629584455800476, + "is_interrupted": false + } + ] + }, + "DialogSum--val--164": { + "original_text": "A: So, Emily, how was your day? \nB: I don't think you really want to hear about it. \nA: It can't have been that bad. Go on and tell me about it. \nB: To be honest, it was horrible! My manager is such a pain in the neck! \nA: Why? What happened? \nB: Well, he made quite a few mistakes on the monthly report and when his supervisor found them, my manager blamed them on [interrupt] me, even though I wasn't the one who worked on that section of the report and had clear evidence showing I wasn't involved in that project at all. \nA: Wait, he blamed you? That's completely unfair! How did you respond to that? \nB: There wasn't really anything that I could do. There's always been a lot of bad blood between my manager and myself. If I had said anything, he would have fired me for sure. \nA: Does he treat everyone in your department like this? \nB: He treats everyone pretty badly, but the way he treats me really takes the cake! \nA: Do you have any idea why he treats you worse than the others? \nB: I really have no idea. All I know is that the thought of him really curls my hair! Oh, and about the report, I didn't get to finish earlier—he blamed the mistakes on me, but I couldn't even defend myself. \nA: That's so frustrating. Maybe there's a way to address this with HR?", + "cleaned_text": "A: So, Emily, how was your day? \nB: I don't think you really want to hear about it. \nA: It can't have been that bad. Go on and tell me about it. \nB: To be honest, it was horrible! My manager is such a pain in the neck! \nA: Why? What happened? \nB:Well, he made quite a few mistakes on the monthly report and when his supervisor found them, my manager blamed them on me, even though I wasn't the one who worked on that section of the report and had clear evidence showing I wasn't involved in that project at all.\nA: Wait, he blamed you? That's completely unfair! How did you respond to that? \nB: There wasn't really anything that I could do. There's always been a lot of bad blood between my manager and myself. If I had said anything, he would have fired me for sure. \nA: Does he treat everyone in your department like this? \nB: He treats everyone pretty badly, but the way he treats me really takes the cake! \nA: Do you have any idea why he treats you worse than the others? \nB: I really have no idea. All I know is that the thought of him really curls my hair! Oh, and about the report, I didn't get to finish earlier—he blamed the mistakes on me, but I couldn't even defend myself. \nA: That's so frustrating. Maybe there's a way to address this with HR?", + "total_duration": 65.28984126984128, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So, Emily, how was your day?", + "original_text": "So, Emily, how was your day?", + "start_time": 0, + "end_time": 1.8692063492063493, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't think you really want to hear about it.", + "original_text": "I don't think you really want to hear about it.", + "start_time": 2.1868173119748615, + "end_time": 4.0792436158297365, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_1_B.wav", + "silence_duration": 0.31761096276851214, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It can't have been that bad. Go on and tell me about it.", + "original_text": "It can't have been that bad. Go on and tell me about it.", + "start_time": 4.3885300316720794, + "end_time": 8.161772662057567, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_2_A.wav", + "silence_duration": 0.3092864158423431, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "To be honest, it was horrible! My manager is such a pain in the neck!", + "original_text": "To be honest, it was horrible! My manager is such a pain in the neck!", + "start_time": 8.637374761866116, + "end_time": 12.66603689338539, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_3_B.wav", + "silence_duration": 0.4756020998085492, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why? What happened?", + "original_text": "Why? What happened?", + "start_time": 13.006140318440368, + "end_time": 14.178748028190935, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_4_A.wav", + "silence_duration": 0.34010342505497665, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, he made quite a few mistakes on the monthly report and when his supervisor found them, my manager blamed them on", + "original_text": "Well, he made quite a few mistakes on the monthly report and when his supervisor found them, my manager blamed them on [interrupt] me, even though I wasn't the one who worked on that section of the report and had clear evidence showing I wasn't involved in that project at all.", + "start_time": 14.499835151132304, + "end_time": 28.21121837108695, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_5_B.wav", + "silence_duration": 0.321087122941369, + "is_interrupted": true, + "text_after_interrupt": "me, even though I wasn't the one who worked on that section of the report and had clear evidence showing I wasn't involved in that project at all." + }, + { + "speaker": "A", + "text": "Wait, he blamed you? That's completely unfair! How did you respond to that?", + "original_text": "Wait, he blamed you? That's completely unfair! How did you respond to that?", + "start_time": 20.815662815531397, + "end_time": 26.353621999204865, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_6_A.wav", + "silence_duration": 0.5308565592063332, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There wasn't really anything that I could do. There's always been a lot of bad blood between my manager and myself. If I had said anything, he would have fired me for sure.", + "original_text": "There wasn't really anything that I could do. There's always been a lot of bad blood between my manager and myself. If I had said anything, he would have fired me for sure.", + "start_time": 28.743720600762913, + "end_time": 38.159412210740236, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_7_B.wav", + "silence_duration": 0.5325022296759616, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Does he treat everyone in your department like this?", + "original_text": "Does he treat everyone in your department like this?", + "start_time": 38.58119862242945, + "end_time": 41.1702235657401, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_8_A.wav", + "silence_duration": 0.4217864116892105, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "He treats everyone pretty badly, but the way he treats me really takes the cake!", + "original_text": "He treats everyone pretty badly, but the way he treats me really takes the cake!", + "start_time": 41.58466875681442, + "end_time": 45.60172091100944, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_9_B.wav", + "silence_duration": 0.4144451910743231, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you have any idea why he treats you worse than the others?", + "original_text": "Do you have any idea why he treats you worse than the others?", + "start_time": 45.91977903080206, + "end_time": 49.112522794974396, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_10_A.wav", + "silence_duration": 0.31805811979262544, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I really have no idea. All I know is that the thought of him really curls my hair! Oh, and about the report, I didn't get to finish earlier—he blamed the mistakes on me, but I couldn't even defend myself.", + "original_text": "I really have no idea. All I know is that the thought of him really curls my hair! Oh, and about the report, I didn't get to finish earlier—he blamed the mistakes on me, but I couldn't even defend myself.", + "start_time": 49.49472495566771, + "end_time": 60.38488368582644, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_11_B.wav", + "silence_duration": 0.38220216069331364, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's so frustrating. Maybe there's a way to address this with HR?", + "original_text": "That's so frustrating. Maybe there's a way to address this with HR?", + "start_time": 60.83161419223428, + "end_time": 65.28984548475128, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--164/temp/line_12_A.wav", + "silence_duration": 0.4467305064078363, + "is_interrupted": false + } + ] + }, + "DialogSum--val--165": { + "original_text": "A: I came to this lab to have my blood drawn. \nB: You are in the right place. Roll up your left sleeve and have a seat. \nA: What am I being tested for? \nB: Your doctor wants to know what your white blood cell count [interrupt] is, which can indicate if there's an infection or another condition that needs attention, along with other important markers like hemoglobin levels and platelet counts for a comprehensive health assessment. \nA: Oh, does that mean he's worried about something specific? \nB: Usually if your white count is off, the doctor suspects an infection. But as I was saying, your white blood cell count is what we're checking. \nA: I see. How much will it hurt? \nB: It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find. \nA: Is that my blood going into that tube? \nB: That blood that just filled the tube is all that I needed. Thanks for coming in!", + "cleaned_text": "A: I came to this lab to have my blood drawn. \nB: You are in the right place. Roll up your left sleeve and have a seat. \nA: What am I being tested for? \nB:Your doctor wants to know what your white blood cell count is, which can indicate if there's an infection or another condition that needs attention, along with other important markers like hemoglobin levels and platelet counts for a comprehensive health assessment.\nA: Oh, does that mean he's worried about something specific? \nB: Usually if your white count is off, the doctor suspects an infection. But as I was saying, your white blood cell count is what we're checking. \nA: I see. How much will it hurt? \nB: It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find. \nA: Is that my blood going into that tube? \nB: That blood that just filled the tube is all that I needed. Thanks for coming in!", + "total_duration": 44.02126984126984, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I came to this lab to have my blood drawn.", + "original_text": "I came to this lab to have my blood drawn.", + "start_time": 0, + "end_time": 2.4729251700680273, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You are in the right place. Roll up your left sleeve and have a seat.", + "original_text": "You are in the right place. Roll up your left sleeve and have a seat.", + "start_time": 2.8748780353077428, + "end_time": 5.928302071588922, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_1_B.wav", + "silence_duration": 0.4019528652397155, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What am I being tested for?", + "original_text": "What am I being tested for?", + "start_time": 6.407081189056948, + "end_time": 8.0556979691023, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_2_A.wav", + "silence_duration": 0.4787791174680258, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Your doctor wants to know what your white blood cell count", + "original_text": "Your doctor wants to know what your white blood cell count [interrupt] is, which can indicate if there's an infection or another condition that needs attention, along with other important markers like hemoglobin levels and platelet counts for a comprehensive health assessment.", + "start_time": 8.370461666768206, + "end_time": 21.52456597515823, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_3_B.wav", + "silence_duration": 0.3147636976659062, + "is_interrupted": true, + "text_after_interrupt": "is, which can indicate if there's an infection or another condition that needs attention, along with other important markers like hemoglobin levels and platelet counts for a comprehensive health assessment." + }, + { + "speaker": "A", + "text": "Oh, does that mean he's worried about something specific?", + "original_text": "Oh, does that mean he's worried about something specific?", + "start_time": 11.261346020509702, + "end_time": 14.094180487629883, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_4_A.wav", + "silence_duration": 0.5448981264338182, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Usually if your white count is off, the doctor suspects an infection. But as I was saying, your white blood cell count is what we're checking.", + "original_text": "Usually if your white count is off, the doctor suspects an infection. But as I was saying, your white blood cell count is what we're checking.", + "start_time": 21.841947380536734, + "end_time": 28.993693412282767, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_5_B.wav", + "silence_duration": 0.31738140537850595, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I see. How much will it hurt?", + "original_text": "I see. How much will it hurt?", + "start_time": 29.323833733964722, + "end_time": 31.239479992468123, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_6_A.wav", + "silence_duration": 0.33014032168195745, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find.", + "original_text": "It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find.", + "start_time": 31.665247857437098, + "end_time": 36.878127676031205, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_7_B.wav", + "silence_duration": 0.425767864968976, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is that my blood going into that tube?", + "original_text": "Is that my blood going into that tube?", + "start_time": 37.29512523600195, + "end_time": 39.48941095028766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_8_A.wav", + "silence_duration": 0.4169975599707421, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That blood that just filled the tube is all that I needed. Thanks for coming in!", + "original_text": "That blood that just filled the tube is all that I needed. Thanks for coming in!", + "start_time": 39.992624524806956, + "end_time": 44.02128665632623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--165/temp/line_9_B.wav", + "silence_duration": 0.5032135745192905, + "is_interrupted": false + } + ] + }, + "DialogSum--val--166": { + "original_text": "A: Do you have this design with only one breast pocket? \nB: Let me see. Oh, we have the design but not the same color as [interrupt] the one you're holding right now, but we do have it in several other elegant shades that might suit your preferences better, including some beautiful earth tones and soft pastels. \nA: Sorry to interrupt, but is the color you have more subtle? I prefer something that's not too loud. \nB: Yes, it's a more muted shade, but I was going to mention that it's a bit different from this one in terms of fabric as well. \nA: Oh, I see. What kind of fabric is it?", + "cleaned_text": "A: Do you have this design with only one breast pocket? \nB:Let me see. Oh, we have the design but not the same color as the one you're holding right now, but we do have it in several other elegant shades that might suit your preferences better, including some beautiful earth tones and soft pastels.\nA: Sorry to interrupt, but is the color you have more subtle? I prefer something that's not too loud. \nB: Yes, it's a more muted shade, but I was going to mention that it's a bit different from this one in terms of fabric as well. \nA: Oh, I see. What kind of fabric is it?", + "total_duration": 24.789478458049885, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you have this design with only one breast pocket?", + "original_text": "Do you have this design with only one breast pocket?", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let me see. Oh, we have the design but not the same color as", + "original_text": "Let me see. Oh, we have the design but not the same color as [interrupt] the one you're holding right now, but we do have it in several other elegant shades that might suit your preferences better, including some beautiful earth tones and soft pastels.", + "start_time": 3.0448182591859365, + "end_time": 14.875385152609972, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/temp/line_1_B.wav", + "silence_duration": 0.4557933158752786, + "is_interrupted": true, + "text_after_interrupt": "the one you're holding right now, but we do have it in several other elegant shades that might suit your preferences better, including some beautiful earth tones and soft pastels." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but is the color you have more subtle? I prefer something that's not too loud.", + "original_text": "Sorry to interrupt, but is the color you have more subtle? I prefer something that's not too loud.", + "start_time": 6.643911229707479, + "end_time": 12.657879483675732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/temp/line_2_A.wav", + "silence_duration": 0.5319631192528508, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's a more muted shade, but I was going to mention that it's a bit different from this one in terms of fabric as well.", + "original_text": "Yes, it's a more muted shade, but I was going to mention that it's a bit different from this one in terms of fabric as well.", + "start_time": 15.401952981002758, + "end_time": 21.520411030889377, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/temp/line_3_B.wav", + "silence_duration": 0.5265678283927859, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. What kind of fabric is it?", + "original_text": "Oh, I see. What kind of fabric is it?", + "start_time": 21.956662453280046, + "end_time": 24.78949692040023, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--166/temp/line_4_A.wav", + "silence_duration": 0.4362514223906693, + "is_interrupted": false + } + ] + }, + "DialogSum--val--167": { + "original_text": "A: May I be of any help? \nB: Yes. Show me the sweaters, please. \nA: What style? \nB: Well, could you bring me all the styles of pullovers? I am not quite sure which one I will [interrupt] prefer, but I want to see a variety before making a decision because sometimes the fit and color look different in person than they do online or in catalogs. \nA: Before I bring them all, do you have a preference for material? It might help narrow down the options. \nB: Oh, I hadn't thought about that. I do prefer wool over cotton. But I was going to say, I'm not sure which one I will buy yet, so having a variety would still be helpful. \nA: No problem, I'll bring a selection of wool pullovers in different styles then.", + "cleaned_text": "A: May I be of any help? \nB: Yes. Show me the sweaters, please. \nA: What style? \nB:Well, could you bring me all the styles of pullovers? I am not quite sure which one I will prefer, but I want to see a variety before making a decision because sometimes the fit and color look different in person than they do online or in catalogs.\nA: Before I bring them all, do you have a preference for material? It might help narrow down the options. \nB: Oh, I hadn't thought about that. I do prefer wool over cotton. But I was going to say, I'm not sure which one I will buy yet, so having a variety would still be helpful. \nA: No problem, I'll bring a selection of wool pullovers in different styles then.", + "total_duration": 33.35900226757369, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I be of any help?", + "original_text": "May I be of any help?", + "start_time": 0, + "end_time": 1.3119274376417234, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. Show me the sweaters, please.", + "original_text": "Yes. Show me the sweaters, please.", + "start_time": 1.803992726873136, + "end_time": 3.9982784411588503, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/temp/line_1_B.wav", + "silence_duration": 0.4920652892314126, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What style?", + "original_text": "What style?", + "start_time": 4.5774060996767085, + "end_time": 5.587474126887593, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/temp/line_2_A.wav", + "silence_duration": 0.5791276585178585, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, could you bring me all the styles of pullovers? I am not quite sure which one I will", + "original_text": "Well, could you bring me all the styles of pullovers? I am not quite sure which one I will [interrupt] prefer, but I want to see a variety before making a decision because sometimes the fit and color look different in person than they do online or in catalogs.", + "start_time": 6.14312921984016, + "end_time": 19.274013573581655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/temp/line_3_B.wav", + "silence_duration": 0.5556550929525674, + "is_interrupted": true, + "text_after_interrupt": "prefer, but I want to see a variety before making a decision because sometimes the fit and color look different in person than they do online or in catalogs." + }, + { + "speaker": "A", + "text": "Before I bring them all, do you have a preference for material? It might help narrow down the options.", + "original_text": "Before I bring them all, do you have a preference for material? It might help narrow down the options.", + "start_time": 11.019319696030637, + "end_time": 17.23065756451136, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/temp/line_4_A.wav", + "silence_duration": 0.49137801752507393, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I hadn't thought about that. I do prefer wool over cotton. But I was going to say, I'm not sure which one I will buy yet, so having a variety would still be helpful.", + "original_text": "Oh, I hadn't thought about that. I do prefer wool over cotton. But I was going to say, I'm not sure which one I will buy yet, so having a variety would still be helpful.", + "start_time": 19.68193054676515, + "end_time": 28.551953222502114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/temp/line_5_B.wav", + "silence_duration": 0.4079169731834984, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No problem, I'll bring a selection of wool pullovers in different styles then.", + "original_text": "No problem, I'll bring a selection of wool pullovers in different styles then.", + "start_time": 28.970458932468365, + "end_time": 33.35903036103979, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--167/temp/line_6_A.wav", + "silence_duration": 0.4185057099662508, + "is_interrupted": false + } + ] + }, + "DialogSum--val--169": { + "original_text": "A: Let's do something really nice for our family this Christmas. \nB: What did you have in [interrupt] mind for that? I was thinking we could plan a special family trip or create personalized gifts that reflect our shared memories and values. \nA: Sorry, I just want to clarify—are you thinking of something like an experience or a physical gift? \nB: I'm not sure yet. I just know I want to get out of the mindless gift trap. \nA: I know what you mean. I want to give a gift that is really meaningful. \nB: Or do something that shows we have spent time thinking about them. \nA: Right, or maybe something that only we are able to give them. By the way, what did you have in mind earlier?", + "cleaned_text": "A: Let's do something really nice for our family this Christmas. \nB:What did you have in mind for that? I was thinking we could plan a special family trip or create personalized gifts that reflect our shared memories and values.\nA: Sorry, I just want to clarify—are you thinking of something like an experience or a physical gift? \nB: I'm not sure yet. I just know I want to get out of the mindless gift trap. \nA: I know what you mean. I want to give a gift that is really meaningful. \nB: Or do something that shows we have spent time thinking about them. \nA: Right, or maybe something that only we are able to give them. By the way, what did you have in mind earlier?", + "total_duration": 30.451020408163266, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Let's do something really nice for our family this Christmas.", + "original_text": "Let's do something really nice for our family this Christmas.", + "start_time": 0, + "end_time": 3.1695238095238096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What did you have in", + "original_text": "What did you have in [interrupt] mind for that? I was thinking we could plan a special family trip or create personalized gifts that reflect our shared memories and values.", + "start_time": 3.73000296954061, + "end_time": 11.740887323282108, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/temp/line_1_B.wav", + "silence_duration": 0.5604791600168001, + "is_interrupted": true, + "text_after_interrupt": "mind for that? I was thinking we could plan a special family trip or create personalized gifts that reflect our shared memories and values." + }, + { + "speaker": "A", + "text": "Sorry, I just want to clarify—are you thinking of something like an experience or a physical gift?", + "original_text": "Sorry, I just want to clarify—are you thinking of something like an experience or a physical gift?", + "start_time": 4.763290951400021, + "end_time": 11.055898661150588, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/temp/line_2_A.wav", + "silence_duration": 0.4656567872990765, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm not sure yet. I just know I want to get out of the mindless gift trap.", + "original_text": "I'm not sure yet. I just know I want to get out of the mindless gift trap.", + "start_time": 12.330730408102, + "end_time": 15.860163514677962, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/temp/line_3_B.wav", + "silence_duration": 0.5898430848198909, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I know what you mean. I want to give a gift that is really meaningful.", + "original_text": "I know what you mean. I want to give a gift that is really meaningful.", + "start_time": 16.229867934222824, + "end_time": 20.548779498848674, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/temp/line_4_A.wav", + "silence_duration": 0.3697044195448616, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Or do something that shows we have spent time thinking about them.", + "original_text": "Or do something that shows we have spent time thinking about them.", + "start_time": 21.08330456357015, + "end_time": 23.939358985338856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/temp/line_5_B.wav", + "silence_duration": 0.5345250647214759, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Right, or maybe something that only we are able to give them. By the way, what did you have in mind earlier?", + "original_text": "Right, or maybe something that only we are able to give them. By the way, what did you have in mind earlier?", + "start_time": 24.23971834918735, + "end_time": 30.451056217668075, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--169/temp/line_6_A.wav", + "silence_duration": 0.30035936384849143, + "is_interrupted": false + } + ] + }, + "DialogSum--val--170": { + "original_text": "A: What's up, how are you? \nB: I'm splendid. How about yourself? \nA: Could be better. \nB: So, have you been on the bus very [interrupt] long today or did you just hop on recently? I'm curious because the traffic seems lighter than usual this morning. \nA: Sorry to cut in, but I was just curious, how often do you ride the bus? \nB: I usually just drive. \nA: You have your own vehicle? \nB: Yes, I have my own car. \nA: So then, why don't you [interrupt] drive today instead of taking the bus? Is there a particular reason or are you just trying something different for a change? \nB: Oh, before I forget, you mentioned earlier about how long I've been on the bus. I got on about fifteen minutes ago. And as for why I'm not driving, I'm waiting for our President to lower the gas prices. \nA: Smart.", + "cleaned_text": "A: What's up, how are you? \nB: I'm splendid. How about yourself? \nA: Could be better. \nB:So, have you been on the bus very long today or did you just hop on recently? I'm curious because the traffic seems lighter than usual this morning.\nA: Sorry to cut in, but I was just curious, how often do you ride the bus? \nB: I usually just drive. \nA: You have your own vehicle? \nB: Yes, I have my own car. \nA:So then, why don't you drive today instead of taking the bus? Is there a particular reason or are you just trying something different for a change?\nB: Oh, before I forget, you mentioned earlier about how long I've been on the bus. I got on about fifteen minutes ago. And as for why I'm not driving, I'm waiting for our President to lower the gas prices. \nA: Smart.", + "total_duration": 37.907981859410434, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What's up, how are you?", + "original_text": "What's up, how are you?", + "start_time": 0, + "end_time": 1.6137868480725623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm splendid. How about yourself?", + "original_text": "I'm splendid. How about yourself?", + "start_time": 1.9852027279084825, + "end_time": 4.2027083968427235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_1_B.wav", + "silence_duration": 0.3714158798359201, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Could be better.", + "original_text": "Could be better.", + "start_time": 4.742794526641559, + "end_time": 5.718032621879654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_2_A.wav", + "silence_duration": 0.5400861297988349, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "So, have you been on the bus very", + "original_text": "So, have you been on the bus very [interrupt] long today or did you just hop on recently? I'm curious because the traffic seems lighter than usual this morning.", + "start_time": 6.083513925245599, + "end_time": 13.560339322070996, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_3_B.wav", + "silence_duration": 0.36548130336594503, + "is_interrupted": true, + "text_after_interrupt": "long today or did you just hop on recently? I'm curious because the traffic seems lighter than usual this morning." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but I was just curious, how often do you ride the bus?", + "original_text": "Sorry to cut in, but I was just curious, how often do you ride the bus?", + "start_time": 8.242969707558524, + "end_time": 13.281699866288683, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_4_A.wav", + "silence_duration": 0.48153722890932105, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I usually just drive.", + "original_text": "I usually just drive.", + "start_time": 14.00314108408638, + "end_time": 15.222188703133998, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_5_B.wav", + "silence_duration": 0.4428017620153835, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You have your own vehicle?", + "original_text": "You have your own vehicle?", + "start_time": 15.709176533078395, + "end_time": 17.06754388001717, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_6_A.wav", + "silence_duration": 0.4869878299443975, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I have my own car.", + "original_text": "Yes, I have my own car.", + "start_time": 17.50918470174238, + "end_time": 19.006871776572314, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_7_B.wav", + "silence_duration": 0.44164082172521035, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So then, why don't you", + "original_text": "So then, why don't you [interrupt] drive today instead of taking the bus? Is there a particular reason or are you just trying something different for a change?", + "start_time": 19.516846316385887, + "end_time": 27.73671026196412, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_8_A.wav", + "silence_duration": 0.5099745398135744, + "is_interrupted": true, + "text_after_interrupt": "drive today instead of taking the bus? Is there a particular reason or are you just trying something different for a change?" + }, + { + "speaker": "B", + "text": "Oh, before I forget, you mentioned earlier about how long I've been on the bus. I got on about fifteen minutes ago. And as for why I'm not driving, I'm waiting for our President to lower the gas prices.", + "original_text": "Oh, before I forget, you mentioned earlier about how long I've been on the bus. I got on about fifteen minutes ago. And as for why I'm not driving, I'm waiting for our President to lower the gas prices.", + "start_time": 26.477144073991692, + "end_time": 36.56621436877627, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_9_B.wav", + "silence_duration": 0.38818621471809545, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Smart.", + "original_text": "Smart.", + "start_time": 37.15337198279955, + "end_time": 37.908020508876646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--170/temp/line_10_A.wav", + "silence_duration": 0.5871576140232777, + "is_interrupted": false + } + ] + }, + "DialogSum--val--172": { + "original_text": "A: Welcome back, Sir. I trust the materials were helpful to you? \nB: Indeed. I've decided to go for the Petty Consumer Loan. That is, if my credit rating is [interrupt] acceptable for the loan terms and meets all the necessary requirements for approval without any additional conditions or special approvals. \nA: Sorry to jump in, but your credit is fine, Sir. Now, tell me, what is it that you need the loan for? \nB: I've just bought a second-hand apartment and I'm looking to do some renovations. You know, a bit of decorating, some new furniture, nothing flashy. \nA: I see. And what loan amount are you expecting? \nB: It says here that the maximum is 20,000 RMB. Is that the limit for all types of renovations, or can it be adjusted based on specific needs? \nA: Is that enough for the renovations you have in mind? \nB: Well, 20,000 RMB, it'll have to be then. \nA: I need some documentation from you. Such as your resident permit, your occupation and salary details and—oh, I already have your credit details here. \nB: Everything is right here. If that's all in order, just let me know where I sign.", + "cleaned_text": "A: Welcome back, Sir. I trust the materials were helpful to you? \nB:Indeed. I've decided to go for the Petty Consumer Loan. That is, if my credit rating is acceptable for the loan terms and meets all the necessary requirements for approval without any additional conditions or special approvals.\nA: Sorry to jump in, but your credit is fine, Sir. Now, tell me, what is it that you need the loan for? \nB: I've just bought a second-hand apartment and I'm looking to do some renovations. You know, a bit of decorating, some new furniture, nothing flashy. \nA: I see. And what loan amount are you expecting? \nB: It says here that the maximum is 20,000 RMB. Is that the limit for all types of renovations, or can it be adjusted based on specific needs? \nA: Is that enough for the renovations you have in mind? \nB: Well, 20,000 RMB, it'll have to be then. \nA: I need some documentation from you. Such as your resident permit, your occupation and salary details and—oh, I already have your credit details here. \nB: Everything is right here. If that's all in order, just let me know where I sign.", + "total_duration": 56.89170068027211, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Welcome back, Sir. I trust the materials were helpful to you?", + "original_text": "Welcome back, Sir. I trust the materials were helpful to you?", + "start_time": 0, + "end_time": 3.6687528344671203, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Indeed. I've decided to go for the Petty Consumer Loan. That is, if my credit rating is", + "original_text": "Indeed. I've decided to go for the Petty Consumer Loan. That is, if my credit rating is [interrupt] acceptable for the loan terms and meets all the necessary requirements for approval without any additional conditions or special approvals.", + "start_time": 4.116638714029979, + "end_time": 15.993645516751066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_1_B.wav", + "silence_duration": 0.4478858795628592, + "is_interrupted": true, + "text_after_interrupt": "acceptable for the loan terms and meets all the necessary requirements for approval without any additional conditions or special approvals." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but your credit is fine, Sir. Now, tell me, what is it that you need the loan for?", + "original_text": "Sorry to jump in, but your credit is fine, Sir. Now, tell me, what is it that you need the loan for?", + "start_time": 8.888339394302088, + "end_time": 15.08806728545855, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_2_A.wav", + "silence_duration": 0.4094136452744367, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've just bought a second-hand apartment and I'm looking to do some renovations. You know, a bit of decorating, some new furniture, nothing flashy.", + "original_text": "I've just bought a second-hand apartment and I'm looking to do some renovations. You know, a bit of decorating, some new furniture, nothing flashy.", + "start_time": 16.425714144198096, + "end_time": 23.43814044805297, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_3_B.wav", + "silence_duration": 0.4320686274470301, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I see. And what loan amount are you expecting?", + "original_text": "I see. And what loan amount are you expecting?", + "start_time": 23.884105694498516, + "end_time": 27.26260909585906, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_4_A.wav", + "silence_duration": 0.44596524644554425, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It says here that the maximum is 20,000 RMB. Is that the limit for all types of renovations, or can it be adjusted based on specific needs?", + "original_text": "It says here that the maximum is 20,000 RMB. Is that the limit for all types of renovations, or can it be adjusted based on specific needs?", + "start_time": 27.67390521376577, + "end_time": 36.2072385470991, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_5_B.wav", + "silence_duration": 0.4112961179067125, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is that enough for the renovations you have in mind?", + "original_text": "Is that enough for the renovations you have in mind?", + "start_time": 36.66768845974287, + "end_time": 39.30315331235058, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_6_A.wav", + "silence_duration": 0.46044991264376645, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, 20,000 RMB, it'll have to be then.", + "original_text": "Well, 20,000 RMB, it'll have to be then.", + "start_time": 39.83498712115277, + "end_time": 42.865191202785425, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_7_B.wav", + "silence_duration": 0.5318338088021871, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I need some documentation from you. Such as your resident permit, your occupation and salary details and—oh, I already have your credit details here.", + "original_text": "I need some documentation from you. Such as your resident permit, your occupation and salary details and—oh, I already have your credit details here.", + "start_time": 43.171164072063334, + "end_time": 52.50558584077082, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_8_A.wav", + "silence_duration": 0.3059728692779115, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Everything is right here. If that's all in order, just let me know where I sign.", + "original_text": "Everything is right here. If that's all in order, just let me know where I sign.", + "start_time": 53.095282054800975, + "end_time": 56.89174463983499, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--172/temp/line_9_B.wav", + "silence_duration": 0.5896962140301565, + "is_interrupted": false + } + ] + }, + "DialogSum--val--176": { + "original_text": "A: How do you think a manager should react to an employee's unsatisfactory work?\nB: If I were a manager, I would have a private talk with this employee to figure out the reasons. It is very important to have this one-to-one discussion in an unthreatening situation without any [interrupt] distractions or interruptions so the employee feels comfortable opening up about their challenges and concerns while receiving constructive feedback in a supportive environment.\nA: Sorry to jump in, but do you think it's better to address the issue immediately, or should the manager wait for a more appropriate time?\nB: It depends on the situation, but generally, waiting for a more appropriate time is better. However, I was going to say that it's also crucial to avoid any distractions during the conversation. Speaking of which, I overheard a manager scold his employee in the elevator this morning, they were from the company on the 12th floor, I guess. They were only three of us in the elevator, I felt very embarrassed to be in the middle of such a tense and uncomfortable situation.\nA: You were in the elevator with them? That must have been awkward. But did you notice how the employee reacted? I wonder if they tried to defend themselves or just stayed silent.\nB: The employee looked really uncomfortable and didn't say much. But I was going to mention that they were only three of us in the elevator, and I felt really embarrassed to be in the middle of them. Anyway, it's not wise to give a harsh time to your employee in front of others, especially strangers.", + "cleaned_text": "A: How do you think a manager should react to an employee's unsatisfactory work?\nB:If I were a manager, I would have a private talk with this employee to figure out the reasons. It is very important to have this one-to-one discussion in an unthreatening situation without any distractions or interruptions so the employee feels comfortable opening up about their challenges and concerns while receiving constructive feedback in a supportive environment.\nA: Sorry to jump in, but do you think it's better to address the issue immediately, or should the manager wait for a more appropriate time?\nB: It depends on the situation, but generally, waiting for a more appropriate time is better. However, I was going to say that it's also crucial to avoid any distractions during the conversation. Speaking of which, I overheard a manager scold his employee in the elevator this morning, they were from the company on the 12th floor, I guess. They were only three of us in the elevator, I felt very embarrassed to be in the middle of such a tense and uncomfortable situation.\nA: You were in the elevator with them? That must have been awkward. But did you notice how the employee reacted? I wonder if they tried to defend themselves or just stayed silent.\nB: The employee looked really uncomfortable and didn't say much. But I was going to mention that they were only three of us in the elevator, and I felt really embarrassed to be in the middle of them. Anyway, it's not wise to give a harsh time to your employee in front of others, especially strangers.", + "total_duration": 71.68040816326531, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How do you think a manager should react to an employee's unsatisfactory work?", + "original_text": "How do you think a manager should react to an employee's unsatisfactory work?", + "start_time": 0, + "end_time": 4.017052154195011, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If I were a manager, I would have a private talk with this employee to figure out the reasons. It is very important to have this one-to-one discussion in an unthreatening situation without any", + "original_text": "If I were a manager, I would have a private talk with this employee to figure out the reasons. It is very important to have this one-to-one discussion in an unthreatening situation without any [interrupt] distractions or interruptions so the employee feels comfortable opening up about their challenges and concerns while receiving constructive feedback in a supportive environment.", + "start_time": 4.468226246608792, + "end_time": 23.160289738672283, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/temp/line_1_B.wav", + "silence_duration": 0.4511740924137803, + "is_interrupted": true, + "text_after_interrupt": "distractions or interruptions so the employee feels comfortable opening up about their challenges and concerns while receiving constructive feedback in a supportive environment." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but do you think it's better to address the issue immediately, or should the manager wait for a more appropriate time?", + "original_text": "Sorry to jump in, but do you think it's better to address the issue immediately, or should the manager wait for a more appropriate time?", + "start_time": 13.86069790193759, + "end_time": 21.99929200624598, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/temp/line_2_A.wav", + "silence_duration": 0.5577478681613512, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It depends on the situation, but generally, waiting for a more appropriate time is better. However, I was going to say that it's also crucial to avoid any distractions during the conversation. Speaking of which, I overheard a manager scold his employee in the elevator this morning, they were from the company on the 12th floor, I guess. They were only three of us in the elevator, I felt very embarrassed to be in the middle of such a tense and uncomfortable situation.", + "original_text": "It depends on the situation, but generally, waiting for a more appropriate time is better. However, I was going to say that it's also crucial to avoid any distractions during the conversation. Speaking of which, I overheard a manager scold his employee in the elevator this morning, they were from the company on the 12th floor, I guess. They were only three of us in the elevator, I felt very embarrassed to be in the middle of such a tense and uncomfortable situation.", + "start_time": 23.73288506627354, + "end_time": 46.53488053112615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/temp/line_3_B.wav", + "silence_duration": 0.5725953276012576, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You were in the elevator with them? That must have been awkward. But did you notice how the employee reacted? I wonder if they tried to defend themselves or just stayed silent.", + "original_text": "You were in the elevator with them? That must have been awkward. But did you notice how the employee reacted? I wonder if they tried to defend themselves or just stayed silent.", + "start_time": 46.98892455253087, + "end_time": 57.50756400831318, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/temp/line_4_A.wav", + "silence_duration": 0.45404402140472144, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The employee looked really uncomfortable and didn't say much. But I was going to mention that they were only three of us in the elevator, and I felt really embarrassed to be in the middle of them. Anyway, it's not wise to give a harsh time to your employee in front of others, especially strangers.", + "original_text": "The employee looked really uncomfortable and didn't say much. But I was going to mention that they were only three of us in the elevator, and I felt really embarrassed to be in the middle of them. Anyway, it's not wise to give a harsh time to your employee in front of others, especially strangers.", + "start_time": 57.864541820313306, + "end_time": 71.68041483618632, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--176/temp/line_5_B.wav", + "silence_duration": 0.35697781200012596, + "is_interrupted": false + } + ] + }, + "DialogSum--val--177": { + "original_text": "A: Hello. Do you know how I can find a room to rent? \nB: There is so much information and I advise to read [interrupt] online listings regularly because they are updated more frequently than traditional sources and often include detailed descriptions, photos, and sometimes even virtual tours of available properties. \nA: Sorry, but do you mean online newspapers or printed ones? \nB: Actually, both can be useful. If you like the room, call the landlord and confirm the information of the room. By the way, I was going to say newspapers are just one option. You might also want to check online listings or local community boards.", + "cleaned_text": "A: Hello. Do you know how I can find a room to rent? \nB:There is so much information and I advise to read online listings regularly because they are updated more frequently than traditional sources and often include detailed descriptions, photos, and sometimes even virtual tours of available properties.\nA: Sorry, but do you mean online newspapers or printed ones? \nB: Actually, both can be useful. If you like the room, call the landlord and confirm the information of the room. By the way, I was going to say newspapers are just one option. You might also want to check online listings or local community boards.", + "total_duration": 29.926575963718822, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--177/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--177/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--177/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello. Do you know how I can find a room to rent?", + "original_text": "Hello. Do you know how I can find a room to rent?", + "start_time": 0, + "end_time": 3.1579138321995464, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--177/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There is so much information and I advise to read", + "original_text": "There is so much information and I advise to read [interrupt] online listings regularly because they are updated more frequently than traditional sources and often include detailed descriptions, photos, and sometimes even virtual tours of available properties.", + "start_time": 3.754448626019334, + "end_time": 16.73440327454541, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--177/temp/line_1_B.wav", + "silence_duration": 0.5965347938197878, + "is_interrupted": true, + "text_after_interrupt": "online listings regularly because they are updated more frequently than traditional sources and often include detailed descriptions, photos, and sometimes even virtual tours of available properties." + }, + { + "speaker": "A", + "text": "Sorry, but do you mean online newspapers or printed ones?", + "original_text": "Sorry, but do you mean online newspapers or printed ones?", + "start_time": 6.447963365248359, + "end_time": 10.557895338037476, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--177/temp/line_2_A.wav", + "silence_duration": 0.42201777353398984, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Actually, both can be useful. If you like the room, call the landlord and confirm the information of the room. By the way, I was going to say newspapers are just one option. You might also want to check online listings or local community boards.", + "original_text": "Actually, both can be useful. If you like the room, call the landlord and confirm the information of the room. By the way, I was going to say newspapers are just one option. You might also want to check online listings or local community boards.", + "start_time": 17.213669683321587, + "end_time": 29.926594853389616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--177/temp/line_3_B.wav", + "silence_duration": 0.479266408776177, + "is_interrupted": false + } + ] + }, + "DialogSum--val--178": { + "original_text": "A: I'd like two tickets for the movie on Friday, please. \nB: For which movie, madam? \nA: Oh, that's right. Dark and Stormy [interrupt] at 7 PM, if that's possible. I've heard great reviews about its cinematography and the lead actor's performance is supposed to be outstanding. \nB: I'm sorry to interrupt, but I just checked, and the Friday show might already be sold out. Could you consider another day? \nA: Oh, really? Well, how about Saturday or Sunday? \nB: Yes madam, we do have tickets available for that movie on those days. \nA: Are there any seats left for the middle row for Saturday? \nB: Yes, but they are not next to each other. \nA: Oh, that's a pity. We prefer to sit together. \nB: In that case, we still have some seats together in the front or at the back. \nA: The front row sounds good. How much are the [interrupt] tickets for the front row including any additional fees or charges that might apply to premium seating? \nB: Sorry, before we proceed, I just realized I didn't confirm the price for the front row. Let me check that for you. \nA: Sure, please do. \nB: Alright, it's 25 dollars in total.", + "cleaned_text": "A: I'd like two tickets for the movie on Friday, please. \nB: For which movie, madam? \nA:Oh, that's right. Dark and Stormy at 7 PM, if that's possible. I've heard great reviews about its cinematography and the lead actor's performance is supposed to be outstanding.\nB: I'm sorry to interrupt, but I just checked, and the Friday show might already be sold out. Could you consider another day? \nA: Oh, really? Well, how about Saturday or Sunday? \nB: Yes madam, we do have tickets available for that movie on those days. \nA: Are there any seats left for the middle row for Saturday? \nB: Yes, but they are not next to each other. \nA: Oh, that's a pity. We prefer to sit together. \nB: In that case, we still have some seats together in the front or at the back. \nA:The front row sounds good. How much are the tickets for the front row including any additional fees or charges that might apply to premium seating?\nB: Sorry, before we proceed, I just realized I didn't confirm the price for the front row. Let me check that for you. \nA: Sure, please do. \nB: Alright, it's 25 dollars in total.", + "total_duration": 57.78702947845805, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'd like two tickets for the movie on Friday, please.", + "original_text": "I'd like two tickets for the movie on Friday, please.", + "start_time": 0, + "end_time": 2.8328344671201813, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "For which movie, madam?", + "original_text": "For which movie, madam?", + "start_time": 3.2823597353560965, + "end_time": 4.478187399755189, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_1_B.wav", + "silence_duration": 0.449525268235915, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that's right. Dark and Stormy", + "original_text": "Oh, that's right. Dark and Stormy [interrupt] at 7 PM, if that's possible. I've heard great reviews about its cinematography and the lead actor's performance is supposed to be outstanding.", + "start_time": 5.0692527365159235, + "end_time": 16.040681307944496, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_2_A.wav", + "silence_duration": 0.591065336760734, + "is_interrupted": true, + "text_after_interrupt": "at 7 PM, if that's possible. I've heard great reviews about its cinematography and the lead actor's performance is supposed to be outstanding." + }, + { + "speaker": "B", + "text": "I'm sorry to interrupt, but I just checked, and the Friday show might already be sold out. Could you consider another day?", + "original_text": "I'm sorry to interrupt, but I just checked, and the Friday show might already be sold out. Could you consider another day?", + "start_time": 6.9268491083980095, + "end_time": 13.556146160552204, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_3_B.wav", + "silence_duration": 0.3320468029587545, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, really? Well, how about Saturday or Sunday?", + "original_text": "Oh, really? Well, how about Saturday or Sunday?", + "start_time": 16.342393226691073, + "end_time": 19.58157690016046, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_4_A.wav", + "silence_duration": 0.301711918746577, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes madam, we do have tickets available for that movie on those days.", + "original_text": "Yes madam, we do have tickets available for that movie on those days.", + "start_time": 19.99020445776373, + "end_time": 23.600907405609536, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_5_B.wav", + "silence_duration": 0.4086275576032712, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are there any seats left for the middle row for Saturday?", + "original_text": "Are there any seats left for the middle row for Saturday?", + "start_time": 23.942893205985374, + "end_time": 26.694457831835713, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_6_A.wav", + "silence_duration": 0.3419858003758378, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, but they are not next to each other.", + "original_text": "Yes, but they are not next to each other.", + "start_time": 27.026435951903306, + "end_time": 29.023352051676547, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_7_B.wav", + "silence_duration": 0.33197812006759114, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that's a pity. We prefer to sit together.", + "original_text": "Oh, that's a pity. We prefer to sit together.", + "start_time": 29.33098056553596, + "end_time": 32.12898510068335, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_8_A.wav", + "silence_duration": 0.3076285138594125, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "In that case, we still have some seats together in the front or at the back.", + "original_text": "In that case, we still have some seats together in the front or at the back.", + "start_time": 32.657342369931726, + "end_time": 36.256435340453265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_9_B.wav", + "silence_duration": 0.5283572692483761, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The front row sounds good. How much are the", + "original_text": "The front row sounds good. How much are the [interrupt] tickets for the front row including any additional fees or charges that might apply to premium seating?", + "start_time": 36.56563293512383, + "end_time": 45.296335882969636, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_10_A.wav", + "silence_duration": 0.30919759467056174, + "is_interrupted": true, + "text_after_interrupt": "tickets for the front row including any additional fees or charges that might apply to premium seating?" + }, + { + "speaker": "B", + "text": "Sorry, before we proceed, I just realized I didn't confirm the price for the front row. Let me check that for you.", + "original_text": "Sorry, before we proceed, I just realized I didn't confirm the price for the front row. Let me check that for you.", + "start_time": 47.6582340318954, + "end_time": 53.42839276205413, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_11_B.wav", + "silence_duration": 0.3569153150299154, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, please do.", + "original_text": "Sure, please do.", + "start_time": 54.00637753158, + "end_time": 55.12093535470925, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_12_A.wav", + "silence_duration": 0.5779847695258697, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Alright, it's 25 dollars in total.", + "original_text": "Alright, it's 25 dollars in total.", + "start_time": 55.62758755606937, + "end_time": 57.7870433383823, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--178/temp/line_13_B.wav", + "silence_duration": 0.5066522013601173, + "is_interrupted": false + } + ] + }, + "DialogSum--val--179": { + "original_text": "A: Hi, there! Did you have any questions about our bikes? \nB: Yeah. Do you work on bicycles in addition to selling them? \nA: Oh, yes, we can handle any repairs you may [interrupt] need, from basic tune-ups to more complex fixes like drivetrain replacements, brake system overhauls, or even full frame alignments if necessary. \nB: Sorry to jump in, but what I need is not exactly a repair. My cousin gave me a road bike, but I'm not tall enough to ride it. Can you put smaller wheels on it? \nA: We could do that, but I wouldn't recommend it, because you would have to use your legs more to go the same distance. You'd be better off buying a bike that's the right size for you. \nB: I was afraid you'd say that. You see, my cousin's bike is a very expensive model. It's a really nice [interrupt] bike with premium carbon fiber components and top-tier Shimano gears, and I was hoping to make it work somehow despite the size mismatch. \nA: Have you considered trading the bike in? We do buy and sell used bikes, and I can give you a fair price for any trade-in. \nB: Really? That would be great! How much can you give me for the bike? \nA: If it's in good shape, probably at least 50% of its original value. By the way, you mentioned earlier that the bike is a really nice model. What brand or model is it? \nB: Oh, it's a Trek Domane. It's almost brand new, which is why I was hesitant to part with it. \nA: That's a great bike! Bring it in tomorrow, and we can take a closer look to give you an accurate trade-in value. \nB: Terrific! If you're here tomorrow, I'll bring it in then.", + "cleaned_text": "A: Hi, there! Did you have any questions about our bikes? \nB: Yeah. Do you work on bicycles in addition to selling them? \nA:Oh, yes, we can handle any repairs you may need, from basic tune-ups to more complex fixes like drivetrain replacements, brake system overhauls, or even full frame alignments if necessary.\nB: Sorry to jump in, but what I need is not exactly a repair. My cousin gave me a road bike, but I'm not tall enough to ride it. Can you put smaller wheels on it? \nA: We could do that, but I wouldn't recommend it, because you would have to use your legs more to go the same distance. You'd be better off buying a bike that's the right size for you. \nB:I was afraid you'd say that. You see, my cousin's bike is a very expensive model. It's a really nice bike with premium carbon fiber components and top-tier Shimano gears, and I was hoping to make it work somehow despite the size mismatch.\nA: Have you considered trading the bike in? We do buy and sell used bikes, and I can give you a fair price for any trade-in. \nB: Really? That would be great! How much can you give me for the bike? \nA: If it's in good shape, probably at least 50% of its original value. By the way, you mentioned earlier that the bike is a really nice model. What brand or model is it? \nB: Oh, it's a Trek Domane. It's almost brand new, which is why I was hesitant to part with it. \nA: That's a great bike! Bring it in tomorrow, and we can take a closer look to give you an accurate trade-in value. \nB: Terrific! If you're here tomorrow, I'll bring it in then.", + "total_duration": 83.77650793650794, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, there! Did you have any questions about our bikes?", + "original_text": "Hi, there! Did you have any questions about our bikes?", + "start_time": 0, + "end_time": 3.6919727891156464, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah. Do you work on bicycles in addition to selling them?", + "original_text": "Yeah. Do you work on bicycles in addition to selling them?", + "start_time": 4.035101478008145, + "end_time": 7.134965423586376, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_1_B.wav", + "silence_duration": 0.3431286888924989, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, yes, we can handle any repairs you may", + "original_text": "Oh, yes, we can handle any repairs you may [interrupt] need, from basic tune-ups to more complex fixes like drivetrain replacements, brake system overhauls, or even full frame alignments if necessary.", + "start_time": 7.589727304059602, + "end_time": 19.559613925374794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_2_A.wav", + "silence_duration": 0.4547618804732261, + "is_interrupted": true, + "text_after_interrupt": "need, from basic tune-ups to more complex fixes like drivetrain replacements, brake system overhauls, or even full frame alignments if necessary." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but what I need is not exactly a repair. My cousin gave me a road bike, but I'm not tall enough to ride it. Can you put smaller wheels on it?", + "original_text": "Sorry to jump in, but what I need is not exactly a repair. My cousin gave me a road bike, but I'm not tall enough to ride it. Can you put smaller wheels on it?", + "start_time": 10.167142270045996, + "end_time": 18.561155875488176, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_3_B.wav", + "silence_duration": 0.3118713883649353, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We could do that, but I wouldn't recommend it, because you would have to use your legs more to go the same distance. You'd be better off buying a bike that's the right size for you.", + "original_text": "We could do that, but I wouldn't recommend it, because you would have to use your legs more to go the same distance. You'd be better off buying a bike that's the right size for you.", + "start_time": 20.063314886906795, + "end_time": 30.28009493225827, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_4_A.wav", + "silence_duration": 0.5037009615320005, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was afraid you'd say that. You see, my cousin's bike is a very expensive model. It's a really nice", + "original_text": "I was afraid you'd say that. You see, my cousin's bike is a very expensive model. It's a really nice [interrupt] bike with premium carbon fiber components and top-tier Shimano gears, and I was hoping to make it work somehow despite the size mismatch.", + "start_time": 30.80636176130521, + "end_time": 44.2855454347746, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_5_B.wav", + "silence_duration": 0.5262668290469421, + "is_interrupted": true, + "text_after_interrupt": "bike with premium carbon fiber components and top-tier Shimano gears, and I was hoping to make it work somehow despite the size mismatch." + }, + { + "speaker": "A", + "text": "Have you considered trading the bike in? We do buy and sell used bikes, and I can give you a fair price for any trade-in.", + "original_text": "Have you considered trading the bike in? We do buy and sell used bikes, and I can give you a fair price for any trade-in.", + "start_time": 44.773195082726275, + "end_time": 52.691199617873664, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_6_A.wav", + "silence_duration": 0.5898487751712957, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Really? That would be great! How much can you give me for the bike?", + "original_text": "Really? That would be great! How much can you give me for the bike?", + "start_time": 53.095766736000165, + "end_time": 56.532320023982024, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_7_B.wav", + "silence_duration": 0.40456711812650403, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "If it's in good shape, probably at least 50% of its original value. By the way, you mentioned earlier that the bike is a really nice model. What brand or model is it?", + "original_text": "If it's in good shape, probably at least 50% of its original value. By the way, you mentioned earlier that the bike is a really nice model. What brand or model is it?", + "start_time": 56.94741426356047, + "end_time": 67.36156392342441, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_8_A.wav", + "silence_duration": 0.41509423957844355, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, it's a Trek Domane. It's almost brand new, which is why I was hesitant to part with it.", + "original_text": "Oh, it's a Trek Domane. It's almost brand new, which is why I was hesitant to part with it.", + "start_time": 67.8328769837502, + "end_time": 72.546527777401, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_9_B.wav", + "silence_duration": 0.4713130603257787, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a great bike! Bring it in tomorrow, and we can take a closer look to give you an accurate trade-in value.", + "original_text": "That's a great bike! Bring it in tomorrow, and we can take a closer look to give you an accurate trade-in value.", + "start_time": 73.14361946366272, + "end_time": 80.37663533667859, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_10_A.wav", + "silence_duration": 0.5970916862617188, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Terrific! If you're here tomorrow, I'll bring it in then.", + "original_text": "Terrific! If you're here tomorrow, I'll bring it in then.", + "start_time": 80.82761655264795, + "end_time": 83.77655079301077, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--179/temp/line_11_B.wav", + "silence_duration": 0.4509812159693591, + "is_interrupted": false + } + ] + }, + "DialogSum--val--180": { + "original_text": "A: Help me decide on which type of hotel room to book.\nB: I want the one with a bed.\nA: Very funny. We have a choice of different views, and each one is a different price. For instance, a room with a city view is 175 a night.\nB: 175 a night?! That's highway robbery!\nA: If you think that's too steep, there are a few other options. We can get a courtyard room with no view for 120 a night or a room with an obstructed or peek-a-boo ocean views for 130 [interrupt] a night, but it may not be worth it if you really want a clear view since the obstruction could be quite significant depending on the building's layout and position.\nB: Wait, did you say \"peek-a-boo\" ocean view? What does that even mean?\nA: It means you can see the ocean, but the view is partially blocked by something, like another building. Anyway, as I was saying, the peek-a-boo ocean view is 130 a night.\nB: I don't really care which type of room we get as long as we don't end up with a room on the ground floor. I don't like having people walking back and forth outside my window all night.\nA: Okay, I can request a room on an upper floor. You really don't have a preference?\nB: No, not really.\nA: There is a penthouse room for 400 a night.\nB: What?! For that price, I'd better get a view of the Eiffel Tower, the Parthenon, and the Great Wall of [interrupt] China all at once! That's just too much, especially considering we're only staying for a couple of nights and won't even be in the room that often.\nA: China, yes, I get it. But seriously, are you sure you don't want to reconsider the city view option? It's not as expensive as the penthouse, and it might be worth the extra cost for a better experience.\nB: Hmm, you might be right. But wait, you mentioned something about an obstructed view earlier—can you explain that again?", + "cleaned_text": "A: Help me decide on which type of hotel room to book.\nB: I want the one with a bed.\nA: Very funny. We have a choice of different views, and each one is a different price. For instance, a room with a city view is 175 a night.\nB: 175 a night?! That's highway robbery!\nA:If you think that's too steep, there are a few other options. We can get a courtyard room with no view for 120 a night or a room with an obstructed or peek-a-boo ocean views for 130 a night, but it may not be worth it if you really want a clear view since the obstruction could be quite significant depending on the building's layout and position.\nB: Wait, did you say \"peek-a-boo\" ocean view? What does that even mean?\nA: It means you can see the ocean, but the view is partially blocked by something, like another building. Anyway, as I was saying, the peek-a-boo ocean view is 130 a night.\nB: I don't really care which type of room we get as long as we don't end up with a room on the ground floor. I don't like having people walking back and forth outside my window all night.\nA: Okay, I can request a room on an upper floor. You really don't have a preference?\nB: No, not really.\nA: There is a penthouse room for 400 a night.\nB:What?! For that price, I'd better get a view of the Eiffel Tower, the Parthenon, and the Great Wall of China all at once! That's just too much, especially considering we're only staying for a couple of nights and won't even be in the room that often.\nA: China, yes, I get it. But seriously, are you sure you don't want to reconsider the city view option? It's not as expensive as the penthouse, and it might be worth the extra cost for a better experience.\nB: Hmm, you might be right. But wait, you mentioned something about an obstructed view earlier—can you explain that again?", + "total_duration": 104.03233560090703, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Help me decide on which type of hotel room to book.", + "original_text": "Help me decide on which type of hotel room to book.", + "start_time": 0, + "end_time": 2.995374149659864, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I want the one with a bed.", + "original_text": "I want the one with a bed.", + "start_time": 3.2991975586719344, + "end_time": 4.634344950962184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_1_B.wav", + "silence_duration": 0.3038234090120703, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Very funny. We have a choice of different views, and each one is a different price. For instance, a room with a city view is 175 a night.", + "original_text": "Very funny. We have a choice of different views, and each one is a different price. For instance, a room with a city view is 175 a night.", + "start_time": 5.101713606600419, + "end_time": 14.77282471771153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_2_A.wav", + "silence_duration": 0.4673686556382345, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "175 a night?! That's highway robbery!", + "original_text": "175 a night?! That's highway robbery!", + "start_time": 15.34238509136666, + "end_time": 18.39580912764784, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_3_B.wav", + "silence_duration": 0.5695603736551313, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "If you think that's too steep, there are a few other options. We can get a courtyard room with no view for 120 a night or a room with an obstructed or peek-a-boo ocean views for 130", + "original_text": "If you think that's too steep, there are a few other options. We can get a courtyard room with no view for 120 a night or a room with an obstructed or peek-a-boo ocean views for 130 [interrupt] a night, but it may not be worth it if you really want a clear view since the obstruction could be quite significant depending on the building's layout and position.", + "start_time": 18.752236831119905, + "end_time": 40.207474926358, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_4_A.wav", + "silence_duration": 0.3564277034720654, + "is_interrupted": true, + "text_after_interrupt": "a night, but it may not be worth it if you really want a clear view since the obstruction could be quite significant depending on the building's layout and position." + }, + { + "speaker": "B", + "text": "Wait, did you say \"peek-a-boo\" ocean view? What does that even mean?", + "original_text": "Wait, did you say \"peek-a-boo\" ocean view? What does that even mean?", + "start_time": 31.244572432026935, + "end_time": 36.65482186513351, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_5_B.wav", + "silence_duration": 0.503378876478118, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It means you can see the ocean, but the view is partially blocked by something, like another building. Anyway, as I was saying, the peek-a-boo ocean view is 130 a night.", + "original_text": "It means you can see the ocean, but the view is partially blocked by something, like another building. Anyway, as I was saying, the peek-a-boo ocean view is 130 a night.", + "start_time": 40.749611680327554, + "end_time": 51.82553004767449, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_6_A.wav", + "silence_duration": 0.5421367539695539, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't really care which type of room we get as long as we don't end up with a room on the ground floor. I don't like having people walking back and forth outside my window all night.", + "original_text": "I don't really care which type of room we get as long as we don't end up with a room on the ground floor. I don't like having people walking back and forth outside my window all night.", + "start_time": 52.17654128445012, + "end_time": 60.45445511664966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_7_B.wav", + "silence_duration": 0.3510112367756295, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Okay, I can request a room on an upper floor. You really don't have a preference?", + "original_text": "Okay, I can request a room on an upper floor. You really don't have a preference?", + "start_time": 60.816382354543684, + "end_time": 66.41239142483848, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_8_A.wav", + "silence_duration": 0.36192723789402553, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, not really.", + "original_text": "No, not really.", + "start_time": 66.98046956479008, + "end_time": 68.15307727454065, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_9_B.wav", + "silence_duration": 0.5680781399516032, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There is a penthouse room for 400 a night.", + "original_text": "There is a penthouse room for 400 a night.", + "start_time": 68.57666605012572, + "end_time": 71.29340074400328, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_10_A.wav", + "silence_duration": 0.4235887755850684, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What?! For that price, I'd better get a view of the Eiffel Tower, the Parthenon, and the Great Wall of", + "original_text": "What?! For that price, I'd better get a view of the Eiffel Tower, the Parthenon, and the Great Wall of [interrupt] China all at once! That's just too much, especially considering we're only staying for a couple of nights and won't even be in the room that often.", + "start_time": 71.67312259653545, + "end_time": 83.22505003417717, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_11_B.wav", + "silence_duration": 0.37972185253216945, + "is_interrupted": true, + "text_after_interrupt": "China all at once! That's just too much, especially considering we're only staying for a couple of nights and won't even be in the room that often." + }, + { + "speaker": "A", + "text": "China, yes, I get it. But seriously, are you sure you don't want to reconsider the city view option? It's not as expensive as the penthouse, and it might be worth the extra cost for a better experience.", + "original_text": "China, yes, I get it. But seriously, are you sure you don't want to reconsider the city view option? It's not as expensive as the penthouse, and it might be worth the extra cost for a better experience.", + "start_time": 82.98325123558111, + "end_time": 97.15903354850627, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_12_A.wav", + "silence_duration": 0.5948340574013256, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hmm, you might be right. But wait, you mentioned something about an obstructed view earlier—can you explain that again?", + "original_text": "Hmm, you might be right. But wait, you mentioned something about an obstructed view earlier—can you explain that again?", + "start_time": 97.46112507622351, + "end_time": 104.03237224175639, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--180/temp/line_13_B.wav", + "silence_duration": 0.3020915277172377, + "is_interrupted": false + } + ] + }, + "DialogSum--val--181": { + "original_text": "A: Holiday Travel! What can I do for you? \nB: Hello! I'd like to book a flight to Berlin for the 23rd this month. \nA: OK. Let me see what's available. And when will you be [interrupt] departing from? I need to know your origin city to check all possible connections and find you the best possible deal with the most convenient layovers. \nB: Oh, sorry, I forgot to mention, I need the cheapest seat possible. \nA: No problem. And when will you be returning? \nB: Er, well, I'd like to catch a return flight on the 29th. \nA: OK, let me see. Hmm... the ticket price is much lower if you leave one day earlier. \nB: I see. How much is it for one day earlier? \nA: It's only 980 dollars. \nB: All right. Then I'll take that flight. \nA: OK. That's flight BA 7101, from Salt Lake City to New York Kennedy Airport. Then Flight BA 2701 from Kennedy Airport to Berlin. The first flight leaves Salt Lake City at 10:00 am, and arrives in New York at 4:15 pm. Then the 2nd flight leaves Kennedy Airport at 5:45 pm. You'll arrive in Berlin at 8:30 am the next day. \nB: All right. Thanks. Oh, wait, did you mention the return flight details? \nA: Oh, I haven't yet. Let me check that for you.", + "cleaned_text": "A: Holiday Travel! What can I do for you? \nB: Hello! I'd like to book a flight to Berlin for the 23rd this month. \nA:OK. Let me see what's available. And when will you be departing from? I need to know your origin city to check all possible connections and find you the best possible deal with the most convenient layovers.\nB: Oh, sorry, I forgot to mention, I need the cheapest seat possible. \nA: No problem. And when will you be returning? \nB: Er, well, I'd like to catch a return flight on the 29th. \nA: OK, let me see. Hmm... the ticket price is much lower if you leave one day earlier. \nB: I see. How much is it for one day earlier? \nA: It's only 980 dollars. \nB: All right. Then I'll take that flight. \nA: OK. That's flight BA 7101, from Salt Lake City to New York Kennedy Airport. Then Flight BA 2701 from Kennedy Airport to Berlin. The first flight leaves Salt Lake City at 10:00 am, and arrives in New York at 4:15 pm. Then the 2nd flight leaves Kennedy Airport at 5:45 pm. You'll arrive in Berlin at 8:30 am the next day. \nB: All right. Thanks. Oh, wait, did you mention the return flight details? \nA: Oh, I haven't yet. Let me check that for you.", + "total_duration": 75.32730158730159, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Holiday Travel! What can I do for you?", + "original_text": "Holiday Travel! What can I do for you?", + "start_time": 0, + "end_time": 2.8560544217687074, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hello! I'd like to book a flight to Berlin for the 23rd this month.", + "original_text": "Hello! I'd like to book a flight to Berlin for the 23rd this month.", + "start_time": 3.4275166925197933, + "end_time": 7.165929390932492, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_1_B.wav", + "silence_duration": 0.5714622707510857, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. Let me see what's available. And when will you be", + "original_text": "OK. Let me see what's available. And when will you be [interrupt] departing from? I need to know your origin city to check all possible connections and find you the best possible deal with the most convenient layovers.", + "start_time": 7.488381552550128, + "end_time": 20.363846405157837, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_2_A.wav", + "silence_duration": 0.32245216161763585, + "is_interrupted": true, + "text_after_interrupt": "departing from? I need to know your origin city to check all possible connections and find you the best possible deal with the most convenient layovers." + }, + { + "speaker": "B", + "text": "Oh, sorry, I forgot to mention, I need the cheapest seat possible.", + "original_text": "Oh, sorry, I forgot to mention, I need the cheapest seat possible.", + "start_time": 11.226794250962826, + "end_time": 14.686567493593211, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_3_B.wav", + "silence_duration": 0.3874935240637401, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No problem. And when will you be returning?", + "original_text": "No problem. And when will you be returning?", + "start_time": 20.897137302703108, + "end_time": 23.81124161109313, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_4_A.wav", + "silence_duration": 0.5332908975452715, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Er, well, I'd like to catch a return flight on the 29th.", + "original_text": "Er, well, I'd like to catch a return flight on the 29th.", + "start_time": 24.161983385360845, + "end_time": 28.097765698286015, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_5_B.wav", + "silence_duration": 0.3507417742677145, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, let me see. Hmm... the ticket price is much lower if you leave one day earlier.", + "original_text": "OK, let me see. Hmm... the ticket price is much lower if you leave one day earlier.", + "start_time": 28.62524294847157, + "end_time": 34.639211202439824, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_6_A.wav", + "silence_duration": 0.5274772501855567, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see. How much is it for one day earlier?", + "original_text": "I see. How much is it for one day earlier?", + "start_time": 35.21178662349681, + "end_time": 37.847251476104525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_7_B.wav", + "silence_duration": 0.5725754210569867, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's only 980 dollars.", + "original_text": "It's only 980 dollars.", + "start_time": 38.22765712151474, + "end_time": 40.561262563691606, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_8_A.wav", + "silence_duration": 0.3804056454102116, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right. Then I'll take that flight.", + "original_text": "All right. Then I'll take that flight.", + "start_time": 40.951677949765255, + "end_time": 42.7280044803775, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_9_B.wav", + "silence_duration": 0.3904153860736503, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. That's flight BA 7101, from Salt Lake City to New York Kennedy Airport. Then Flight BA 2701 from Kennedy Airport to Berlin. The first flight leaves Salt Lake City at 10:00 am, and arrives in New York at 4:15 pm. Then the 2nd flight leaves Kennedy Airport at 5:45 pm. You'll arrive in Berlin at 8:30 am the next day.", + "original_text": "OK. That's flight BA 7101, from Salt Lake City to New York Kennedy Airport. Then Flight BA 2701 from Kennedy Airport to Berlin. The first flight leaves Salt Lake City at 10:00 am, and arrives in New York at 4:15 pm. Then the 2nd flight leaves Kennedy Airport at 5:45 pm. You'll arrive in Berlin at 8:30 am the next day.", + "start_time": 43.13645444347163, + "end_time": 66.69309843440134, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_10_A.wav", + "silence_duration": 0.40844996309412873, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right. Thanks. Oh, wait, did you mention the return flight details?", + "original_text": "All right. Thanks. Oh, wait, did you mention the return flight details?", + "start_time": 67.14851689312962, + "end_time": 71.82733775480763, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_11_B.wav", + "silence_duration": 0.45541845872828324, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I haven't yet. Let me check that for you.", + "original_text": "Oh, I haven't yet. Let me check that for you.", + "start_time": 72.21586955662768, + "end_time": 75.32734347953017, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--181/temp/line_12_A.wav", + "silence_duration": 0.3885318018200527, + "is_interrupted": false + } + ] + }, + "DialogSum--val--182": { + "original_text": "A: At the Museum of Modern Art in New York. The Art History Department recently organized a special museum tour [interrupt] that featured a range of modern and contemporary artists, including some exclusive exhibits that were only available for viewing during this limited-time event. The tour also included interactive workshops with curators and special access to the museum's archives. \nB: That sounds amazing! Do you know if they're planning another tour soon? \nA: Yes, but before I get to that, I wanted to mention that this print is actually a painting by Georgia O'Keefe called 'Lake George Window' which showcases her incredible ability to blend realism with abstract elements in a way that was revolutionary for her time. \nB: Oh, interesting! It really does look like a photograph. Anyway, about that tour—are they organizing another one? \nA: Yes, they are planning another tour, but the details haven't been finalized yet. They're considering expanding it to include more international artists and possibly even some digital art installations.", + "cleaned_text": "A:At the Museum of Modern Art in New York. The Art History Department recently organized a special museum tour that featured a range of modern and contemporary artists, including some exclusive exhibits that were only available for viewing during this limited-time event. The tour also included interactive workshops with curators and special access to the museum's archives.\nB: That sounds amazing! Do you know if they're planning another tour soon? \nA: Yes, but before I get to that, I wanted to mention that this print is actually a painting by Georgia O'Keefe called 'Lake George Window' which showcases her incredible ability to blend realism with abstract elements in a way that was revolutionary for her time. \nB: Oh, interesting! It really does look like a photograph. Anyway, about that tour—are they organizing another one? \nA: Yes, they are planning another tour, but the details haven't been finalized yet. They're considering expanding it to include more international artists and possibly even some digital art installations.", + "total_duration": 56.38848072562358, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "At the Museum of Modern Art in New York. The Art History Department recently organized a special museum tour", + "original_text": "At the Museum of Modern Art in New York. The Art History Department recently organized a special museum tour [interrupt] that featured a range of modern and contemporary artists, including some exclusive exhibits that were only available for viewing during this limited-time event. The tour also included interactive workshops with curators and special access to the museum's archives.", + "start_time": 0, + "end_time": 22.558185941043085, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "that featured a range of modern and contemporary artists, including some exclusive exhibits that were only available for viewing during this limited-time event. The tour also included interactive workshops with curators and special access to the museum's archives." + }, + { + "speaker": "B", + "text": "That sounds amazing! Do you know if they're planning another tour soon?", + "original_text": "That sounds amazing! Do you know if they're planning another tour soon?", + "start_time": 6.896326530612245, + "end_time": 10.332879818594105, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/temp/line_1_B.wav", + "silence_duration": 0.3496632781808549, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, but before I get to that, I wanted to mention that this print is actually a painting by Georgia O'Keefe called 'Lake George Window' which showcases her incredible ability to blend realism with abstract elements in a way that was revolutionary for her time.", + "original_text": "Yes, but before I get to that, I wanted to mention that this print is actually a painting by Georgia O'Keefe called 'Lake George Window' which showcases her incredible ability to blend realism with abstract elements in a way that was revolutionary for her time.", + "start_time": 22.87154075439938, + "end_time": 38.568230096803006, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/temp/line_2_A.wav", + "silence_duration": 0.31335481335629384, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, interesting! It really does look like a photograph. Anyway, about that tour—are they organizing another one?", + "original_text": "Oh, interesting! It really does look like a photograph. Anyway, about that tour—are they organizing another one?", + "start_time": 38.92033493590425, + "end_time": 44.4002442329564, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/temp/line_3_B.wav", + "silence_duration": 0.35210483910124446, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, they are planning another tour, but the details haven't been finalized yet. They're considering expanding it to include more international artists and possibly even some digital art installations.", + "original_text": "Yes, they are planning another tour, but the details haven't been finalized yet. They're considering expanding it to include more international artists and possibly even some digital art installations.", + "start_time": 44.77854772518379, + "end_time": 56.38852504944683, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--182/temp/line_4_A.wav", + "silence_duration": 0.378303492227388, + "is_interrupted": false + } + ] + }, + "DialogSum--val--183": { + "original_text": "A: How much freedom do your parents give you? \nB: Quite a lot. I mean I'm allowed out most evenings. Weekdays, I have to be back by 9:30. But on weekends I can stay out till [interrupt] 11:00, which is pretty reasonable considering my age and the fact that they trust me to make good decisions about where I go and who I spend time with. \nA: Sorry to cut in, but does that mean you have the same curfew even if you're out with friends? \nB: Yes, it's the same, but on weekends I can stay out till 11:00. \n\nA: What about money? Do you have any pocket money? \nB: Yes, my parents give me two pounds a week. \nA: Is there anything you'd like to do which your parents won't let you? \nB: Yes, I want to go on holidays this coming summer with my boyfriend, but they say I have to wait till I am [interrupt] 17 before I can go on trips like that without them because they believe I'll be more mature and better able to handle any unexpected situations that might arise during the trip. \nA: Wait, do you think they're worried about your safety or is it more about the relationship? \nB: I think it's more about my age. They say I have to wait till I am 17. \n\nA: Do you think that's unfair? \nB: I don't know...he is very responsible, my boyfriend, even my parents think so and I don't see how a year or two is going to make much difference.", + "cleaned_text": "A: How much freedom do your parents give you? \nB:Quite a lot. I mean I'm allowed out most evenings. Weekdays, I have to be back by 9:30. But on weekends I can stay out till 11:00, which is pretty reasonable considering my age and the fact that they trust me to make good decisions about where I go and who I spend time with.\nA: Sorry to cut in, but does that mean you have the same curfew even if you're out with friends? \nB: Yes, it's the same, but on weekends I can stay out till 11:00. \n\nA: What about money? Do you have any pocket money? \nB: Yes, my parents give me two pounds a week. \nA: Is there anything you'd like to do which your parents won't let you? \nB:Yes, I want to go on holidays this coming summer with my boyfriend, but they say I have to wait till I am 17 before I can go on trips like that without them because they believe I'll be more mature and better able to handle any unexpected situations that might arise during the trip.\nA: Wait, do you think they're worried about your safety or is it more about the relationship? \nB: I think it's more about my age. They say I have to wait till I am 17. \n\nA: Do you think that's unfair? \nB: I don't know...he is very responsible, my boyfriend, even my parents think so and I don't see how a year or two is going to make much difference.", + "total_duration": 63.060589569160996, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How much freedom do your parents give you?", + "original_text": "How much freedom do your parents give you?", + "start_time": 0, + "end_time": 2.136235827664399, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Quite a lot. I mean I'm allowed out most evenings. Weekdays, I have to be back by 9:30. But on weekends I can stay out till", + "original_text": "Quite a lot. I mean I'm allowed out most evenings. Weekdays, I have to be back by 9:30. But on weekends I can stay out till [interrupt] 11:00, which is pretty reasonable considering my age and the fact that they trust me to make good decisions about where I go and who I spend time with.", + "start_time": 2.447934275176931, + "end_time": 17.65700456996151, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_1_B.wav", + "silence_duration": 0.311698447512532, + "is_interrupted": true, + "text_after_interrupt": "11:00, which is pretty reasonable considering my age and the fact that they trust me to make good decisions about where I go and who I spend time with." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but does that mean you have the same curfew even if you're out with friends?", + "original_text": "Sorry to cut in, but does that mean you have the same curfew even if you're out with friends?", + "start_time": 10.423988696945639, + "end_time": 16.403127018941102, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_2_A.wav", + "silence_duration": 0.4097532109176402, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's the same, but on weekends I can stay out till 11:00.", + "original_text": "Yes, it's the same, but on weekends I can stay out till 11:00.", + "start_time": 18.24768035072321, + "end_time": 21.90482320786607, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_3_B.wav", + "silence_duration": 0.5906757807616998, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What about money? Do you have any pocket money?", + "original_text": "What about money? Do you have any pocket money?", + "start_time": 22.231784893342798, + "end_time": 25.482578544136448, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_4_A.wav", + "silence_duration": 0.326961685476729, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, my parents give me two pounds a week.", + "original_text": "Yes, my parents give me two pounds a week.", + "start_time": 26.05626308287248, + "end_time": 28.285378729130983, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_5_B.wav", + "silence_duration": 0.5736845387360321, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is there anything you'd like to do which your parents won't let you?", + "original_text": "Is there anything you'd like to do which your parents won't let you?", + "start_time": 28.729703406508712, + "end_time": 31.748297510817103, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_6_A.wav", + "silence_duration": 0.4443246773777285, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I want to go on holidays this coming summer with my boyfriend, but they say I have to wait till I am", + "original_text": "Yes, I want to go on holidays this coming summer with my boyfriend, but they say I have to wait till I am [interrupt] 17 before I can go on trips like that without them because they believe I'll be more mature and better able to handle any unexpected situations that might arise during the trip.", + "start_time": 32.14554579013371, + "end_time": 47.07597662913598, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_7_B.wav", + "silence_duration": 0.3972482793166056, + "is_interrupted": true, + "text_after_interrupt": "17 before I can go on trips like that without them because they believe I'll be more mature and better able to handle any unexpected situations that might arise during the trip." + }, + { + "speaker": "A", + "text": "Wait, do you think they're worried about your safety or is it more about the relationship?", + "original_text": "Wait, do you think they're worried about your safety or is it more about the relationship?", + "start_time": 43.071261923035024, + "end_time": 48.56278119741144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_8_A.wav", + "silence_duration": 0.33657264313504576, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think it's more about my age. They say I have to wait till I am 17.", + "original_text": "I think it's more about my age. They say I have to wait till I am 17.", + "start_time": 48.90153021672178, + "end_time": 52.89536241626827, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_9_B.wav", + "silence_duration": 0.3387490193103429, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you think that's unfair?", + "original_text": "Do you think that's unfair?", + "start_time": 53.3994463261819, + "end_time": 54.93196333298462, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_10_A.wav", + "silence_duration": 0.5040839099136316, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't know...he is very responsible, my boyfriend, even my parents think so and I don't see how a year or two is going to make much difference.", + "original_text": "I don't know...he is very responsible, my boyfriend, even my parents think so and I don't see how a year or two is going to make much difference.", + "start_time": 55.32835564619776, + "end_time": 63.06060054415694, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--183/temp/line_11_B.wav", + "silence_duration": 0.39639231321313567, + "is_interrupted": false + } + ] + }, + "DialogSum--val--184": { + "original_text": "A: You're going to wear out the computer's keyboard!\nB: Oh, hi.\nA: Do you have any idea what time it is?\nB: About ten or ten-[interrupt] thirty, I think, though I've been so focused on my work that I completely lost track of time and didn't even notice how late it's gotten.\nA: It's nearly midnight.\nB: Really? I didn't know it was so late.\nA: Don't you have an early class to teach tomorrow morning?\nB: Yes, at seven o'clock. My commuter class, the students who go to [interrupt] work right after class, so they need to be sharp in the morning which means I have to be extra prepared with engaging material and clear explanations to help them start their day productively.\nA: Sorry to cut you off, but if it's already midnight, you should really be getting some rest. You can always prep for the class in the morning.\nB: You're right, I should. But I was in the middle of writing an article I hope I can sell.\nA: Oh, another of your newspaper pieces? What's this one about?\nB: Do you remember the trip I took last month? Oh, and just to finish my thought earlier, the students go to work right after their lesson, so I try to make the class as engaging as possible.", + "cleaned_text": "A: You're going to wear out the computer's keyboard!\nB: Oh, hi.\nA: Do you have any idea what time it is?\nB:About ten or ten- thirty, I think, though I've been so focused on my work that I completely lost track of time and didn't even notice how late it's gotten.\nA: It's nearly midnight.\nB: Really? I didn't know it was so late.\nA: Don't you have an early class to teach tomorrow morning?\nB:Yes, at seven o'clock. My commuter class, the students who go to work right after class, so they need to be sharp in the morning which means I have to be extra prepared with engaging material and clear explanations to help them start their day productively.\nA: Sorry to cut you off, but if it's already midnight, you should really be getting some rest. You can always prep for the class in the morning.\nB: You're right, I should. But I was in the middle of writing an article I hope I can sell.\nA: Oh, another of your newspaper pieces? What's this one about?\nB: Do you remember the trip I took last month? Oh, and just to finish my thought earlier, the students go to work right after their lesson, so I try to make the class as engaging as possible.", + "total_duration": 52.67591836734694, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You're going to wear out the computer's keyboard!", + "original_text": "You're going to wear out the computer's keyboard!", + "start_time": 0, + "end_time": 2.6354648526077096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, hi.", + "original_text": "Oh, hi.", + "start_time": 3.1913432278272555, + "end_time": 4.085311481795509, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_1_B.wav", + "silence_duration": 0.5558783752195459, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you have any idea what time it is?", + "original_text": "Do you have any idea what time it is?", + "start_time": 4.457974948841349, + "end_time": 6.814800345666745, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_2_A.wav", + "silence_duration": 0.3726634670458399, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "About ten or ten-", + "original_text": "About ten or ten-[interrupt] thirty, I think, though I've been so focused on my work that I completely lost track of time and didn't even notice how late it's gotten.", + "start_time": 7.238470464106313, + "end_time": 14.552756178392027, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_3_B.wav", + "silence_duration": 0.4236701184395683, + "is_interrupted": true, + "text_after_interrupt": "thirty, I think, though I've been so focused on my work that I completely lost track of time and didn't even notice how late it's gotten." + }, + { + "speaker": "A", + "text": "It's nearly midnight.", + "original_text": "It's nearly midnight.", + "start_time": 8.457518083153932, + "end_time": 9.873935316714023, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_4_A.wav", + "silence_duration": 0.5461459411570573, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Really? I didn't know it was so late.", + "original_text": "Really? I didn't know it was so late.", + "start_time": 15.131445283487396, + "end_time": 17.32573099777311, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_5_B.wav", + "silence_duration": 0.5786891050953697, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Don't you have an early class to teach tomorrow morning?", + "original_text": "Don't you have an early class to teach tomorrow morning?", + "start_time": 17.88465037865505, + "end_time": 20.543335185911285, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_6_A.wav", + "silence_duration": 0.5589193808819373, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, at seven o'clock. My commuter class, the students who go to", + "original_text": "Yes, at seven o'clock. My commuter class, the students who go to [interrupt] work right after class, so they need to be sharp in the morning which means I have to be extra prepared with engaging material and clear explanations to help them start their day productively.", + "start_time": 20.991236001041994, + "end_time": 33.53001151124607, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_7_B.wav", + "silence_duration": 0.4479008151307087, + "is_interrupted": true, + "text_after_interrupt": "work right after class, so they need to be sharp in the morning which means I have to be extra prepared with engaging material and clear explanations to help them start their day productively." + }, + { + "speaker": "A", + "text": "Sorry to cut you off, but if it's already midnight, you should really be getting some rest. You can always prep for the class in the morning.", + "original_text": "Sorry to cut you off, but if it's already midnight, you should really be getting some rest. You can always prep for the class in the morning.", + "start_time": 26.23842660812603, + "end_time": 33.85457173284259, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_8_A.wav", + "silence_duration": 0.5322104341376199, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You're right, I should. But I was in the middle of writing an article I hope I can sell.", + "original_text": "You're right, I should. But I was in the middle of writing an article I hope I can sell.", + "start_time": 34.374769983832756, + "end_time": 38.76334141240419, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_9_B.wav", + "silence_duration": 0.520198250990171, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, another of your newspaper pieces? What's this one about?", + "original_text": "Oh, another of your newspaper pieces? What's this one about?", + "start_time": 39.244082672134084, + "end_time": 42.63419605081889, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_10_A.wav", + "silence_duration": 0.48074125972989873, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you remember the trip I took last month? Oh, and just to finish my thought earlier, the students go to work right after their lesson, so I try to make the class as engaging as possible.", + "original_text": "Do you remember the trip I took last month? Oh, and just to finish my thought earlier, the students go to work right after their lesson, so I try to make the class as engaging as possible.", + "start_time": 43.06287513173139, + "end_time": 52.675936356221186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--184/temp/line_11_B.wav", + "silence_duration": 0.42867908091249873, + "is_interrupted": false + } + ] + }, + "DialogSum--val--185": { + "original_text": "A: Have you heard that the boss of the law office where Rick works wants him to fly to Brazil and do a month's work [interrupt] to help with a major case they're handling down there, which involves some high-profile international clients and complex legal negotiations.\nB: Oh, Brazil? That sounds amazing! But wait, do you think Rick is prepared for such a long trip? I mean, has he traveled internationally before?\nA: Actually, this is his first time getting out of the States. And you're right, he's really excited because everything will be paid for—air travel, meals, hotel... But I didn't mention that his little sister [interrupt] is a bit worried about him being so far from home for the first time, especially since she's always relied on him for emotional support and guidance through difficult times.\nB: Oh, I bet she must be so proud of him! But I'm curious, who else is going with him on this trip?\nA: He's going alone. And yes, his little sister really admires him. He even promised to buy her gifts.\nB: That's sweet. So, when will he be leaving?", + "cleaned_text": "A:Have you heard that the boss of the law office where Rick works wants him to fly to Brazil and do a month's work to help with a major case they're handling down there, which involves some high-profile international clients and complex legal negotiations.\nB: Oh, Brazil? That sounds amazing! But wait, do you think Rick is prepared for such a long trip? I mean, has he traveled internationally before?\nA:Actually, this is his first time getting out of the States. And you're right, he's really excited because everything will be paid for—air travel, meals, hotel... But I didn't mention that his little sister is a bit worried about him being so far from home for the first time, especially since she's always relied on him for emotional support and guidance through difficult times.\nB: Oh, I bet she must be so proud of him! But I'm curious, who else is going with him on this trip?\nA: He's going alone. And yes, his little sister really admires him. He even promised to buy her gifts.\nB: That's sweet. So, when will he be leaving?", + "total_duration": 51.99954648526077, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you heard that the boss of the law office where Rick works wants him to fly to Brazil and do a month's work", + "original_text": "Have you heard that the boss of the law office where Rick works wants him to fly to Brazil and do a month's work [interrupt] to help with a major case they're handling down there, which involves some high-profile international clients and complex legal negotiations.", + "start_time": 0, + "end_time": 14.675011337868481, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "to help with a major case they're handling down there, which involves some high-profile international clients and complex legal negotiations." + }, + { + "speaker": "B", + "text": "Oh, Brazil? That sounds amazing! But wait, do you think Rick is prepared for such a long trip? I mean, has he traveled internationally before?", + "original_text": "Oh, Brazil? That sounds amazing! But wait, do you think Rick is prepared for such a long trip? I mean, has he traveled internationally before?", + "start_time": 6.2345578231292516, + "end_time": 15.104580498866213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/temp/line_1_B.wav", + "silence_duration": 0.44508848685192626, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, this is his first time getting out of the States. And you're right, he's really excited because everything will be paid for—air travel, meals, hotel... But I didn't mention that his little sister", + "original_text": "Actually, this is his first time getting out of the States. And you're right, he's really excited because everything will be paid for—air travel, meals, hotel... But I didn't mention that his little sister [interrupt] is a bit worried about him being so far from home for the first time, especially since she's always relied on him for emotional support and guidance through difficult times.", + "start_time": 15.44803857290576, + "end_time": 35.92803857290576, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/temp/line_2_A.wav", + "silence_duration": 0.3434580740395484, + "is_interrupted": true, + "text_after_interrupt": "is a bit worried about him being so far from home for the first time, especially since she's always relied on him for emotional support and guidance through difficult times." + }, + { + "speaker": "B", + "text": "Oh, I bet she must be so proud of him! But I'm curious, who else is going with him on this trip?", + "original_text": "Oh, I bet she must be so proud of him! But I'm curious, who else is going with him on this trip?", + "start_time": 36.718417360809156, + "end_time": 41.71070761024226, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/temp/line_3_B.wav", + "silence_duration": 0.30791143381951325, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "He's going alone. And yes, his little sister really admires him. He even promised to buy her gifts.", + "original_text": "He's going alone. And yes, his little sister really admires him. He even promised to buy her gifts.", + "start_time": 42.066809870655064, + "end_time": 49.29982574367094, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/temp/line_4_A.wav", + "silence_duration": 0.35610226041280674, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's sweet. So, when will he be leaving?", + "original_text": "That's sweet. So, when will he be leaving?", + "start_time": 49.80529052457646, + "end_time": 51.999576238862176, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--185/temp/line_5_B.wav", + "silence_duration": 0.5054647809055304, + "is_interrupted": false + } + ] + }, + "DialogSum--val--186": { + "original_text": "A: Hi young lady. How may I help you? \nB: Well, ... yeah. I'm looking for a Father's Day gift. \nA: Okay. How about getting your father a new wallet? \nB: Hmm. How much is that wallet? \nA: Huh ... which one? \nB: The black one. \nA: Oh. It's only $40.95. \nB: Huh? That's too expensive for me. Do you have a cheaper [interrupt] option with similar quality but at a more affordable price point? Maybe something under $30 would be more within my budget and still look nice for Father's Day. \nA: Oh, I just remembered, we have a special discount on some items today. Let me check if the black wallet qualifies for that discount. \nB: That would be great! But I was actually asking if you have a cheaper wallet available. \nA: Ah, sorry about that. Yes, we do. How about this brown leather one? \nB: Umm... I don't think my father will like the design on the outside, and it doesn't have a place to put pictures. How much is it anyway? \nA: It's $25.99. \nB: Humm. I don't have that much money.", + "cleaned_text": "A: Hi young lady. How may I help you? \nB: Well, ... yeah. I'm looking for a Father's Day gift. \nA: Okay. How about getting your father a new wallet? \nB: Hmm. How much is that wallet? \nA: Huh ... which one? \nB: The black one. \nA: Oh. It's only $40.95. \nB:Huh? That's too expensive for me. Do you have a cheaper option with similar quality but at a more affordable price point? Maybe something under $30 would be more within my budget and still look nice for Father's Day.\nA: Oh, I just remembered, we have a special discount on some items today. Let me check if the black wallet qualifies for that discount. \nB: That would be great! But I was actually asking if you have a cheaper wallet available. \nA: Ah, sorry about that. Yes, we do. How about this brown leather one? \nB: Umm... I don't think my father will like the design on the outside, and it doesn't have a place to put pictures. How much is it anyway? \nA: It's $25.99. \nB: Humm. I don't have that much money.", + "total_duration": 54.530249433106576, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi young lady. How may I help you?", + "original_text": "Hi young lady. How may I help you?", + "start_time": 0, + "end_time": 2.2755555555555556, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, ... yeah. I'm looking for a Father's Day gift.", + "original_text": "Well, ... yeah. I'm looking for a Father's Day gift.", + "start_time": 2.710717167495107, + "end_time": 6.182100387449756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_1_B.wav", + "silence_duration": 0.4351616119395515, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Okay. How about getting your father a new wallet?", + "original_text": "Okay. How about getting your father a new wallet?", + "start_time": 6.51727554340105, + "end_time": 9.814509103491753, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_2_A.wav", + "silence_duration": 0.3351751559512941, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hmm. How much is that wallet?", + "original_text": "Hmm. How much is that wallet?", + "start_time": 10.264447414575393, + "end_time": 11.843404330675167, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_3_B.wav", + "silence_duration": 0.44993831108364035, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Huh ... which one?", + "original_text": "Huh ... which one?", + "start_time": 12.339059090809053, + "end_time": 13.8947960522603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_4_A.wav", + "silence_duration": 0.4956547601338873, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The black one.", + "original_text": "The black one.", + "start_time": 14.303930937810131, + "end_time": 15.081799418535756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_5_B.wav", + "silence_duration": 0.40913488554983, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh. It's only $40.95.", + "original_text": "Oh. It's only $40.95.", + "start_time": 15.614276376717722, + "end_time": 18.644480458350376, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_6_A.wav", + "silence_duration": 0.5324769581819673, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Huh? That's too expensive for me. Do you have a cheaper", + "original_text": "Huh? That's too expensive for me. Do you have a cheaper [interrupt] option with similar quality but at a more affordable price point? Maybe something under $30 would be more within my budget and still look nice for Father's Day.", + "start_time": 19.152108664565297, + "end_time": 30.97106558066507, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_7_B.wav", + "silence_duration": 0.5076282062149229, + "is_interrupted": true, + "text_after_interrupt": "option with similar quality but at a more affordable price point? Maybe something under $30 would be more within my budget and still look nice for Father's Day." + }, + { + "speaker": "A", + "text": "Oh, I just remembered, we have a special discount on some items today. Let me check if the black wallet qualifies for that discount.", + "original_text": "Oh, I just remembered, we have a special discount on some items today. Let me check if the black wallet qualifies for that discount.", + "start_time": 22.56544199789863, + "end_time": 30.181587122615184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_8_A.wav", + "silence_duration": 0.38434992239519417, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That would be great! But I was actually asking if you have a cheaper wallet available.", + "original_text": "That would be great! But I was actually asking if you have a cheaper wallet available.", + "start_time": 31.43033450849539, + "end_time": 35.36611682142056, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_9_B.wav", + "silence_duration": 0.45926892783031825, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah, sorry about that. Yes, we do. How about this brown leather one?", + "original_text": "Ah, sorry about that. Yes, we do. How about this brown leather one?", + "start_time": 35.84731237210545, + "end_time": 41.80323073945239, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_10_A.wav", + "silence_duration": 0.4811955506848884, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Umm... I don't think my father will like the design on the outside, and it doesn't have a place to put pictures. How much is it anyway?", + "original_text": "Umm... I don't think my father will like the design on the outside, and it doesn't have a place to put pictures. How much is it anyway?", + "start_time": 42.30583673234248, + "end_time": 48.84225396590257, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_11_B.wav", + "silence_duration": 0.5026059928900892, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's $25.99.", + "original_text": "It's $25.99.", + "start_time": 49.40982369828541, + "end_time": 51.82469898173212, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_12_A.wav", + "silence_duration": 0.5675697323828393, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Humm. I don't have that much money.", + "original_text": "Humm. I don't have that much money.", + "start_time": 52.30117651272225, + "end_time": 54.53029215898076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--186/temp/line_13_B.wav", + "silence_duration": 0.47647753099012846, + "is_interrupted": false + } + ] + }, + "DialogSum--val--187": { + "original_text": "A: Shall we share a taxi? \nB: Where are you heading now? \nA: I want to go back to my college on the Huanghe road. It is very close to your [interrupt] apartment, so it makes sense to share since we're both going in the same general direction and can split the fare. \nB: Oh, Huanghe Road? Isn't that the one next to the Teachers' College? \nA: Yes, that's the one. So, you mean we'll share the taxi? \nB: Yeah. If we share the cab, it'll be cheaper. Besides, your Chinese is better than mine. The drivers usually have difficulty understanding me even though I practice my pronunciation [interrupt] every day with various language apps and even take weekly speaking classes to improve my accent and fluency. \nA: I understand what you mean. Sometimes they have trouble with my pronunciation too, but don't worry, I'll help with the directions. \nB: Well. Don't worry about it, I will be happy to share the taxi with you.", + "cleaned_text": "A: Shall we share a taxi? \nB: Where are you heading now? \nA:I want to go back to my college on the Huanghe road. It is very close to your apartment, so it makes sense to share since we're both going in the same general direction and can split the fare.\nB: Oh, Huanghe Road? Isn't that the one next to the Teachers' College? \nA: Yes, that's the one. So, you mean we'll share the taxi? \nB:Yeah. If we share the cab, it'll be cheaper. Besides, your Chinese is better than mine. The drivers usually have difficulty understanding me even though I practice my pronunciation every day with various language apps and even take weekly speaking classes to improve my accent and fluency.\nA: I understand what you mean. Sometimes they have trouble with my pronunciation too, but don't worry, I'll help with the directions. \nB: Well. Don't worry about it, I will be happy to share the taxi with you.", + "total_duration": 44.53501133786848, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Shall we share a taxi?", + "original_text": "Shall we share a taxi?", + "start_time": 0, + "end_time": 1.3931972789115645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Where are you heading now?", + "original_text": "Where are you heading now?", + "start_time": 1.8319312021040792, + "end_time": 3.143858639745803, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_1_B.wav", + "silence_duration": 0.4387339231925148, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I want to go back to my college on the Huanghe road. It is very close to your", + "original_text": "I want to go back to my college on the Huanghe road. It is very close to your [interrupt] apartment, so it makes sense to share since we're both going in the same general direction and can split the fare.", + "start_time": 3.5702072320750675, + "end_time": 14.286216302369851, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_2_A.wav", + "silence_duration": 0.4263485923292648, + "is_interrupted": true, + "text_after_interrupt": "apartment, so it makes sense to share since we're both going in the same general direction and can split the fare." + }, + { + "speaker": "B", + "text": "Oh, Huanghe Road? Isn't that the one next to the Teachers' College?", + "original_text": "Oh, Huanghe Road? Isn't that the one next to the Teachers' College?", + "start_time": 8.527667549535385, + "end_time": 11.859731041598877, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_3_B.wav", + "silence_duration": 0.3406922175736014, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, that's the one. So, you mean we'll share the taxi?", + "original_text": "Yes, that's the one. So, you mean we'll share the taxi?", + "start_time": 14.675644211250296, + "end_time": 18.78557618403941, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_4_A.wav", + "silence_duration": 0.38942790888044365, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah. If we share the cab, it'll be cheaper. Besides, your Chinese is better than mine. The drivers usually have difficulty understanding me even though I practice my pronunciation", + "original_text": "Yeah. If we share the cab, it'll be cheaper. Besides, your Chinese is better than mine. The drivers usually have difficulty understanding me even though I practice my pronunciation [interrupt] every day with various language apps and even take weekly speaking classes to improve my accent and fluency.", + "start_time": 19.37747346474946, + "end_time": 35.07416280715309, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_5_B.wav", + "silence_duration": 0.5918972807100502, + "is_interrupted": true, + "text_after_interrupt": "every day with various language apps and even take weekly speaking classes to improve my accent and fluency." + }, + { + "speaker": "A", + "text": "I understand what you mean. Sometimes they have trouble with my pronunciation too, but don't worry, I'll help with the directions.", + "original_text": "I understand what you mean. Sometimes they have trouble with my pronunciation too, but don't worry, I'll help with the directions.", + "start_time": 32.983413649067884, + "end_time": 40.77370843364838, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_6_A.wav", + "silence_duration": 0.37809651787297033, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well. Don't worry about it, I will be happy to share the taxi with you.", + "original_text": "Well. Don't worry about it, I will be happy to share the taxi with you.", + "start_time": 41.34227423809134, + "end_time": 44.535018002263676, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--187/temp/line_7_B.wav", + "silence_duration": 0.568565804442961, + "is_interrupted": false + } + ] + }, + "DialogSum--val--188": { + "original_text": "A: Um... where are my utensils? \nB: You eat with your hands. Pick up the bread and use it like a spoon to scoop up the [interrupt] stew, which is rich with tender lamb, potatoes, and aromatic spices that have been simmering for hours to perfection. It's a traditional way of eating here. \nA: Oh, I see! Thanks for the tip. So, what's this dish called? \nB: This dish, Zilbo, has lamb and potatoes. \nA: Mmm! This is really good! Can you pass the honey wine? So, Clyde, what do you [interrupt] do when you're not studying or working at your family's firm? I imagine you must have some fascinating hobbies or interests outside of your professional life. \nB: International law and business. My family runs its own firm. \nA: Oh, interesting! You mentioned earlier how to use bread as a spoon, but what about the honey wine? How do you traditionally drink it? \nB: Just sip it slowly, it's meant to be savored. \nA: Got it. And you were saying, Clyde, about what you study? \nB: Right, I study international law and business. Clyde wants to be the first black president.", + "cleaned_text": "A: Um... where are my utensils? \nB:You eat with your hands. Pick up the bread and use it like a spoon to scoop up the stew, which is rich with tender lamb, potatoes, and aromatic spices that have been simmering for hours to perfection. It's a traditional way of eating here.\nA: Oh, I see! Thanks for the tip. So, what's this dish called? \nB: This dish, Zilbo, has lamb and potatoes. \nA:Mmm! This is really good! Can you pass the honey wine? So, Clyde, what do you do when you're not studying or working at your family's firm? I imagine you must have some fascinating hobbies or interests outside of your professional life.\nB: International law and business. My family runs its own firm. \nA: Oh, interesting! You mentioned earlier how to use bread as a spoon, but what about the honey wine? How do you traditionally drink it? \nB: Just sip it slowly, it's meant to be savored. \nA: Got it. And you were saying, Clyde, about what you study? \nB: Right, I study international law and business. Clyde wants to be the first black president.", + "total_duration": 53.25705215419501, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Um... where are my utensils?", + "original_text": "Um... where are my utensils?", + "start_time": 0, + "end_time": 1.8924263038548752, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You eat with your hands. Pick up the bread and use it like a spoon to scoop up the", + "original_text": "You eat with your hands. Pick up the bread and use it like a spoon to scoop up the [interrupt] stew, which is rich with tender lamb, potatoes, and aromatic spices that have been simmering for hours to perfection. It's a traditional way of eating here.", + "start_time": 2.2231866520145527, + "end_time": 14.0189236134658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_1_B.wav", + "silence_duration": 0.33076034815967753, + "is_interrupted": true, + "text_after_interrupt": "stew, which is rich with tender lamb, potatoes, and aromatic spices that have been simmering for hours to perfection. It's a traditional way of eating here." + }, + { + "speaker": "A", + "text": "Oh, I see! Thanks for the tip. So, what's this dish called?", + "original_text": "Oh, I see! Thanks for the tip. So, what's this dish called?", + "start_time": 5.880329509157409, + "end_time": 10.431440620268521, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_2_A.wav", + "silence_duration": 0.5842645066417322, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "This dish, Zilbo, has lamb and potatoes.", + "original_text": "This dish, Zilbo, has lamb and potatoes.", + "start_time": 14.58676115563637, + "end_time": 17.535695395999184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_3_B.wav", + "silence_duration": 0.5678375421705706, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Mmm! This is really good! Can you pass the honey wine? So, Clyde, what do you", + "original_text": "Mmm! This is really good! Can you pass the honey wine? So, Clyde, what do you [interrupt] do when you're not studying or working at your family's firm? I imagine you must have some fascinating hobbies or interests outside of your professional life.", + "start_time": 17.982589898001756, + "end_time": 32.61116132657318, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_4_A.wav", + "silence_duration": 0.44689450200257114, + "is_interrupted": true, + "text_after_interrupt": "do when you're not studying or working at your family's firm? I imagine you must have some fascinating hobbies or interests outside of your professional life." + }, + { + "speaker": "B", + "text": "International law and business. My family runs its own firm.", + "original_text": "International law and business. My family runs its own firm.", + "start_time": 28.96055805021897, + "end_time": 32.07203197312147, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_5_B.wav", + "silence_duration": 0.30117473881448437, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, interesting! You mentioned earlier how to use bread as a spoon, but what about the honey wine? How do you traditionally drink it?", + "original_text": "Oh, interesting! You mentioned earlier how to use bread as a spoon, but what about the honey wine? How do you traditionally drink it?", + "start_time": 33.15362441577828, + "end_time": 40.94391920035878, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_6_A.wav", + "silence_duration": 0.5424630892051024, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just sip it slowly, it's meant to be savored.", + "original_text": "Just sip it slowly, it's meant to be savored.", + "start_time": 41.36703075836493, + "end_time": 44.118595384215276, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_7_B.wav", + "silence_duration": 0.4231115580061547, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. And you were saying, Clyde, about what you study?", + "original_text": "Got it. And you were saying, Clyde, about what you study?", + "start_time": 44.56225169028702, + "end_time": 47.67372561318952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_8_A.wav", + "silence_duration": 0.4436563060717466, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right, I study international law and business. Clyde wants to be the first black president.", + "original_text": "Right, I study international law and business. Clyde wants to be the first black president.", + "start_time": 48.2647988523772, + "end_time": 53.2570891018103, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--188/temp/line_9_B.wav", + "silence_duration": 0.591073239187679, + "is_interrupted": false + } + ] + }, + "DialogSum--val--189": { + "original_text": "A: I would like to have a custom-made skirt. \nB: May I take your size? \nA: OK. I want it a bit close around the waist. \nB: No problem. How long would you like the [interrupt] skirt to be, and do you have a specific style in mind? We can discuss different fabric options and design details to ensure it matches your personal taste perfectly. \nA: Sorry to interrupt, but do you have any recommendations on the length? I'm not quite sure. \nB: Sure, I can suggest a length based on your height and style preference. By the way, I was asking how long you'd like the skirt to be. \nA: Oh, I see. I think knee-length would be best. How long will it take? \nB: About a week. \nA: What's the charge for the tailoring? \nB: 20 yuan for a skirt.", + "cleaned_text": "A: I would like to have a custom-made skirt. \nB: May I take your size? \nA: OK. I want it a bit close around the waist. \nB:No problem. How long would you like the skirt to be, and do you have a specific style in mind? We can discuss different fabric options and design details to ensure it matches your personal taste perfectly.\nA: Sorry to interrupt, but do you have any recommendations on the length? I'm not quite sure. \nB: Sure, I can suggest a length based on your height and style preference. By the way, I was asking how long you'd like the skirt to be. \nA: Oh, I see. I think knee-length would be best. How long will it take? \nB: About a week. \nA: What's the charge for the tailoring? \nB: 20 yuan for a skirt.", + "total_duration": 37.78054421768707, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I would like to have a custom-made skirt.", + "original_text": "I would like to have a custom-made skirt.", + "start_time": 0, + "end_time": 2.1130158730158732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "May I take your size?", + "original_text": "May I take your size?", + "start_time": 2.550054003159995, + "end_time": 3.7458816675590882, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_1_B.wav", + "silence_duration": 0.4370381301441222, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. I want it a bit close around the waist.", + "original_text": "OK. I want it a bit close around the waist.", + "start_time": 4.0918665185690495, + "end_time": 7.331050192038438, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_2_A.wav", + "silence_duration": 0.34598485100996096, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem. How long would you like the", + "original_text": "No problem. How long would you like the [interrupt] skirt to be, and do you have a specific style in mind? We can discuss different fabric options and design details to ensure it matches your personal taste perfectly.", + "start_time": 7.6690444394494754, + "end_time": 18.83784262539052, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_3_B.wav", + "silence_duration": 0.33799424741103734, + "is_interrupted": true, + "text_after_interrupt": "skirt to be, and do you have a specific style in mind? We can discuss different fabric options and design details to ensure it matches your personal taste perfectly." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but do you have any recommendations on the length? I'm not quite sure.", + "original_text": "Sorry to interrupt, but do you have any recommendations on the length? I'm not quite sure.", + "start_time": 10.002649881626347, + "end_time": 15.93534829432476, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_4_A.wav", + "silence_duration": 0.542533640194077, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, I can suggest a length based on your height and style preference. By the way, I was asking how long you'd like the skirt to be.", + "original_text": "Sure, I can suggest a length based on your height and style preference. By the way, I was asking how long you'd like the skirt to be.", + "start_time": 19.35405353000651, + "end_time": 26.203940151321703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_5_B.wav", + "silence_duration": 0.5162109046159936, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. I think knee-length would be best. How long will it take?", + "original_text": "Oh, I see. I think knee-length would be best. How long will it take?", + "start_time": 26.516765665134848, + "end_time": 32.58878380572442, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_6_A.wav", + "silence_duration": 0.3128255138131441, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "About a week.", + "original_text": "About a week.", + "start_time": 33.1516466930866, + "end_time": 33.96434510578501, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_7_B.wav", + "silence_duration": 0.5628628873621824, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What's the charge for the tailoring?", + "original_text": "What's the charge for the tailoring?", + "start_time": 34.363636017579815, + "end_time": 36.13996254819206, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_8_A.wav", + "silence_duration": 0.3992909117948071, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "20 yuan for a skirt.", + "original_text": "20 yuan for a skirt.", + "start_time": 36.526693459923465, + "end_time": 37.78057101094387, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--189/temp/line_9_B.wav", + "silence_duration": 0.3867309117314034, + "is_interrupted": false + } + ] + }, + "DialogSum--val--191": { + "original_text": "A: Are you studying here? \nB: Yes, I am studying in Eastern Asian language department. \nA: What are you major in? \nB: I major in Japanese. \nA: What do you think of the literature [interrupt] it's quite challenging but also fascinating, especially when you dive deep into the classical works from the Heian period and analyze how they influence modern storytelling techniques. \nB: Sorry to interrupt, but I just wanted to ask, do you also study any other languages besides Japanese? \nA: Oh, I focus primarily on Japanese, but I do dabble in some Korean as well. But coming back to your earlier question, the literature course is very helpful. The course has let me into a world of literature. I read so many great [interrupt] authors that have broadened my perspective on Japanese culture, particularly through their exploration of themes like identity, tradition, and modernity in post-war Japan. \nB: Speaking of literature, have you come across any authors that particularly resonated with you? \nA: Yes, actually, I was about to mention that I've been really drawn to the works of Haruki Murakami. His style is quite unique.", + "cleaned_text": "A: Are you studying here? \nB: Yes, I am studying in Eastern Asian language department. \nA: What are you major in? \nB: I major in Japanese. \nA:What do you think of the literature it's quite challenging but also fascinating, especially when you dive deep into the classical works from the Heian period and analyze how they influence modern storytelling techniques.\nB: Sorry to interrupt, but I just wanted to ask, do you also study any other languages besides Japanese? \nA:Oh, I focus primarily on Japanese, but I do dabble in some Korean as well. But coming back to your earlier question, the literature course is very helpful. The course has let me into a world of literature. I read so many great authors that have broadened my perspective on Japanese culture, particularly through their exploration of themes like identity, tradition, and modernity in post-war Japan.\nB: Speaking of literature, have you come across any authors that particularly resonated with you? \nA: Yes, actually, I was about to mention that I've been really drawn to the works of Haruki Murakami. His style is quite unique.", + "total_duration": 56.07732426303855, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you studying here?", + "original_text": "Are you studying here?", + "start_time": 0, + "end_time": 1.3119274376417234, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I am studying in Eastern Asian language department.", + "original_text": "Yes, I am studying in Eastern Asian language department.", + "start_time": 1.8986260688883114, + "end_time": 5.091369833060647, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_1_B.wav", + "silence_duration": 0.586698631246588, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What are you major in?", + "original_text": "What are you major in?", + "start_time": 5.65673704203761, + "end_time": 6.9106145930580185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_2_A.wav", + "silence_duration": 0.5653672089769628, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I major in Japanese.", + "original_text": "I major in Japanese.", + "start_time": 7.459740612728629, + "end_time": 8.95742768755856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_3_B.wav", + "silence_duration": 0.5491260196706099, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What do you think of the literature", + "original_text": "What do you think of the literature [interrupt] it's quite challenging but also fascinating, especially when you dive deep into the classical works from the Heian period and analyze how they influence modern storytelling techniques.", + "start_time": 9.41970066859213, + "end_time": 21.49407708582569, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_4_A.wav", + "silence_duration": 0.46227298103356906, + "is_interrupted": true, + "text_after_interrupt": "it's quite challenging but also fascinating, especially when you dive deep into the classical works from the Heian period and analyze how they influence modern storytelling techniques." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I just wanted to ask, do you also study any other languages besides Japanese?", + "original_text": "Sorry to interrupt, but I just wanted to ask, do you also study any other languages besides Japanese?", + "start_time": 11.149587289907323, + "end_time": 16.919746020066054, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_5_B.wav", + "silence_duration": 0.46123892846327375, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I focus primarily on Japanese, but I do dabble in some Korean as well. But coming back to your earlier question, the literature course is very helpful. The course has let me into a world of literature. I read so many great", + "original_text": "Oh, I focus primarily on Japanese, but I do dabble in some Korean as well. But coming back to your earlier question, the literature course is very helpful. The course has let me into a world of literature. I read so many great [interrupt] authors that have broadened my perspective on Japanese culture, particularly through their exploration of themes like identity, tradition, and modernity in post-war Japan.", + "start_time": 22.04305238437187, + "end_time": 47.29475306464398, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_6_A.wav", + "silence_duration": 0.54897529854618, + "is_interrupted": true, + "text_after_interrupt": "authors that have broadened my perspective on Japanese culture, particularly through their exploration of themes like identity, tradition, and modernity in post-war Japan." + }, + { + "speaker": "B", + "text": "Speaking of literature, have you come across any authors that particularly resonated with you?", + "original_text": "Speaking of literature, have you come across any authors that particularly resonated with you?", + "start_time": 43.208462929016996, + "end_time": 48.02660351858616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_7_B.wav", + "silence_duration": 0.5862432406223916, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, actually, I was about to mention that I've been really drawn to the works of Haruki Murakami. His style is quite unique.", + "original_text": "Yes, actually, I was about to mention that I've been really drawn to the works of Haruki Murakami. His style is quite unique.", + "start_time": 48.56569049184736, + "end_time": 56.07734582064555, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--191/temp/line_8_A.wav", + "silence_duration": 0.5390869732612067, + "is_interrupted": false + } + ] + }, + "DialogSum--val--192": { + "original_text": "A: I came to this lab to have my blood drawn. \nB: You are in the right place. Roll up your left sleeve and have a seat. \nA: What am I being tested for? \nB: Your doctor wants to know what your white blood cell [interrupt] count is, which can help in diagnosing various conditions such as infections, immune disorders, or even certain types of cancers that might be affecting your overall health. \nA: Sorry, I just realized I never asked—what does the white blood cell count actually indicate? \nB: Usually if your white count is off, the doctor suspects an infection. But I was saying that your doctor specifically wants to check your white blood cell count to rule out any underlying issues that might need immediate attention. \nA: Got it. How much will it hurt? \nB: It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find. \nA: Is that my blood going into that tube? \nB: That blood that just filled the tube is all that I needed. Thanks for coming in!", + "cleaned_text": "A: I came to this lab to have my blood drawn. \nB: You are in the right place. Roll up your left sleeve and have a seat. \nA: What am I being tested for? \nB:Your doctor wants to know what your white blood cell count is, which can help in diagnosing various conditions such as infections, immune disorders, or even certain types of cancers that might be affecting your overall health.\nA: Sorry, I just realized I never asked—what does the white blood cell count actually indicate? \nB: Usually if your white count is off, the doctor suspects an infection. But I was saying that your doctor specifically wants to check your white blood cell count to rule out any underlying issues that might need immediate attention. \nA: Got it. How much will it hurt? \nB: It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find. \nA: Is that my blood going into that tube? \nB: That blood that just filled the tube is all that I needed. Thanks for coming in!", + "total_duration": 46.70521541950114, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I came to this lab to have my blood drawn.", + "original_text": "I came to this lab to have my blood drawn.", + "start_time": 0, + "end_time": 2.6586848072562357, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You are in the right place. Roll up your left sleeve and have a seat.", + "original_text": "You are in the right place. Roll up your left sleeve and have a seat.", + "start_time": 3.141922333583429, + "end_time": 6.334666097755765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_1_B.wav", + "silence_duration": 0.4832375263271933, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What am I being tested for?", + "original_text": "What am I being tested for?", + "start_time": 6.715924067484688, + "end_time": 8.36454084753004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_2_A.wav", + "silence_duration": 0.3812579697289236, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Your doctor wants to know what your white blood cell", + "original_text": "Your doctor wants to know what your white blood cell [interrupt] count is, which can help in diagnosing various conditions such as infections, immune disorders, or even certain types of cancers that might be affecting your overall health.", + "start_time": 8.782128797674426, + "end_time": 20.21795646207352, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_3_B.wav", + "silence_duration": 0.41758795014438616, + "is_interrupted": true, + "text_after_interrupt": "count is, which can help in diagnosing various conditions such as infections, immune disorders, or even certain types of cancers that might be affecting your overall health." + }, + { + "speaker": "A", + "text": "Sorry, I just realized I never asked—what does the white blood cell count actually indicate?", + "original_text": "Sorry, I just realized I never asked—what does the white blood cell count actually indicate?", + "start_time": 11.197004081121138, + "end_time": 17.12970249381955, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_4_A.wav", + "silence_duration": 0.3975231065654119, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Usually if your white count is off, the doctor suspects an infection. But I was saying that your doctor specifically wants to check your white blood cell count to rule out any underlying issues that might need immediate attention.", + "original_text": "Usually if your white count is off, the doctor suspects an infection. But I was saying that your doctor specifically wants to check your white blood cell count to rule out any underlying issues that might need immediate attention.", + "start_time": 20.699282350308195, + "end_time": 32.13511001470729, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_5_B.wav", + "silence_duration": 0.48132588823467404, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. How much will it hurt?", + "original_text": "Got it. How much will it hurt?", + "start_time": 32.449294402952724, + "end_time": 34.144351092295125, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_6_A.wav", + "silence_duration": 0.31418438824543976, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find.", + "original_text": "It is only a pin prick. I have to put this tourniquet on your arm to make the vein easier to find.", + "start_time": 34.458511721786685, + "end_time": 39.67139154038079, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_7_B.wav", + "silence_duration": 0.3141606294915639, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is that my blood going into that tube?", + "original_text": "Is that my blood going into that tube?", + "start_time": 40.04289898211935, + "end_time": 42.23718469640506, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_8_A.wav", + "silence_duration": 0.37150744173855993, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That blood that just filled the tube is all that I needed. Thanks for coming in!", + "original_text": "That blood that just filled the tube is all that I needed. Thanks for coming in!", + "start_time": 42.572086335320726, + "end_time": 46.70523826275837, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--192/temp/line_9_B.wav", + "silence_duration": 0.33490163891566527, + "is_interrupted": false + } + ] + }, + "DialogSum--val--193": { + "original_text": "A: Do you know what is the most special event in Kentucky? \nB: The world class horses or the Hollywood stars? \nA: Well, it's the hats. The hat parade is one of the most anticipated events during the Kentucky Derby [interrupt] where people showcase incredibly elaborate designs that often incorporate flowers, feathers, and even miniature horse sculptures to celebrate the rich tradition of the event. \nB: Oh, you mean the Kentucky Derby, right? I've heard about the famous hats there. How does the parade work? \nA: Yes, exactly! The hat parade is a big part of the Kentucky Derby. The hats are not only a fashion tradition in the southern part of America, they are also said to be good luck. By the way, you asked about different kinds of hats earlier—yes, there are many unique and extravagant designs. Some people even spend months planning and creating their hats just for this event. \nB: That sounds amazing! When does the hat parade take place?", + "cleaned_text": "A: Do you know what is the most special event in Kentucky? \nB: The world class horses or the Hollywood stars? \nA:Well, it's the hats. The hat parade is one of the most anticipated events during the Kentucky Derby where people showcase incredibly elaborate designs that often incorporate flowers, feathers, and even miniature horse sculptures to celebrate the rich tradition of the event.\nB: Oh, you mean the Kentucky Derby, right? I've heard about the famous hats there. How does the parade work? \nA: Yes, exactly! The hat parade is a big part of the Kentucky Derby. The hats are not only a fashion tradition in the southern part of America, they are also said to be good luck. By the way, you asked about different kinds of hats earlier—yes, there are many unique and extravagant designs. Some people even spend months planning and creating their hats just for this event. \nB: That sounds amazing! When does the hat parade take place?", + "total_duration": 48.441814058956915, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you know what is the most special event in Kentucky?", + "original_text": "Do you know what is the most special event in Kentucky?", + "start_time": 0, + "end_time": 3.030204081632653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The world class horses or the Hollywood stars?", + "original_text": "The world class horses or the Hollywood stars?", + "start_time": 3.628951710544644, + "end_time": 6.1018768806126715, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/temp/line_1_B.wav", + "silence_duration": 0.5987476289119907, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, it's the hats. The hat parade is one of the most anticipated events during the Kentucky Derby", + "original_text": "Well, it's the hats. The hat parade is one of the most anticipated events during the Kentucky Derby [interrupt] where people showcase incredibly elaborate designs that often incorporate flowers, feathers, and even miniature horse sculptures to celebrate the rich tradition of the event.", + "start_time": 6.654197815127365, + "end_time": 22.710796454583146, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/temp/line_2_A.wav", + "silence_duration": 0.5523209345146928, + "is_interrupted": true, + "text_after_interrupt": "where people showcase incredibly elaborate designs that often incorporate flowers, feathers, and even miniature horse sculptures to celebrate the rich tradition of the event." + }, + { + "speaker": "B", + "text": "Oh, you mean the Kentucky Derby, right? I've heard about the famous hats there. How does the parade work?", + "original_text": "Oh, you mean the Kentucky Derby, right? I've heard about the famous hats there. How does the parade work?", + "start_time": 12.807485796986775, + "end_time": 19.10009350673734, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/temp/line_3_B.wav", + "silence_duration": 0.32469422184421187, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, exactly! The hat parade is a big part of the Kentucky Derby. The hats are not only a fashion tradition in the southern part of America, they are also said to be good luck. By the way, you asked about different kinds of hats earlier—yes, there are many unique and extravagant designs. Some people even spend months planning and creating their hats just for this event.", + "original_text": "Yes, exactly! The hat parade is a big part of the Kentucky Derby. The hats are not only a fashion tradition in the southern part of America, they are also said to be good luck. By the way, you asked about different kinds of hats earlier—yes, there are many unique and extravagant designs. Some people even spend months planning and creating their hats just for this event.", + "start_time": 23.080888785530426, + "end_time": 44.9192561324692, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/temp/line_4_A.wav", + "silence_duration": 0.3700923309472811, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds amazing! When does the hat parade take place?", + "original_text": "That sounds amazing! When does the hat parade take place?", + "start_time": 45.4116269481262, + "end_time": 48.44183102975885, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--193/temp/line_5_B.wav", + "silence_duration": 0.4923708156569977, + "is_interrupted": false + } + ] + }, + "DialogSum--val--194": { + "original_text": "A: Excuse me, Miss Ames, can I ask you something? \nB: Sure, John. Ask me anything. \nA: OK, would you please oil your door? \nB: What? \nA: You always come home so late. And whenever you open the front door, it makes a lot of [interrupt] creaking sounds that wake me up and sometimes even startle me awake from deep sleep, which makes it really hard to fall back asleep afterward. \nB: Noise, right? I didn't realize it was that loud. But what do you mean by late? I come back around 11:00. That's not late at all. \nA: Well, you spend hours after that going in and out, in and out, until my head feels ready to burst. \nB: Oh, I'm so sorry to hear that. I'll see what I can do with the door this weekend. By the way, you mentioned something about the door making noise—was there anything else you wanted to say about that? \nA: No, that was it. Just the noise is really disturbing my sleep. \nB: Got it. I'll definitely take care of it.", + "cleaned_text": "A: Excuse me, Miss Ames, can I ask you something? \nB: Sure, John. Ask me anything. \nA: OK, would you please oil your door? \nB: What? \nA:You always come home so late. And whenever you open the front door, it makes a lot of creaking sounds that wake me up and sometimes even startle me awake from deep sleep, which makes it really hard to fall back asleep afterward.\nB: Noise, right? I didn't realize it was that loud. But what do you mean by late? I come back around 11:00. That's not late at all. \nA: Well, you spend hours after that going in and out, in and out, until my head feels ready to burst. \nB: Oh, I'm so sorry to hear that. I'll see what I can do with the door this weekend. By the way, you mentioned something about the door making noise—was there anything else you wanted to say about that? \nA: No, that was it. Just the noise is really disturbing my sleep. \nB: Got it. I'll definitely take care of it.", + "total_duration": 45.63492063492063, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, Miss Ames, can I ask you something?", + "original_text": "Excuse me, Miss Ames, can I ask you something?", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, John. Ask me anything.", + "original_text": "Sure, John. Ask me anything.", + "start_time": 3.0385599171053395, + "end_time": 4.687176697150691, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_1_B.wav", + "silence_duration": 0.44953497379468166, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, would you please oil your door?", + "original_text": "OK, would you please oil your door?", + "start_time": 5.224205935924459, + "end_time": 7.615861264722645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_2_A.wav", + "silence_duration": 0.5370292387737682, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What?", + "original_text": "What?", + "start_time": 7.960461420424877, + "end_time": 8.471300422692451, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_3_B.wav", + "silence_duration": 0.34460015570223157, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You always come home so late. And whenever you open the front door, it makes a lot of", + "original_text": "You always come home so late. And whenever you open the front door, it makes a lot of [interrupt] creaking sounds that wake me up and sometimes even startle me awake from deep sleep, which makes it really hard to fall back asleep afterward.", + "start_time": 9.068519864772668, + "end_time": 21.781445034840694, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_4_A.wav", + "silence_duration": 0.597219442080217, + "is_interrupted": true, + "text_after_interrupt": "creaking sounds that wake me up and sometimes even startle me awake from deep sleep, which makes it really hard to fall back asleep afterward." + }, + { + "speaker": "B", + "text": "Noise, right? I didn't realize it was that loud. But what do you mean by late? I come back around 11:00. That's not late at all.", + "original_text": "Noise, right? I didn't realize it was that loud. But what do you mean by late? I come back around 11:00. That's not late at all.", + "start_time": 13.805390613071989, + "end_time": 21.015186531439337, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_5_B.wav", + "silence_duration": 0.5910671220119714, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, you spend hours after that going in and out, in and out, until my head feels ready to burst.", + "original_text": "Well, you spend hours after that going in and out, in and out, until my head feels ready to burst.", + "start_time": 22.364234091069466, + "end_time": 29.063191007169237, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_6_A.wav", + "silence_duration": 0.5827890562287716, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I'm so sorry to hear that. I'll see what I can do with the door this weekend. By the way, you mentioned something about the door making noise—was there anything else you wanted to say about that?", + "original_text": "Oh, I'm so sorry to hear that. I'll see what I can do with the door this weekend. By the way, you mentioned something about the door making noise—was there anything else you wanted to say about that?", + "start_time": 29.424170082252232, + "end_time": 38.677322009689874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_7_B.wav", + "silence_duration": 0.3609790750829942, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, that was it. Just the noise is really disturbing my sleep.", + "original_text": "No, that was it. Just the noise is really disturbing my sleep.", + "start_time": 39.10219537162473, + "end_time": 42.97992779792859, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_8_A.wav", + "silence_duration": 0.4248733619348581, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. I'll definitely take care of it.", + "original_text": "Got it. I'll definitely take care of it.", + "start_time": 43.55674702768941, + "end_time": 45.63493296873249, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--194/temp/line_9_B.wav", + "silence_duration": 0.5768192297608257, + "is_interrupted": false + } + ] + }, + "DialogSum--val--195": { + "original_text": "A: Now, Mark, you're from Canada? \nB: That's right. \nA: Where is it actually that you grew up? \nB: I was born in Montreal and I lived there for 4 years. The first 4 years, but uh, I grew up in Calgary in Alberta. \nA: Ok, so what was your childhood like? Were you into nature or sports? \nB: When I was young, I was into books. I was a big reader. I used to go to the library with my [interrupt] older sister every weekend to check out new novels and explore different sections of the library, which really helped develop my love for literature at an early age.\nA: Sorry, just curious—what kind of books were you into back then? \nB: Mostly adventure and mystery novels. But as I was saying, I used to go to the library with my mother. \nA: Got it. So, when was your first trip abroad? Where did you go? \nB: The first big trip I took abroad was when I was 14. I went to Liverpool that time, where my mother is from and [interrupt] I got to meet a lot of my extended family for the first time while also experiencing British culture and traditions firsthand, which was incredibly eye-opening for a teenager from Canada.\nA: Oh, Liverpool! Did you get a chance to visit any Beatles landmarks while you were there? \nB: Yes, I did! But I was also going to mention that we visited Wales and Scotland on the 5 or 6 trips after that.", + "cleaned_text": "A: Now, Mark, you're from Canada? \nB: That's right. \nA: Where is it actually that you grew up? \nB: I was born in Montreal and I lived there for 4 years. The first 4 years, but uh, I grew up in Calgary in Alberta. \nA: Ok, so what was your childhood like? Were you into nature or sports? \nB:When I was young, I was into books. I was a big reader. I used to go to the library with my older sister every weekend to check out new novels and explore different sections of the library, which really helped develop my love for literature at an early age.\nA: Sorry, just curious—what kind of books were you into back then? \nB: Mostly adventure and mystery novels. But as I was saying, I used to go to the library with my mother. \nA: Got it. So, when was your first trip abroad? Where did you go? \nB:The first big trip I took abroad was when I was 14. I went to Liverpool that time, where my mother is from and I got to meet a lot of my extended family for the first time while also experiencing British culture and traditions firsthand, which was incredibly eye-opening for a teenager from Canada.\nA: Oh, Liverpool! Did you get a chance to visit any Beatles landmarks while you were there? \nB: Yes, I did! But I was also going to mention that we visited Wales and Scotland on the 5 or 6 trips after that.", + "total_duration": 65.09673469387755, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Now, Mark, you're from Canada?", + "original_text": "Now, Mark, you're from Canada?", + "start_time": 0, + "end_time": 1.7298866213151927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's right.", + "original_text": "That's right.", + "start_time": 2.076480922995312, + "end_time": 2.749859607802568, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_1_B.wav", + "silence_duration": 0.3465943016801192, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Where is it actually that you grew up?", + "original_text": "Where is it actually that you grew up?", + "start_time": 3.235117932742562, + "end_time": 5.313303873785646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_2_A.wav", + "silence_duration": 0.4852583249399942, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was born in Montreal and I lived there for 4 years. The first 4 years, but uh, I grew up in Calgary in Alberta.", + "original_text": "I was born in Montreal and I lived there for 4 years. The first 4 years, but uh, I grew up in Calgary in Alberta.", + "start_time": 5.845171522384781, + "end_time": 12.613788302430134, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_3_B.wav", + "silence_duration": 0.5318676485991349, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ok, so what was your childhood like? Were you into nature or sports?", + "original_text": "Ok, so what was your childhood like? Were you into nature or sports?", + "start_time": 12.945195563725882, + "end_time": 17.91426585851046, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_4_A.wav", + "silence_duration": 0.3314072612957474, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "When I was young, I was into books. I was a big reader. I used to go to the library with my", + "original_text": "When I was young, I was into books. I was a big reader. I used to go to the library with my [interrupt] older sister every weekend to check out new novels and explore different sections of the library, which really helped develop my love for literature at an early age.", + "start_time": 18.3809142111348, + "end_time": 31.209939154445458, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_5_B.wav", + "silence_duration": 0.4666483526243407, + "is_interrupted": true, + "text_after_interrupt": "older sister every weekend to check out new novels and explore different sections of the library, which really helped develop my love for literature at an early age." + }, + { + "speaker": "A", + "text": "Sorry, just curious—what kind of books were you into back then?", + "original_text": "Sorry, just curious—what kind of books were you into back then?", + "start_time": 23.37320446056791, + "end_time": 27.78499584378786, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_6_A.wav", + "silence_duration": 0.38931625947214316, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Mostly adventure and mystery novels. But as I was saying, I used to go to the library with my mother.", + "original_text": "Mostly adventure and mystery novels. But as I was saying, I used to go to the library with my mother.", + "start_time": 31.67813477744589, + "end_time": 37.25092389309215, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_7_B.wav", + "silence_duration": 0.4681956230004334, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. So, when was your first trip abroad? Where did you go?", + "original_text": "Got it. So, when was your first trip abroad? Where did you go?", + "start_time": 37.77755128460675, + "end_time": 42.607301851500175, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_8_A.wav", + "silence_duration": 0.5266273915145983, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The first big trip I took abroad was when I was 14. I went to Liverpool that time, where my mother is from and", + "original_text": "The first big trip I took abroad was when I was 14. I went to Liverpool that time, where my mother is from and [interrupt] I got to meet a lot of my extended family for the first time while also experiencing British culture and traditions firsthand, which was incredibly eye-opening for a teenager from Canada.", + "start_time": 43.17710008536124, + "end_time": 58.71124974522519, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_9_B.wav", + "silence_duration": 0.5697982338610619, + "is_interrupted": true, + "text_after_interrupt": "I got to meet a lot of my extended family for the first time while also experiencing British culture and traditions firsthand, which was incredibly eye-opening for a teenager from Canada." + }, + { + "speaker": "A", + "text": "Oh, Liverpool! Did you get a chance to visit any Beatles landmarks while you were there?", + "original_text": "Oh, Liverpool! Did you get a chance to visit any Beatles landmarks while you were there?", + "start_time": 53.80477966873738, + "end_time": 58.65775019027933, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_10_A.wav", + "silence_duration": 0.31114680494526425, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I did! But I was also going to mention that we visited Wales and Scotland on the 5 or 6 trips after that.", + "original_text": "Yes, I did! But I was also going to mention that we visited Wales and Scotland on the 5 or 6 trips after that.", + "start_time": 59.22212443405157, + "end_time": 65.09677296012867, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--195/temp/line_11_B.wav", + "silence_duration": 0.5108746888263872, + "is_interrupted": false + } + ] + }, + "DialogSum--val--196": { + "original_text": "A: Hi, David. How was your day? \nB: Don't ask, it was terrible. \nA: You poor thing. What on earth happened? \nB: Well, at about 11 o'clock this morning, I was skateboarding in the park [interrupt] and practicing some new tricks when suddenly I lost my balance completely. \nA: Oh, yes? Did you see Tony after you fell? I heard he was also planning to go skateboarding today. \nB: Sorry to interrupt, but no, luckily, I didn't see anyone I know. \nA: What do you mean 'luckily'? \nB: To start with, I wasn't looking where I was going and I fell off my skateboard. I landed in a pool. I was really dirty. \nA: Oh, no. What did you do? \nB: Well, I was getting on the bus to come home, when the driver shouted at me. He didn't let me on the bus because I was wet and dirty. And I didn't have any money for a cab or anything else [interrupt] so I had to figure out another way to get home while being completely soaked and covered in mud. \nA: Wait, you didn't have any money for a taxi? That must have made things even worse. How did you get home then? \nB: I walked all the way home.", + "cleaned_text": "A: Hi, David. How was your day? \nB: Don't ask, it was terrible. \nA: You poor thing. What on earth happened? \nB:Well, at about 11 o'clock this morning, I was skateboarding in the park and practicing some new tricks when suddenly I lost my balance completely.\nA: Oh, yes? Did you see Tony after you fell? I heard he was also planning to go skateboarding today. \nB: Sorry to interrupt, but no, luckily, I didn't see anyone I know. \nA: What do you mean 'luckily'? \nB: To start with, I wasn't looking where I was going and I fell off my skateboard. I landed in a pool. I was really dirty. \nA: Oh, no. What did you do? \nB:Well, I was getting on the bus to come home, when the driver shouted at me. He didn't let me on the bus because I was wet and dirty. And I didn't have any money for a cab or anything else so I had to figure out another way to get home while being completely soaked and covered in mud.\nA: Wait, you didn't have any money for a taxi? That must have made things even worse. How did you get home then? \nB: I walked all the way home.", + "total_duration": 55.06612244897959, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, David. How was your day?", + "original_text": "Hi, David. How was your day?", + "start_time": 0, + "end_time": 2.1942857142857144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't ask, it was terrible.", + "original_text": "Don't ask, it was terrible.", + "start_time": 2.7257367856261965, + "end_time": 4.4207934749686, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_1_B.wav", + "silence_duration": 0.5314510713404823, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You poor thing. What on earth happened?", + "original_text": "You poor thing. What on earth happened?", + "start_time": 4.901561685244095, + "end_time": 7.072627444881284, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_2_A.wav", + "silence_duration": 0.48076821027549543, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, at about 11 o'clock this morning, I was skateboarding in the park", + "original_text": "Well, at about 11 o'clock this morning, I was skateboarding in the park [interrupt] and practicing some new tricks when suddenly I lost my balance completely.", + "start_time": 7.434057603877953, + "end_time": 14.423263953084302, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_3_B.wav", + "silence_duration": 0.36143015899666914, + "is_interrupted": true, + "text_after_interrupt": "and practicing some new tricks when suddenly I lost my balance completely." + }, + { + "speaker": "A", + "text": "Oh, yes? Did you see Tony after you fell? I heard he was also planning to go skateboarding today.", + "original_text": "Oh, yes? Did you see Tony after you fell? I heard he was also planning to go skateboarding today.", + "start_time": 11.126030392993599, + "end_time": 17.325758284150062, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_4_A.wav", + "silence_duration": 0.3255396894587025, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but no, luckily, I didn't see anyone I know.", + "original_text": "Sorry to interrupt, but no, luckily, I didn't see anyone I know.", + "start_time": 17.679562384657707, + "end_time": 21.255435400530722, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_5_B.wav", + "silence_duration": 0.3538041005076464, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What do you mean 'luckily'?", + "original_text": "What do you mean 'luckily'?", + "start_time": 21.835145304265495, + "end_time": 23.91333124530858, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_6_A.wav", + "silence_duration": 0.5797099037347717, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "To start with, I wasn't looking where I was going and I fell off my skateboard. I landed in a pool. I was really dirty.", + "original_text": "To start with, I wasn't looking where I was going and I fell off my skateboard. I landed in a pool. I was really dirty.", + "start_time": 24.35722523073728, + "end_time": 30.649832940487848, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_7_B.wav", + "silence_duration": 0.44389398542870273, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, no. What did you do?", + "original_text": "Oh, no. What did you do?", + "start_time": 31.24926447429727, + "end_time": 33.25779055139478, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_8_A.wav", + "silence_duration": 0.5994315338094235, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I was getting on the bus to come home, when the driver shouted at me. He didn't let me on the bus because I was wet and dirty. And I didn't have any money for a cab or anything else", + "original_text": "Well, I was getting on the bus to come home, when the driver shouted at me. He didn't let me on the bus because I was wet and dirty. And I didn't have any money for a cab or anything else [interrupt] so I had to figure out another way to get home while being completely soaked and covered in mud.", + "start_time": 33.832167856046915, + "end_time": 47.78736059981109, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_9_B.wav", + "silence_duration": 0.5743773046521349, + "is_interrupted": true, + "text_after_interrupt": "so I had to figure out another way to get home while being completely soaked and covered in mud." + }, + { + "speaker": "A", + "text": "Wait, you didn't have any money for a taxi? That must have made things even worse. How did you get home then?", + "original_text": "Wait, you didn't have any money for a taxi? That must have made things even worse. How did you get home then?", + "start_time": 46.16829480395041, + "end_time": 53.50580047288465, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_10_A.wav", + "silence_duration": 0.5723647831551169, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I walked all the way home.", + "original_text": "I walked all the way home.", + "start_time": 53.81225502257701, + "end_time": 55.06613257359742, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--196/temp/line_11_B.wav", + "silence_duration": 0.3064545496923629, + "is_interrupted": false + } + ] + }, + "DialogSum--val--197": { + "original_text": "A: You look upset. Are you OK, Tommy? \nB: I'm fine, mom. It's just your cellphone. You lent it to me this morning. \nA: Yes, is something wrong with it? No, don't tell me you dropped and [interrupt] cracked the screen or something like that because I just got this phone last month and it was quite expensive. \nB: No, I was texting Jack outside a store and somebody ran past and grabbed it. \nA: You mean someone stole my phone? \nB: I am afraid so. Everything just happened so suddenly. I was too [interrupt] shocked to react quickly enough to stop them from disappearing into the crowd before I could even shout for help. \nA: Wait, did you see who it was? Any details? \nB: No. It was someone in a white shirt. But there's a camera on the entrance. It might have got a shot of the thief's face. \nA: You've reported it then? \nB: Well, not yet. I was too shocked earlier to think clearly, but I'll do it tomorrow. \nA: Tomorrow? Tommy, turn to a policeman nearby right now. I'll have a look at the insurance and see if it's covered. \nB: OK, I will.", + "cleaned_text": "A: You look upset. Are you OK, Tommy? \nB: I'm fine, mom. It's just your cellphone. You lent it to me this morning. \nA:Yes, is something wrong with it? No, don't tell me you dropped and cracked the screen or something like that because I just got this phone last month and it was quite expensive.\nB: No, I was texting Jack outside a store and somebody ran past and grabbed it. \nA: You mean someone stole my phone? \nB:I am afraid so. Everything just happened so suddenly. I was too shocked to react quickly enough to stop them from disappearing into the crowd before I could even shout for help.\nA: Wait, did you see who it was? Any details? \nB: No. It was someone in a white shirt. But there's a camera on the entrance. It might have got a shot of the thief's face. \nA: You've reported it then? \nB: Well, not yet. I was too shocked earlier to think clearly, but I'll do it tomorrow. \nA: Tomorrow? Tommy, turn to a policeman nearby right now. I'll have a look at the insurance and see if it's covered. \nB: OK, I will.", + "total_duration": 56.22081632653061, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You look upset. Are you OK, Tommy?", + "original_text": "You look upset. Are you OK, Tommy?", + "start_time": 0, + "end_time": 2.7980045351473923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm fine, mom. It's just your cellphone. You lent it to me this morning.", + "original_text": "I'm fine, mom. It's just your cellphone. You lent it to me this morning.", + "start_time": 3.130889631286666, + "end_time": 7.345311399994149, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_1_B.wav", + "silence_duration": 0.3328850961392734, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, is something wrong with it? No, don't tell me you dropped and", + "original_text": "Yes, is something wrong with it? No, don't tell me you dropped and [interrupt] cracked the screen or something like that because I just got this phone last month and it was quite expensive.", + "start_time": 7.896013563593396, + "end_time": 18.426262996699972, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_2_A.wav", + "silence_duration": 0.5507021635992468, + "is_interrupted": true, + "text_after_interrupt": "cracked the screen or something like that because I just got this phone last month and it was quite expensive." + }, + { + "speaker": "B", + "text": "No, I was texting Jack outside a store and somebody ran past and grabbed it.", + "original_text": "No, I was texting Jack outside a store and somebody ran past and grabbed it.", + "start_time": 13.1088933821875, + "end_time": 17.62517456132582, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_3_B.wav", + "silence_duration": 0.35717638901973175, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You mean someone stole my phone?", + "original_text": "You mean someone stole my phone?", + "start_time": 18.9646480564552, + "end_time": 20.833854405661548, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_4_A.wav", + "silence_duration": 0.5383850597552293, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I am afraid so. Everything just happened so suddenly. I was too", + "original_text": "I am afraid so. Everything just happened so suddenly. I was too [interrupt] shocked to react quickly enough to stop them from disappearing into the crowd before I could even shout for help.", + "start_time": 21.430738346803505, + "end_time": 30.08017145337947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_5_B.wav", + "silence_duration": 0.5968839411419573, + "is_interrupted": true, + "text_after_interrupt": "shocked to react quickly enough to stop them from disappearing into the crowd before I could even shout for help." + }, + { + "speaker": "A", + "text": "Wait, did you see who it was? Any details?", + "original_text": "Wait, did you see who it was? Any details?", + "start_time": 29.845307028279247, + "end_time": 33.87396915979852, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_6_A.wav", + "silence_duration": 0.5448319680536987, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. It was someone in a white shirt. But there's a camera on the entrance. It might have got a shot of the thief's face.", + "original_text": "No. It was someone in a white shirt. But there's a camera on the entrance. It might have got a shot of the thief's face.", + "start_time": 34.40686485217138, + "end_time": 40.78074240319179, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_7_B.wav", + "silence_duration": 0.5328956923728624, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You've reported it then?", + "original_text": "You've reported it then?", + "start_time": 41.13682631794103, + "end_time": 42.47197371023128, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_8_A.wav", + "silence_duration": 0.35608391474924417, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, not yet. I was too shocked earlier to think clearly, but I'll do it tomorrow.", + "original_text": "Well, not yet. I was too shocked earlier to think clearly, but I'll do it tomorrow.", + "start_time": 43.05956580958612, + "end_time": 47.21593769167229, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_9_B.wav", + "silence_duration": 0.5875920993548356, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Tomorrow? Tommy, turn to a policeman nearby right now. I'll have a look at the insurance and see if it's covered.", + "original_text": "Tomorrow? Tommy, turn to a policeman nearby right now. I'll have a look at the insurance and see if it's covered.", + "start_time": 47.64836275549456, + "end_time": 54.38214960356712, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_10_A.wav", + "silence_duration": 0.43242506382227025, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK, I will.", + "original_text": "OK, I will.", + "start_time": 54.96695006464633, + "end_time": 56.22082761566674, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--197/temp/line_11_B.wav", + "silence_duration": 0.5848004610792146, + "is_interrupted": false + } + ] + }, + "DialogSum--val--198": { + "original_text": "A: I like this table, it looks very strong. Do you think it will look good in your new house?\nB: I don't think so. My new house is by the beach. I want something that looks like it belongs by the [interrupt] sea, something that really captures that coastal essence with weathered wood textures and soft, ocean-inspired color tones that complement the natural surroundings.\nA: Sorry to interrupt, but what kind of beach style are you aiming for? Something more rustic or modern?\nB: I'm thinking more along the lines of a rustic, coastal vibe. But I also want something light, like the color of sand. What about this one? It looks good.\nA: It's too dark. I want something that matches that beachy feel. You're very picky. This one?\nB: No, it looks too weak, and it's way too dark.\nA: Alright then, how about this table? It's strong and light.\nB: Um... Maybe, I'll have to think about it. But it also has to be big enough for the space. It shouldn't feel too cramped in the room.", + "cleaned_text": "A: I like this table, it looks very strong. Do you think it will look good in your new house?\nB:I don't think so. My new house is by the beach. I want something that looks like it belongs by the sea, something that really captures that coastal essence with weathered wood textures and soft, ocean-inspired color tones that complement the natural surroundings.\nA: Sorry to interrupt, but what kind of beach style are you aiming for? Something more rustic or modern?\nB: I'm thinking more along the lines of a rustic, coastal vibe. But I also want something light, like the color of sand. What about this one? It looks good.\nA: It's too dark. I want something that matches that beachy feel. You're very picky. This one?\nB: No, it looks too weak, and it's way too dark.\nA: Alright then, how about this table? It's strong and light.\nB: Um... Maybe, I'll have to think about it. But it also has to be big enough for the space. It shouldn't feel too cramped in the room.", + "total_duration": 49.48086167800454, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I like this table, it looks very strong. Do you think it will look good in your new house?", + "original_text": "I like this table, it looks very strong. Do you think it will look good in your new house?", + "start_time": 0, + "end_time": 5.352199546485261, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't think so. My new house is by the beach. I want something that looks like it belongs by the", + "original_text": "I don't think so. My new house is by the beach. I want something that looks like it belongs by the [interrupt] sea, something that really captures that coastal essence with weathered wood textures and soft, ocean-inspired color tones that complement the natural surroundings.", + "start_time": 5.880141328107928, + "end_time": 19.278055160307474, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_1_B.wav", + "silence_duration": 0.5279417816226663, + "is_interrupted": true, + "text_after_interrupt": "sea, something that really captures that coastal essence with weathered wood textures and soft, ocean-inspired color tones that complement the natural surroundings." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but what kind of beach style are you aiming for? Something more rustic or modern?", + "original_text": "Sorry to interrupt, but what kind of beach style are you aiming for? Something more rustic or modern?", + "start_time": 10.62862205373151, + "end_time": 16.839959922212238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_2_A.wav", + "silence_duration": 0.35376173321552123, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm thinking more along the lines of a rustic, coastal vibe. But I also want something light, like the color of sand. What about this one? It looks good.", + "original_text": "I'm thinking more along the lines of a rustic, coastal vibe. But I also want something light, like the color of sand. What about this one? It looks good.", + "start_time": 19.81894863928131, + "end_time": 28.07364251683233, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_3_B.wav", + "silence_duration": 0.5408934789738342, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's too dark. I want something that matches that beachy feel. You're very picky. This one?", + "original_text": "It's too dark. I want something that matches that beachy feel. You're very picky. This one?", + "start_time": 28.664647828676667, + "end_time": 34.759885923914766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_4_A.wav", + "silence_duration": 0.5910053118443377, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, it looks too weak, and it's way too dark.", + "original_text": "No, it looks too weak, and it's way too dark.", + "start_time": 35.1335943581252, + "end_time": 37.74583925608439, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_5_B.wav", + "silence_duration": 0.3737084342104364, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Alright then, how about this table? It's strong and light.", + "original_text": "Alright then, how about this table? It's strong and light.", + "start_time": 38.255032418582026, + "end_time": 41.854125389103565, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_6_A.wav", + "silence_duration": 0.5091931624976376, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Um... Maybe, I'll have to think about it. But it also has to be big enough for the space. It shouldn't feel too cramped in the room.", + "original_text": "Um... Maybe, I'll have to think about it. But it also has to be big enough for the space. It shouldn't feel too cramped in the room.", + "start_time": 42.42199868808464, + "end_time": 49.48086490123657, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--198/temp/line_7_B.wav", + "silence_duration": 0.5678732989810773, + "is_interrupted": false + } + ] + }, + "DialogSum--val--199": { + "original_text": "A: Hello Mabel Hotel. What can I do for you? \nB: Hello, this is George Damon. Our company will be having a sales meeting in January, and we need to book a room for about 200 people. Does your hotel have something that can accommodate that [interrupt] size and also provide a comfortable setting for such a large group? We're particularly interested in spaces with good acoustics and flexible seating arrangements to facilitate different presentation formats. \nA: Sorry to jump in, but just to clarify, will you also need catering services for the meeting? \nB: Not at this time, but we'll need chairs, a stage, and a projection screen. \nA: Then I would suggest room 13. \nB: Well, I don't like the room [interrupt] because it feels a bit too small and lacks natural lighting, which is important for creating an energizing atmosphere during our full-day training sessions and product demonstrations. \nA: Ah, got it. Room 19 and room 26 are also available. \nB: I prefer something ending with nine.", + "cleaned_text": "A: Hello Mabel Hotel. What can I do for you? \nB:Hello, this is George Damon. Our company will be having a sales meeting in January, and we need to book a room for about 200 people. Does your hotel have something that can accommodate that size and also provide a comfortable setting for such a large group? We're particularly interested in spaces with good acoustics and flexible seating arrangements to facilitate different presentation formats.\nA: Sorry to jump in, but just to clarify, will you also need catering services for the meeting? \nB: Not at this time, but we'll need chairs, a stage, and a projection screen. \nA: Then I would suggest room 13. \nB:Well, I don't like the room because it feels a bit too small and lacks natural lighting, which is important for creating an energizing atmosphere during our full-day training sessions and product demonstrations.\nA: Ah, got it. Room 19 and room 26 are also available. \nB: I prefer something ending with nine.", + "total_duration": 44.51514739229025, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello Mabel Hotel. What can I do for you?", + "original_text": "Hello Mabel Hotel. What can I do for you?", + "start_time": 0, + "end_time": 2.716734693877551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hello, this is George Damon. Our company will be having a sales meeting in January, and we need to book a room for about 200 people. Does your hotel have something that can accommodate that", + "original_text": "Hello, this is George Damon. Our company will be having a sales meeting in January, and we need to book a room for about 200 people. Does your hotel have something that can accommodate that [interrupt] size and also provide a comfortable setting for such a large group? We're particularly interested in spaces with good acoustics and flexible seating arrangements to facilitate different presentation formats.", + "start_time": 3.165486691339397, + "end_time": 23.599046782042343, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_1_B.wav", + "silence_duration": 0.4487519974618455, + "is_interrupted": true, + "text_after_interrupt": "size and also provide a comfortable setting for such a large group? We're particularly interested in spaces with good acoustics and flexible seating arrangements to facilitate different presentation formats." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but just to clarify, will you also need catering services for the meeting?", + "original_text": "Sorry to jump in, but just to clarify, will you also need catering services for the meeting?", + "start_time": 13.41709666866366, + "end_time": 18.98988578430992, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_2_A.wav", + "silence_duration": 0.31729411747284075, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not at this time, but we'll need chairs, a stage, and a projection screen.", + "original_text": "Not at this time, but we'll need chairs, a stage, and a projection screen.", + "start_time": 23.984022530556445, + "end_time": 27.455405750511094, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_3_B.wav", + "silence_duration": 0.3849757485141002, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Then I would suggest room 13.", + "original_text": "Then I would suggest room 13.", + "start_time": 27.92515368025878, + "end_time": 29.956899712004812, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_4_A.wav", + "silence_duration": 0.46974792974768526, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I don't like the room", + "original_text": "Well, I don't like the room [interrupt] because it feels a bit too small and lacks natural lighting, which is important for creating an energizing atmosphere during our full-day training sessions and product demonstrations.", + "start_time": 30.30403082096681, + "end_time": 40.54403082096681, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_5_B.wav", + "silence_duration": 0.34713110896199567, + "is_interrupted": true, + "text_after_interrupt": "because it feels a bit too small and lacks natural lighting, which is important for creating an energizing atmosphere during our full-day training sessions and product demonstrations." + }, + { + "speaker": "A", + "text": "Ah, got it. Room 19 and room 26 are also available.", + "original_text": "Ah, got it. Room 19 and room 26 are also available.", + "start_time": 37.82089100940289, + "end_time": 42.13980257402874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_6_A.wav", + "silence_duration": 0.3041380661294688, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I prefer something ending with nine.", + "original_text": "I prefer something ending with nine.", + "start_time": 42.68080611668038, + "end_time": 44.515182533913936, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--199/temp/line_7_B.wav", + "silence_duration": 0.5410035426516395, + "is_interrupted": false + } + ] + }, + "DialogSum--val--200": { + "original_text": "A: So, to start with, I want to talk about a very successful invention, the bicycle. Why? Do you know what the main advantages of bikes [interrupt] are in terms of sustainability and health benefits? They significantly reduce carbon emissions compared to motorized transport while providing excellent cardiovascular exercise and improving overall physical fitness.\nB: They don't cost much?\nA: Yes, and they're not complicated. They're easy to use. Yeah? They're also incredibly versatile, allowing people to navigate through urban environments [interrupt] with ease while avoiding traffic congestion and parking hassles that come with cars.\nB: Not easy when you're going uphill. Let's say simple.\nA: OK. Yeah. They're cheap to run. They don't often [interrupt] require fuel, and maintenance is minimal compared to other vehicles, making them an economical choice for both short commutes and longer recreational rides.\nB: Sorry, just to clarify, when you say \"cheap to run,\" are you also considering maintenance costs?\nA: Yes, maintenance is part of that. I was actually going to mention that they're also safe, especially in low-traffic areas [interrupt] where dedicated bike lanes are available, and studies show they contribute to reduced accident rates when proper infrastructure is in place.", + "cleaned_text": "A:So, to start with, I want to talk about a very successful invention, the bicycle. Why? Do you know what the main advantages of bikes are in terms of sustainability and health benefits? They significantly reduce carbon emissions compared to motorized transport while providing excellent cardiovascular exercise and improving overall physical fitness.\nB: They don't cost much?\nA:Yes, and they're not complicated. They're easy to use. Yeah? They're also incredibly versatile, allowing people to navigate through urban environments with ease while avoiding traffic congestion and parking hassles that come with cars.\nB: Not easy when you're going uphill. Let's say simple.\nA:OK. Yeah. They're cheap to run. They don't often require fuel, and maintenance is minimal compared to other vehicles, making them an economical choice for both short commutes and longer recreational rides.\nB: Sorry, just to clarify, when you say \"cheap to run,\" are you also considering maintenance costs?\nA:Yes, maintenance is part of that. I was actually going to mention that they're also safe, especially in low-traffic areas where dedicated bike lanes are available, and studies show they contribute to reduced accident rates when proper infrastructure is in place.", + "total_duration": 65.56362811791384, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So, to start with, I want to talk about a very successful invention, the bicycle. Why? Do you know what the main advantages of bikes", + "original_text": "So, to start with, I want to talk about a very successful invention, the bicycle. Why? Do you know what the main advantages of bikes [interrupt] are in terms of sustainability and health benefits? They significantly reduce carbon emissions compared to motorized transport while providing excellent cardiovascular exercise and improving overall physical fitness.", + "start_time": 0, + "end_time": 20.21297052154195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "are in terms of sustainability and health benefits? They significantly reduce carbon emissions compared to motorized transport while providing excellent cardiovascular exercise and improving overall physical fitness." + }, + { + "speaker": "B", + "text": "They don't cost much?", + "original_text": "They don't cost much?", + "start_time": 8.916462585034013, + "end_time": 10.065850340136054, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/temp/line_1_B.wav", + "silence_duration": 0.41796747514758203, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, and they're not complicated. They're easy to use. Yeah? They're also incredibly versatile, allowing people to navigate through urban environments", + "original_text": "Yes, and they're not complicated. They're easy to use. Yeah? They're also incredibly versatile, allowing people to navigate through urban environments [interrupt] with ease while avoiding traffic congestion and parking hassles that come with cars.", + "start_time": 20.725321158356316, + "end_time": 34.40187444633818, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/temp/line_2_A.wav", + "silence_duration": 0.5123506368143635, + "is_interrupted": true, + "text_after_interrupt": "with ease while avoiding traffic congestion and parking hassles that come with cars." + }, + { + "speaker": "B", + "text": "Not easy when you're going uphill. Let's say simple.", + "original_text": "Not easy when you're going uphill. Let's say simple.", + "start_time": 31.051268171875925, + "end_time": 33.70995297913216, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/temp/line_3_B.wav", + "silence_duration": 0.5366642365032068, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. Yeah. They're cheap to run. They don't often", + "original_text": "OK. Yeah. They're cheap to run. They don't often [interrupt] require fuel, and maintenance is minimal compared to other vehicles, making them an economical choice for both short commutes and longer recreational rides.", + "start_time": 34.909017865840994, + "end_time": 47.45940335336934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/temp/line_4_A.wav", + "silence_duration": 0.5071434195028178, + "is_interrupted": true, + "text_after_interrupt": "require fuel, and maintenance is minimal compared to other vehicles, making them an economical choice for both short commutes and longer recreational rides." + }, + { + "speaker": "B", + "text": "Sorry, just to clarify, when you say \"cheap to run,\" are you also considering maintenance costs?", + "original_text": "Sorry, just to clarify, when you say \"cheap to run,\" are you also considering maintenance costs?", + "start_time": 43.519687377467754, + "end_time": 48.75578715071038, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/temp/line_5_B.wav", + "silence_duration": 0.5737115823297699, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, maintenance is part of that. I was actually going to mention that they're also safe, especially in low-traffic areas", + "original_text": "Yes, maintenance is part of that. I was actually going to mention that they're also safe, especially in low-traffic areas [interrupt] where dedicated bike lanes are available, and studies show they contribute to reduced accident rates when proper infrastructure is in place.", + "start_time": 49.332906945500824, + "end_time": 65.56365524482055, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--200/temp/line_6_A.wav", + "silence_duration": 0.5771197947904433, + "is_interrupted": true, + "text_after_interrupt": "where dedicated bike lanes are available, and studies show they contribute to reduced accident rates when proper infrastructure is in place." + } + ] + }, + "DialogSum--val--201": { + "original_text": "A: Hi, Sam. I want to buy a pet. Do you have any ideas? \nB: You really should go to Rachel's pet store. \nA: Why? Anything special there? \nB: It's more than special. You can find as many kinds of animals as you can put a name to and [interrupt] even some that you might not expect to see in a typical pet store, like rare tropical birds, miniature pigs, and even some legally-kept exotic species that require special permits. \nA: Oh, really? Are there any snakes? \nB: Snakes? There are even rodents and monkeys! It's a world of exotic pets. \nA: That's terrific. I can't wait to check it out. \nB: Hang on. Are you sure you want to keep a non-traditional pet? \nA: Why not? It's so cool. \nB: But it will pose a risk to your health. \nA: Pardon? \nB: I mean, most reptiles carry some harmful bacteria. They are likely to cause immune system problems. By the way, you mentioned snakes earlier—did you want to ask something else about them?", + "cleaned_text": "A: Hi, Sam. I want to buy a pet. Do you have any ideas? \nB: You really should go to Rachel's pet store. \nA: Why? Anything special there? \nB:It's more than special. You can find as many kinds of animals as you can put a name to and even some that you might not expect to see in a typical pet store, like rare tropical birds, miniature pigs, and even some legally-kept exotic species that require special permits.\nA: Oh, really? Are there any snakes? \nB: Snakes? There are even rodents and monkeys! It's a world of exotic pets. \nA: That's terrific. I can't wait to check it out. \nB: Hang on. Are you sure you want to keep a non-traditional pet? \nA: Why not? It's so cool. \nB: But it will pose a risk to your health. \nA: Pardon? \nB: I mean, most reptiles carry some harmful bacteria. They are likely to cause immune system problems. By the way, you mentioned snakes earlier—did you want to ask something else about them?", + "total_duration": 51.03569160997733, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, Sam. I want to buy a pet. Do you have any ideas?", + "original_text": "Hi, Sam. I want to buy a pet. Do you have any ideas?", + "start_time": 0, + "end_time": 3.889342403628118, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You really should go to Rachel's pet store.", + "original_text": "You really should go to Rachel's pet store.", + "start_time": 4.37882757105017, + "end_time": 6.457013512093254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_1_B.wav", + "silence_duration": 0.4894851674220523, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why? Anything special there?", + "original_text": "Why? Anything special there?", + "start_time": 6.962836276362873, + "end_time": 8.773992738947907, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_2_A.wav", + "silence_duration": 0.5058227642696191, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's more than special. You can find as many kinds of animals as you can put a name to and", + "original_text": "It's more than special. You can find as many kinds of animals as you can put a name to and [interrupt] even some that you might not expect to see in a typical pet store, like rare tropical birds, miniature pigs, and even some legally-kept exotic species that require special permits.", + "start_time": 9.136568597929763, + "end_time": 23.974119618337927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_3_B.wav", + "silence_duration": 0.3625758589818559, + "is_interrupted": true, + "text_after_interrupt": "even some that you might not expect to see in a typical pet store, like rare tropical birds, miniature pigs, and even some legally-kept exotic species that require special permits." + }, + { + "speaker": "A", + "text": "Oh, really? Are there any snakes?", + "original_text": "Oh, really? Are there any snakes?", + "start_time": 13.768949550310715, + "end_time": 15.742645695435431, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_4_A.wav", + "silence_duration": 0.4854492220997497, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Snakes? There are even rodents and monkeys! It's a world of exotic pets.", + "original_text": "Snakes? There are even rodents and monkeys! It's a world of exotic pets.", + "start_time": 24.498036224085162, + "end_time": 29.049147335196274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_5_B.wav", + "silence_duration": 0.5239166057472364, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's terrific. I can't wait to check it out.", + "original_text": "That's terrific. I can't wait to check it out.", + "start_time": 29.397723668952025, + "end_time": 32.59046743312436, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_6_A.wav", + "silence_duration": 0.34857633375575137, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hang on. Are you sure you want to keep a non-traditional pet?", + "original_text": "Hang on. Are you sure you want to keep a non-traditional pet?", + "start_time": 32.92737775232209, + "end_time": 36.17817140311574, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_7_B.wav", + "silence_duration": 0.3369103191977297, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why not? It's so cool.", + "original_text": "Why not? It's so cool.", + "start_time": 36.52133910182145, + "end_time": 38.471815292297634, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_8_A.wav", + "silence_duration": 0.3431676987057055, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But it will pose a risk to your health.", + "original_text": "But it will pose a risk to your health.", + "start_time": 38.817243226466935, + "end_time": 40.4310300745395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_9_B.wav", + "silence_duration": 0.34542793416929995, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Pardon?", + "original_text": "Pardon?", + "start_time": 40.968406385676325, + "end_time": 41.60695513851079, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_10_A.wav", + "silence_duration": 0.5373763111368256, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I mean, most reptiles carry some harmful bacteria. They are likely to cause immune system problems. By the way, you mentioned snakes earlier—did you want to ask something else about them?", + "original_text": "I mean, most reptiles carry some harmful bacteria. They are likely to cause immune system problems. By the way, you mentioned snakes earlier—did you want to ask something else about them?", + "start_time": 42.20052470207817, + "end_time": 51.035717445842344, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--201/temp/line_11_B.wav", + "silence_duration": 0.5935695635673762, + "is_interrupted": false + } + ] + }, + "DialogSum--val--204": { + "original_text": "A: I believe you have charged me twice for the same thing. Look, the figure of 6.5 dollar appears here, then again [interrupt] further down on the bill, which seems like a duplicate charge and is causing my total to be significantly higher than what I expected to pay for my purchase today.\nB: Oh, I apologize for that. Let me take a closer look. Could you show me where exactly the duplicate charge is? \nA: Sure, it's right here. I was pointing out that the 6.5 dollar charge appears twice, once here and then again further down. \nB: I'll just go and check it for you, sir. I'll also verify if there might be any other discrepancies in your bill while I'm at it to ensure everything is accurate.", + "cleaned_text": "A:I believe you have charged me twice for the same thing. Look, the figure of 6.5 dollar appears here, then again further down on the bill, which seems like a duplicate charge and is causing my total to be significantly higher than what I expected to pay for my purchase today.\nB: Oh, I apologize for that. Let me take a closer look. Could you show me where exactly the duplicate charge is? \nA: Sure, it's right here. I was pointing out that the 6.5 dollar charge appears twice, once here and then again further down. \nB: I'll just go and check it for you, sir. I'll also verify if there might be any other discrepancies in your bill while I'm at it to ensure everything is accurate.", + "total_duration": 33.57174603174603, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--204/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--204/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--204/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I believe you have charged me twice for the same thing. Look, the figure of 6.5 dollar appears here, then again", + "original_text": "I believe you have charged me twice for the same thing. Look, the figure of 6.5 dollar appears here, then again [interrupt] further down on the bill, which seems like a duplicate charge and is causing my total to be significantly higher than what I expected to pay for my purchase today.", + "start_time": 0, + "end_time": 16.89251700680272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--204/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "further down on the bill, which seems like a duplicate charge and is causing my total to be significantly higher than what I expected to pay for my purchase today." + }, + { + "speaker": "B", + "text": "Oh, I apologize for that. Let me take a closer look. Could you show me where exactly the duplicate charge is?", + "original_text": "Oh, I apologize for that. Let me take a closer look. Could you show me where exactly the duplicate charge is?", + "start_time": 7.894784580498866, + "end_time": 13.653333333333332, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--204/temp/line_1_B.wav", + "silence_duration": 0.42075840273930304, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, it's right here. I was pointing out that the 6.5 dollar charge appears twice, once here and then again further down.", + "original_text": "Sure, it's right here. I was pointing out that the 6.5 dollar charge appears twice, once here and then again further down.", + "start_time": 17.307155852291096, + "end_time": 25.22516038743849, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--204/temp/line_2_A.wav", + "silence_duration": 0.41463884548837515, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll just go and check it for you, sir. I'll also verify if there might be any other discrepancies in your bill while I'm at it to ensure everything is accurate.", + "original_text": "I'll just go and check it for you, sir. I'll also verify if there might be any other discrepancies in your bill while I'm at it to ensure everything is accurate.", + "start_time": 25.781460339384505, + "end_time": 33.571755123965005, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--204/temp/line_3_B.wav", + "silence_duration": 0.5562999519460159, + "is_interrupted": false + } + ] + }, + "DialogSum--val--205": { + "original_text": "A: How are you doing, Christopher? \nB: To be honest, I'm really fed up with work at the moment. I need a break! \nA: Are you doing anything this weekend? \nB: I have to work on Saturday all day! I really [interrupt] need some time to relax, but there's just too much to do and I feel completely overwhelmed by all the deadlines piling up. \nA: Oh no, working on the weekend must be exhausting! But what about Sunday, are you available then? \nB: Yes, that's my only day off until Thursday. \nA: Okay, well, my friends and I are planning on going to the beach on Sunday. We tend to leave around noon whenever we go anywhere, so you could still sleep in. Do you want to come with us? \nB: That'd be fantastic! Which beach are you [interrupt] thinking of going to? I'd love to know more details about the location and what kind of activities we might be doing there. \nA: Sorry, I forgot to say—it's a quiet beach just about an hour outside of the city. \nB: Sounds perfect! What should I bring with me? \nA: We've got plenty of inflatables, but if you want to sit on a chair, you'll have to bring your own sunlounger. \nB: I can just use my beach towel. I love lazing around in the sun.", + "cleaned_text": "A: How are you doing, Christopher? \nB: To be honest, I'm really fed up with work at the moment. I need a break! \nA: Are you doing anything this weekend? \nB:I have to work on Saturday all day! I really need some time to relax, but there's just too much to do and I feel completely overwhelmed by all the deadlines piling up.\nA: Oh no, working on the weekend must be exhausting! But what about Sunday, are you available then? \nB: Yes, that's my only day off until Thursday. \nA: Okay, well, my friends and I are planning on going to the beach on Sunday. We tend to leave around noon whenever we go anywhere, so you could still sleep in. Do you want to come with us? \nB:That'd be fantastic! Which beach are you thinking of going to? I'd love to know more details about the location and what kind of activities we might be doing there.\nA: Sorry, I forgot to say—it's a quiet beach just about an hour outside of the city. \nB: Sounds perfect! What should I bring with me? \nA: We've got plenty of inflatables, but if you want to sit on a chair, you'll have to bring your own sunlounger. \nB: I can just use my beach towel. I love lazing around in the sun.", + "total_duration": 59.17922902494331, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How are you doing, Christopher?", + "original_text": "How are you doing, Christopher?", + "start_time": 0, + "end_time": 1.497687074829932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "To be honest, I'm really fed up with work at the moment. I need a break!", + "original_text": "To be honest, I'm really fed up with work at the moment. I need a break!", + "start_time": 2.0056020608694, + "end_time": 5.337665552932892, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_1_B.wav", + "silence_duration": 0.5079149860394677, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you doing anything this weekend?", + "original_text": "Are you doing anything this weekend?", + "start_time": 5.654563242364885, + "end_time": 7.593429455516812, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_2_A.wav", + "silence_duration": 0.31689768943199303, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have to work on Saturday all day! I really", + "original_text": "I have to work on Saturday all day! I really [interrupt] need some time to relax, but there's just too much to do and I feel completely overwhelmed by all the deadlines piling up.", + "start_time": 8.123521429774975, + "end_time": 16.85422437762078, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_3_B.wav", + "silence_duration": 0.5300919742581625, + "is_interrupted": true, + "text_after_interrupt": "need some time to relax, but there's just too much to do and I feel completely overwhelmed by all the deadlines piling up." + }, + { + "speaker": "A", + "text": "Oh no, working on the weekend must be exhausting! But what about Sunday, are you available then?", + "original_text": "Oh no, working on the weekend must be exhausting! But what about Sunday, are you available then?", + "start_time": 10.956355896895156, + "end_time": 16.807784468323728, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_4_A.wav", + "silence_duration": 0.3975680038169999, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that's my only day off until Thursday.", + "original_text": "Yes, that's my only day off until Thursday.", + "start_time": 17.287926713518534, + "end_time": 19.67958204231672, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_5_B.wav", + "silence_duration": 0.4337023358977534, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Okay, well, my friends and I are planning on going to the beach on Sunday. We tend to leave around noon whenever we go anywhere, so you could still sleep in. Do you want to come with us?", + "original_text": "Okay, well, my friends and I are planning on going to the beach on Sunday. We tend to leave around noon whenever we go anywhere, so you could still sleep in. Do you want to come with us?", + "start_time": 20.22745722734729, + "end_time": 31.547185118503755, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_6_A.wav", + "silence_duration": 0.5478751850305711, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That'd be fantastic! Which beach are you", + "original_text": "That'd be fantastic! Which beach are you [interrupt] thinking of going to? I'd love to know more details about the location and what kind of activities we might be doing there.", + "start_time": 31.886325726947312, + "end_time": 39.67662051152781, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_7_B.wav", + "silence_duration": 0.33914060844355615, + "is_interrupted": true, + "text_after_interrupt": "thinking of going to? I'd love to know more details about the location and what kind of activities we might be doing there." + }, + { + "speaker": "A", + "text": "Sorry, I forgot to say—it's a quiet beach just about an hour outside of the city.", + "original_text": "Sorry, I forgot to say—it's a quiet beach just about an hour outside of the city.", + "start_time": 40.29506610453595, + "end_time": 46.03039490272189, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_8_A.wav", + "silence_duration": 0.3052310244206633, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sounds perfect! What should I bring with me?", + "original_text": "Sounds perfect! What should I bring with me?", + "start_time": 46.531567491972815, + "end_time": 48.58653347836737, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_9_B.wav", + "silence_duration": 0.5011725892509241, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We've got plenty of inflatables, but if you want to sit on a chair, you'll have to bring your own sunlounger.", + "original_text": "We've got plenty of inflatables, but if you want to sit on a chair, you'll have to bring your own sunlounger.", + "start_time": 48.90619234949274, + "end_time": 55.001430444730836, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_10_A.wav", + "silence_duration": 0.31965887112536817, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I can just use my beach towel. I love lazing around in the sun.", + "original_text": "I can just use my beach towel. I love lazing around in the sun.", + "start_time": 55.54532335616067, + "end_time": 59.179246258655006, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--205/temp/line_11_B.wav", + "silence_duration": 0.5438929114298329, + "is_interrupted": false + } + ] + }, + "DialogSum--val--206": { + "original_text": "A: Doris, Helen Mall is having a big sale this weekend. Do you wanna [interrupt] check out some deals together? I heard they're offering massive discounts on designer brands and electronics, plus there's going to be live music and free samples throughout the mall.\nB: Sorry, I just remembered, didn't you mention last week that you were saving up for something? Is that why you're not interested?\nA: Yeah, exactly. I'm broke because I'm saving up for a trip. But, what I was going to say earlier—do you still want to go window shopping? We could still enjoy the atmosphere and maybe grab some food at that new Italian place in the food court.\nB: Oh, right! But just looking around? Nah, that sounds boring.", + "cleaned_text": "A:Doris, Helen Mall is having a big sale this weekend. Do you wanna check out some deals together? I heard they're offering massive discounts on designer brands and electronics, plus there's going to be live music and free samples throughout the mall.\nB: Sorry, I just remembered, didn't you mention last week that you were saving up for something? Is that why you're not interested?\nA: Yeah, exactly. I'm broke because I'm saving up for a trip. But, what I was going to say earlier—do you still want to go window shopping? We could still enjoy the atmosphere and maybe grab some food at that new Italian place in the food court.\nB: Oh, right! But just looking around? Nah, that sounds boring.", + "total_duration": 35.70934240362812, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--206/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--206/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--206/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Doris, Helen Mall is having a big sale this weekend. Do you wanna", + "original_text": "Doris, Helen Mall is having a big sale this weekend. Do you wanna [interrupt] check out some deals together? I heard they're offering massive discounts on designer brands and electronics, plus there's going to be live music and free samples throughout the mall.", + "start_time": 0, + "end_time": 15.952108843537415, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--206/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "check out some deals together? I heard they're offering massive discounts on designer brands and electronics, plus there's going to be live music and free samples throughout the mall." + }, + { + "speaker": "B", + "text": "Sorry, I just remembered, didn't you mention last week that you were saving up for something? Is that why you're not interested?", + "original_text": "Sorry, I just remembered, didn't you mention last week that you were saving up for something? Is that why you're not interested?", + "start_time": 4.748480725623582, + "end_time": 10.878548752834467, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--206/temp/line_1_B.wav", + "silence_duration": 0.44688096860753723, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, exactly. I'm broke because I'm saving up for a trip. But, what I was going to say earlier—do you still want to go window shopping? We could still enjoy the atmosphere and maybe grab some food at that new Italian place in the food court.", + "original_text": "Yeah, exactly. I'm broke because I'm saving up for a trip. But, what I was going to say earlier—do you still want to go window shopping? We could still enjoy the atmosphere and maybe grab some food at that new Italian place in the food court.", + "start_time": 16.52865904568552, + "end_time": 31.459089884687785, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--206/temp/line_2_A.wav", + "silence_duration": 0.5765502021481033, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! But just looking around? Nah, that sounds boring.", + "original_text": "Oh, right! But just looking around? Nah, that sounds boring.", + "start_time": 31.7735845343743, + "end_time": 35.70936684729947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--206/temp/line_3_B.wav", + "silence_duration": 0.31449464968651686, + "is_interrupted": false + } + ] + }, + "DialogSum--val--207": { + "original_text": "A: I need help with the office party. \nB: Yes, of course. We could split it. What part would you like to do, the food or the entertainment [interrupt] planning and coordinating all the different aspects of the event to ensure everything runs smoothly and meets everyone's expectations? \nA: Sorry to jump in, but I'm really stuck on the entertainment part. I have no idea what it should be. \nB: Let's make sure we are on the same page. Do we want a formal or informal gathering? \nA: Let's make it a formal affair. \nB: Yes, that would be best. Now, for food should we have Chinese or American [interrupt] cuisine with a variety of options to accommodate different dietary restrictions and preferences among our colleagues? \nA: Actually, I was thinking American food would be the best choice. \nB: That would be great. What kind of music would you like, a band or recorded music? \nA: We should bring in a really good DJ. \nB: That works for me. Let's see what we can each do about planning our part and meet again on Friday.", + "cleaned_text": "A: I need help with the office party. \nB:Yes, of course. We could split it. What part would you like to do, the food or the entertainment planning and coordinating all the different aspects of the event to ensure everything runs smoothly and meets everyone's expectations?\nA: Sorry to jump in, but I'm really stuck on the entertainment part. I have no idea what it should be. \nB: Let's make sure we are on the same page. Do we want a formal or informal gathering? \nA: Let's make it a formal affair. \nB:Yes, that would be best. Now, for food should we have Chinese or American cuisine with a variety of options to accommodate different dietary restrictions and preferences among our colleagues?\nA: Actually, I was thinking American food would be the best choice. \nB: That would be great. What kind of music would you like, a band or recorded music? \nA: We should bring in a really good DJ. \nB: That works for me. Let's see what we can each do about planning our part and meet again on Friday.", + "total_duration": 49.51401360544218, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I need help with the office party.", + "original_text": "I need help with the office party.", + "start_time": 0, + "end_time": 1.9388662131519274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, of course. We could split it. What part would you like to do, the food or the entertainment", + "original_text": "Yes, of course. We could split it. What part would you like to do, the food or the entertainment [interrupt] planning and coordinating all the different aspects of the event to ensure everything runs smoothly and meets everyone's expectations?", + "start_time": 2.306107885189274, + "end_time": 13.637445753669999, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_1_B.wav", + "silence_duration": 0.3672416720373463, + "is_interrupted": true, + "text_after_interrupt": "planning and coordinating all the different aspects of the event to ensure everything runs smoothly and meets everyone's expectations?" + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I'm really stuck on the entertainment part. I have no idea what it should be.", + "original_text": "Sorry to jump in, but I'm really stuck on the entertainment part. I have no idea what it should be.", + "start_time": 7.135858452082698, + "end_time": 13.068556864781112, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_2_A.wav", + "silence_duration": 0.3391249924034887, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let's make sure we are on the same page. Do we want a formal or informal gathering?", + "original_text": "Let's make sure we are on the same page. Do we want a formal or informal gathering?", + "start_time": 14.103304674157542, + "end_time": 18.921445263726703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_3_B.wav", + "silence_duration": 0.46585892048754285, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let's make it a formal affair.", + "original_text": "Let's make it a formal affair.", + "start_time": 19.225718228557493, + "end_time": 21.141364487060894, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_4_A.wav", + "silence_duration": 0.30427296483079097, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that would be best. Now, for food should we have Chinese or American", + "original_text": "Yes, that would be best. Now, for food should we have Chinese or American [interrupt] cuisine with a variety of options to accommodate different dietary restrictions and preferences among our colleagues?", + "start_time": 21.615702677860394, + "end_time": 32.11112217899418, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_5_B.wav", + "silence_duration": 0.47433819079949957, + "is_interrupted": true, + "text_after_interrupt": "cuisine with a variety of options to accommodate different dietary restrictions and preferences among our colleagues?" + }, + { + "speaker": "A", + "text": "Actually, I was thinking American food would be the best choice.", + "original_text": "Actually, I was thinking American food would be the best choice.", + "start_time": 32.76710494965241, + "end_time": 36.29653805622838, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_6_A.wav", + "silence_duration": 0.5332473196222942, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That would be great. What kind of music would you like, a band or recorded music?", + "original_text": "That would be great. What kind of music would you like, a band or recorded music?", + "start_time": 36.77728509275621, + "end_time": 40.71306740568138, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_7_B.wav", + "silence_duration": 0.48074703652783296, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We should bring in a really good DJ.", + "original_text": "We should bring in a really good DJ.", + "start_time": 41.141363941708555, + "end_time": 43.440139451912636, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_8_A.wav", + "silence_duration": 0.42829653602717466, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That works for me. Let's see what we can each do about planning our part and meet again on Friday.", + "original_text": "That works for me. Let's see what we can each do about planning our part and meet again on Friday.", + "start_time": 43.8019366451548, + "end_time": 49.51404548869221, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--207/temp/line_9_B.wav", + "silence_duration": 0.361797193242163, + "is_interrupted": false + } + ] + }, + "DialogSum--val--208": { + "original_text": "A: I am here to get my prescription filled. \nB: Your prescription will be ready in twenty minutes. \nA: Do you ever deliver prescriptions by [interrupt] courier or any other fast service? I was wondering if there are same-day delivery options available for urgent medications or if you partner with any local delivery services. \nB: Sorry to interrupt, yes, we do offer delivery by mail. In fact, you can renew this prescription over the Internet and have it delivered to your home. \nA: That's convenient. By the way, how should I take this medication? \nB: You should take it twice a day. \nA: Should I avoid alcohol with this medication, or are there any other specific things I should steer clear of? \nB: You definitely should. Also, make sure you have something in your stomach when you take it. \nA: Got it. And earlier, you mentioned something about renewing the prescription online—how exactly do I do that? \nB: You can log into our website or use our mobile app to renew it. It's quite simple and saves you a trip. \nA: That's good to know. Should I expect any side effects? \nB: Sometimes you might feel dizzy, but that isn't common.", + "cleaned_text": "A: I am here to get my prescription filled. \nB: Your prescription will be ready in twenty minutes. \nA:Do you ever deliver prescriptions by courier or any other fast service? I was wondering if there are same-day delivery options available for urgent medications or if you partner with any local delivery services.\nB: Sorry to interrupt, yes, we do offer delivery by mail. In fact, you can renew this prescription over the Internet and have it delivered to your home. \nA: That's convenient. By the way, how should I take this medication? \nB: You should take it twice a day. \nA: Should I avoid alcohol with this medication, or are there any other specific things I should steer clear of? \nB: You definitely should. Also, make sure you have something in your stomach when you take it. \nA: Got it. And earlier, you mentioned something about renewing the prescription online—how exactly do I do that? \nB: You can log into our website or use our mobile app to renew it. It's quite simple and saves you a trip. \nA: That's good to know. Should I expect any side effects? \nB: Sometimes you might feel dizzy, but that isn't common.", + "total_duration": 57.18349206349206, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I am here to get my prescription filled.", + "original_text": "I am here to get my prescription filled.", + "start_time": 0, + "end_time": 2.2523356009070294, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Your prescription will be ready in twenty minutes.", + "original_text": "Your prescription will be ready in twenty minutes.", + "start_time": 2.626557920164287, + "end_time": 4.786013702477212, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_1_B.wav", + "silence_duration": 0.37422231925725763, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you ever deliver prescriptions by", + "original_text": "Do you ever deliver prescriptions by [interrupt] courier or any other fast service? I was wondering if there are same-day delivery options available for urgent medications or if you partner with any local delivery services.", + "start_time": 5.139879774762211, + "end_time": 18.491353697664707, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_2_A.wav", + "silence_duration": 0.35386607228499944, + "is_interrupted": true, + "text_after_interrupt": "courier or any other fast service? I was wondering if there are same-day delivery options available for urgent medications or if you partner with any local delivery services." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, yes, we do offer delivery by mail. In fact, you can renew this prescription over the Internet and have it delivered to your home.", + "original_text": "Sorry to interrupt, yes, we do offer delivery by mail. In fact, you can renew this prescription over the Internet and have it delivered to your home.", + "start_time": 7.392215375669241, + "end_time": 16.36672784732457, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_3_B.wav", + "silence_duration": 0.475528829806278, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's convenient. By the way, how should I take this medication?", + "original_text": "That's convenient. By the way, how should I take this medication?", + "start_time": 18.852252393697658, + "end_time": 23.10150409437793, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_4_A.wav", + "silence_duration": 0.36089869603295055, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You should take it twice a day.", + "original_text": "You should take it twice a day.", + "start_time": 23.675747892015757, + "end_time": 25.185044944169952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_5_B.wav", + "silence_duration": 0.5742437976378256, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Should I avoid alcohol with this medication, or are there any other specific things I should steer clear of?", + "original_text": "Should I avoid alcohol with this medication, or are there any other specific things I should steer clear of?", + "start_time": 25.557991302836644, + "end_time": 31.827379057938685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_6_A.wav", + "silence_duration": 0.37294635866669207, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You definitely should. Also, make sure you have something in your stomach when you take it.", + "original_text": "You definitely should. Also, make sure you have something in your stomach when you take it.", + "start_time": 32.16768046824102, + "end_time": 36.49820201019113, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_7_B.wav", + "silence_duration": 0.34030141030233185, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. And earlier, you mentioned something about renewing the prescription online—how exactly do I do that?", + "original_text": "Got it. And earlier, you mentioned something about renewing the prescription online—how exactly do I do that?", + "start_time": 37.01624366204097, + "end_time": 44.144769739138475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_8_A.wav", + "silence_duration": 0.5180416518498451, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You can log into our website or use our mobile app to renew it. It's quite simple and saves you a trip.", + "original_text": "You can log into our website or use our mobile app to renew it. It's quite simple and saves you a trip.", + "start_time": 44.74358662761713, + "end_time": 50.07256621945386, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_9_B.wav", + "silence_duration": 0.5988168884786542, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's good to know. Should I expect any side effects?", + "original_text": "That's good to know. Should I expect any side effects?", + "start_time": 50.469941660451276, + "end_time": 54.069034630972816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_10_A.wav", + "silence_duration": 0.39737544099741445, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sometimes you might feel dizzy, but that isn't common.", + "original_text": "Sometimes you might feel dizzy, but that isn't common.", + "start_time": 54.38551577315147, + "end_time": 57.18352030829886, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--208/temp/line_11_B.wav", + "silence_duration": 0.3164811421786526, + "is_interrupted": false + } + ] + }, + "DialogSum--val--209": { + "original_text": "A: Mom, can I watch TV? \nB: No more today, honey. \nA: Alright, Mom. Should I turn off the TV right [interrupt] now, or can I finish this episode first? I promise it's almost over and I'll go straight to my room afterward. \nB: Wait, before you turn it off, did you finish your homework? \nA: Yes, I did. But I was asking if I should turn off the TV right now? \nB: Yes, honey. Go to your room, and take out your book. It's your reading time now. \nA: Mom, where is the remote? I can't find it. \nB: Just go to read. I will find it, honey.", + "cleaned_text": "A: Mom, can I watch TV? \nB: No more today, honey. \nA:Alright, Mom. Should I turn off the TV right now, or can I finish this episode first? I promise it's almost over and I'll go straight to my room afterward.\nB: Wait, before you turn it off, did you finish your homework? \nA: Yes, I did. But I was asking if I should turn off the TV right now? \nB: Yes, honey. Go to your room, and take out your book. It's your reading time now. \nA: Mom, where is the remote? I can't find it. \nB: Just go to read. I will find it, honey.", + "total_duration": 29.332290249433107, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Mom, can I watch TV?", + "original_text": "Mom, can I watch TV?", + "start_time": 0, + "end_time": 1.799546485260771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No more today, honey.", + "original_text": "No more today, honey.", + "start_time": 2.249425222431638, + "end_time": 3.468472841479257, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_1_B.wav", + "silence_duration": 0.44987873717086696, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Alright, Mom. Should I turn off the TV right", + "original_text": "Alright, Mom. Should I turn off the TV right [interrupt] now, or can I finish this episode first? I promise it's almost over and I'll go straight to my room afterward.", + "start_time": 4.032376677064401, + "end_time": 13.12298892196236, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_2_A.wav", + "silence_duration": 0.5639038355851442, + "is_interrupted": true, + "text_after_interrupt": "now, or can I finish this episode first? I promise it's almost over and I'll go straight to my room afterward." + }, + { + "speaker": "B", + "text": "Wait, before you turn it off, did you finish your homework?", + "original_text": "Wait, before you turn it off, did you finish your homework?", + "start_time": 6.667841529672111, + "end_time": 9.407796178198188, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_3_B.wav", + "silence_duration": 0.38129400631189464, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I did. But I was asking if I should turn off the TV right now?", + "original_text": "Yes, I did. But I was asking if I should turn off the TV right now?", + "start_time": 13.662101969722295, + "end_time": 18.480242559291455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_4_A.wav", + "silence_duration": 0.5391130477599358, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, honey. Go to your room, and take out your book. It's your reading time now.", + "original_text": "Yes, honey. Go to your room, and take out your book. It's your reading time now.", + "start_time": 18.97527587596786, + "end_time": 23.1084278034055, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_5_B.wav", + "silence_duration": 0.4950333166764047, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Mom, where is the remote? I can't find it.", + "original_text": "Mom, where is the remote? I can't find it.", + "start_time": 23.622287789959124, + "end_time": 26.838251508779987, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_6_A.wav", + "silence_duration": 0.5138599865536221, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just go to read. I will find it, honey.", + "original_text": "Just go to read. I will find it, honey.", + "start_time": 27.41667572757782, + "end_time": 29.332321986081222, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--209/temp/line_7_B.wav", + "silence_duration": 0.5784242187978352, + "is_interrupted": false + } + ] + }, + "DialogSum--val--210": { + "original_text": "A: Is there a problem, officer? \nB: I stopped you for driving through a red light. \nA: Did I [interrupt] not notice it? I was completely focused on the road ahead and must have missed the signal change entirely. \nB: You didn't know? \nA: I had no idea that I ran it. \nB: Don't you know that yellow means slow down? \nA: Yes, madam. \nB: Why'd you speed up when you saw the yellow light? \nA: Officer, I really have no excuse, madam. I was distracted by something, but I didn't mean to speed up. \nB: I'll have to write you a ticket. \nA: I understand, and I am very sorry. By the way, did you mention why I sped up earlier? \nB: Yes, I asked why you sped up instead of slowing down [interrupt] when the traffic signal clearly indicated you should prepare to stop for the upcoming red light. \nA: I was just caught up in my thoughts, and I realize that's no excuse. \nB: Here's your ticket.", + "cleaned_text": "A: Is there a problem, officer? \nB: I stopped you for driving through a red light. \nA:Did I not notice it? I was completely focused on the road ahead and must have missed the signal change entirely.\nB: You didn't know? \nA: I had no idea that I ran it. \nB: Don't you know that yellow means slow down? \nA: Yes, madam. \nB: Why'd you speed up when you saw the yellow light? \nA: Officer, I really have no excuse, madam. I was distracted by something, but I didn't mean to speed up. \nB: I'll have to write you a ticket. \nA: I understand, and I am very sorry. By the way, did you mention why I sped up earlier? \nB:Yes, I asked why you sped up instead of slowing down when the traffic signal clearly indicated you should prepare to stop for the upcoming red light.\nA: I was just caught up in my thoughts, and I realize that's no excuse. \nB: Here's your ticket.", + "total_duration": 45.74503401360544, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is there a problem, officer?", + "original_text": "Is there a problem, officer?", + "start_time": 0, + "end_time": 1.509297052154195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I stopped you for driving through a red light.", + "original_text": "I stopped you for driving through a red light.", + "start_time": 1.9877205632651307, + "end_time": 4.100736436281004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_1_B.wav", + "silence_duration": 0.4784235111109356, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Did I", + "original_text": "Did I [interrupt] not notice it? I was completely focused on the road ahead and must have missed the signal change entirely.", + "start_time": 4.696792156321267, + "end_time": 11.616338641582038, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_2_A.wav", + "silence_duration": 0.5960557200402639, + "is_interrupted": true, + "text_after_interrupt": "not notice it? I was completely focused on the road ahead and must have missed the signal change entirely." + }, + { + "speaker": "B", + "text": "You didn't know?", + "original_text": "You didn't know?", + "start_time": 5.451440682398365, + "end_time": 6.380238868339409, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_3_B.wav", + "silence_duration": 0.4421677552026936, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I had no idea that I ran it.", + "original_text": "I had no idea that I ran it.", + "start_time": 11.93135522314014, + "end_time": 13.73090170840091, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_4_A.wav", + "silence_duration": 0.31501658155810097, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't you know that yellow means slow down?", + "original_text": "Don't you know that yellow means slow down?", + "start_time": 14.096449108348473, + "end_time": 16.128195140094505, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_5_B.wav", + "silence_duration": 0.36554739994756263, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, madam.", + "original_text": "Yes, madam.", + "start_time": 16.535273698707407, + "end_time": 17.452461907324185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_6_A.wav", + "silence_duration": 0.40707855861290126, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why'd you speed up when you saw the yellow light?", + "original_text": "Why'd you speed up when you saw the yellow light?", + "start_time": 17.758487882107225, + "end_time": 19.83667382315031, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_7_B.wav", + "silence_duration": 0.30602597478304183, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Officer, I really have no excuse, madam. I was distracted by something, but I didn't mean to speed up.", + "original_text": "Officer, I really have no excuse, madam. I was distracted by something, but I didn't mean to speed up.", + "start_time": 20.3986917332523, + "end_time": 27.329848195837332, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_8_A.wav", + "silence_duration": 0.562017910101989, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll have to write you a ticket.", + "original_text": "I'll have to write you a ticket.", + "start_time": 27.662681910552834, + "end_time": 29.021049257491608, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_9_B.wav", + "silence_duration": 0.3328337147155032, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I understand, and I am very sorry. By the way, did you mention why I sped up earlier?", + "original_text": "I understand, and I am very sorry. By the way, did you mention why I sped up earlier?", + "start_time": 29.456578356454333, + "end_time": 35.41249672380127, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_10_A.wav", + "silence_duration": 0.43552909896272574, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I asked why you sped up instead of slowing down", + "original_text": "Yes, I asked why you sped up instead of slowing down [interrupt] when the traffic signal clearly indicated you should prepare to stop for the upcoming red light.", + "start_time": 35.886701425360805, + "end_time": 42.945567638512735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_11_B.wav", + "silence_duration": 0.4742047015595365, + "is_interrupted": true, + "text_after_interrupt": "when the traffic signal clearly indicated you should prepare to stop for the upcoming red light." + }, + { + "speaker": "A", + "text": "I was just caught up in my thoughts, and I realize that's no excuse.", + "original_text": "I was just caught up in my thoughts, and I realize that's no excuse.", + "start_time": 40.32837325653847, + "end_time": 44.21771566016659, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_12_A.wav", + "silence_duration": 0.5577939950889585, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here's your ticket.", + "original_text": "Here's your ticket.", + "start_time": 44.81623698305459, + "end_time": 45.74503516899563, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--210/temp/line_13_B.wav", + "silence_duration": 0.5985213228879952, + "is_interrupted": false + } + ] + }, + "DialogSum--val--211": { + "original_text": "A: Has Alan shown up yet? \nB: Nope. I guess something might have [interrupt] happened on his way here, or maybe he's dealing with a personal issue that we're not aware of yet. He's usually so punctual that this is really out of character for him. \nA: Do you think it could be related to his sister? \nB: I'm not sure. What happened to her? \nA: Last week his sister was admitted to the hospital. \nB: Oh? What happened? \nA: His sister had a car accident last week. \nB: Is she fine now? \nA: She is still in a coma. \nB: Oh, poor Alan! His sister is the only one he has left since his parents died last year. \nA: Right, and I was going to mention earlier, I hope it's nothing serious that kept him from showing up today.", + "cleaned_text": "A: Has Alan shown up yet? \nB:Nope. I guess something might have happened on his way here, or maybe he's dealing with a personal issue that we're not aware of yet. He's usually so punctual that this is really out of character for him.\nA: Do you think it could be related to his sister? \nB: I'm not sure. What happened to her? \nA: Last week his sister was admitted to the hospital. \nB: Oh? What happened? \nA: His sister had a car accident last week. \nB: Is she fine now? \nA: She is still in a coma. \nB: Oh, poor Alan! His sister is the only one he has left since his parents died last year. \nA: Right, and I was going to mention earlier, I hope it's nothing serious that kept him from showing up today.", + "total_duration": 36.63079365079365, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Has Alan shown up yet?", + "original_text": "Has Alan shown up yet?", + "start_time": 0, + "end_time": 1.6137868480725623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Nope. I guess something might have", + "original_text": "Nope. I guess something might have [interrupt] happened on his way here, or maybe he's dealing with a personal issue that we're not aware of yet. He's usually so punctual that this is really out of character for him.", + "start_time": 2.154719429682805, + "end_time": 11.431091311768972, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_1_B.wav", + "silence_duration": 0.5409325816102425, + "is_interrupted": true, + "text_after_interrupt": "happened on his way here, or maybe he's dealing with a personal issue that we're not aware of yet. He's usually so punctual that this is really out of character for him." + }, + { + "speaker": "A", + "text": "Do you think it could be related to his sister?", + "original_text": "Do you think it could be related to his sister?", + "start_time": 3.8497761190252087, + "end_time": 6.160161606553553, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_2_A.wav", + "silence_duration": 0.3005132663148405, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm not sure. What happened to her?", + "original_text": "I'm not sure. What happened to her?", + "start_time": 11.877414211728901, + "end_time": 14.048479971366088, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_3_B.wav", + "silence_duration": 0.4463228999599284, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Last week his sister was admitted to the hospital.", + "original_text": "Last week his sister was admitted to the hospital.", + "start_time": 14.370147114358359, + "end_time": 17.028831921614593, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_4_A.wav", + "silence_duration": 0.3216671429922698, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh? What happened?", + "original_text": "Oh? What happened?", + "start_time": 17.368149197068146, + "end_time": 18.37821722427903, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_5_B.wav", + "silence_duration": 0.339317275453554, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "His sister had a car accident last week.", + "original_text": "His sister had a car accident last week.", + "start_time": 18.825495471512934, + "end_time": 21.263590709608174, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_6_A.wav", + "silence_duration": 0.44727824723390297, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is she fine now?", + "original_text": "Is she fine now?", + "start_time": 21.720450709119262, + "end_time": 22.800178600275725, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_7_B.wav", + "silence_duration": 0.456859999511088, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "She is still in a coma.", + "original_text": "She is still in a coma.", + "start_time": 23.370366210282093, + "end_time": 24.763563489193658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_8_A.wav", + "silence_duration": 0.570187610006367, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, poor Alan! His sister is the only one he has left since his parents died last year.", + "original_text": "Oh, poor Alan! His sister is the only one he has left since his parents died last year.", + "start_time": 25.143720451366068, + "end_time": 29.741271471774233, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_9_B.wav", + "silence_duration": 0.3801569621724101, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Right, and I was going to mention earlier, I hope it's nothing serious that kept him from showing up today.", + "original_text": "Right, and I was going to mention earlier, I hope it's nothing serious that kept him from showing up today.", + "start_time": 30.2220975559235, + "end_time": 36.6308050389167, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--211/temp/line_10_A.wav", + "silence_duration": 0.480826084149268, + "is_interrupted": false + } + ] + }, + "DialogSum--val--212": { + "original_text": "A: Hello, John. How are you? \nB: I'm fine, thanks. And you? \nA: Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been [interrupt] up to lately with all your projects and studies? I remember you were working on something big last time we spoke. \nB: Sorry to interrupt, but I just remembered—didn't you mention you were planning to take some courses? How did that go? \nA: Oh, nothing much really. I was going to tell you about that, but I didn't get the chance. And how is everything with you? \nB: Fine, thanks. I've been busy lately. \nA: What have you been doing? \nB: I've been studying for my exams. My school exams will begin next month. \nA: Oh, I remember you mentioned your exams before [interrupt] and said they were going to be tough, especially the advanced mathematics section that you were particularly worried about. Are you feeling prepared now that you've had more time to study? \nB: Right, I did. And how are your parents? \nA: They're both very well, thanks. By the way, I was about to ask—where are you going now? \nB: I'm going to do some shopping. Why don't you come with me?", + "cleaned_text": "A: Hello, John. How are you? \nB: I'm fine, thanks. And you? \nA:Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been up to lately with all your projects and studies? I remember you were working on something big last time we spoke.\nB: Sorry to interrupt, but I just remembered—didn't you mention you were planning to take some courses? How did that go? \nA: Oh, nothing much really. I was going to tell you about that, but I didn't get the chance. And how is everything with you? \nB: Fine, thanks. I've been busy lately. \nA: What have you been doing? \nB: I've been studying for my exams. My school exams will begin next month. \nA:Oh, I remember you mentioned your exams before and said they were going to be tough, especially the advanced mathematics section that you were particularly worried about. Are you feeling prepared now that you've had more time to study?\nB: Right, I did. And how are your parents? \nA: They're both very well, thanks. By the way, I was about to ask—where are you going now? \nB: I'm going to do some shopping. Why don't you come with me?", + "total_duration": 57.166439909297054, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, John. How are you?", + "original_text": "Hello, John. How are you?", + "start_time": 0, + "end_time": 1.5325170068027212, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm fine, thanks. And you?", + "original_text": "I'm fine, thanks. And you?", + "start_time": 1.9069897372590585, + "end_time": 3.4859466533588317, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_1_B.wav", + "silence_duration": 0.37447273045633733, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been", + "original_text": "Very well, thanks. Nice to see you again. I haven't seen you for a long time. What have you been [interrupt] up to lately with all your projects and studies? I remember you were working on something big last time we spoke.", + "start_time": 4.021119385615414, + "end_time": 16.432185145252603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_2_A.wav", + "silence_duration": 0.5351727322565827, + "is_interrupted": true, + "text_after_interrupt": "up to lately with all your projects and studies? I remember you were working on something big last time we spoke." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I just remembered—didn't you mention you were planning to take some courses? How did that go?", + "original_text": "Sorry to interrupt, but I just remembered—didn't you mention you were planning to take some courses? How did that go?", + "start_time": 10.371776981987296, + "end_time": 16.490235031873915, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_3_B.wav", + "silence_duration": 0.5603462201794165, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, nothing much really. I was going to tell you about that, but I didn't get the chance. And how is everything with you?", + "original_text": "Oh, nothing much really. I was going to tell you about that, but I didn't get the chance. And how is everything with you?", + "start_time": 16.842909831254207, + "end_time": 24.296515273431076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_4_A.wav", + "silence_duration": 0.35267479938029256, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fine, thanks. I've been busy lately.", + "original_text": "Fine, thanks. I've been busy lately.", + "start_time": 24.832221164724434, + "end_time": 26.782697355200625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_5_B.wav", + "silence_duration": 0.5357058912933567, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What have you been doing?", + "original_text": "What have you been doing?", + "start_time": 27.202462932850782, + "end_time": 28.49117041584398, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_6_A.wav", + "silence_duration": 0.41976557765015815, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've been studying for my exams. My school exams will begin next month.", + "original_text": "I've been studying for my exams. My school exams will begin next month.", + "start_time": 29.039435656694785, + "end_time": 32.975217969619955, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_7_B.wav", + "silence_duration": 0.5482652408508055, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I remember you mentioned your exams before", + "original_text": "Oh, I remember you mentioned your exams before [interrupt] and said they were going to be tough, especially the advanced mathematics section that you were particularly worried about. Are you feeling prepared now that you've had more time to study?", + "start_time": 33.51305067230292, + "end_time": 46.8064747085841, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_8_A.wav", + "silence_duration": 0.5378327026829611, + "is_interrupted": true, + "text_after_interrupt": "and said they were going to be tough, especially the advanced mathematics section that you were particularly worried about. Are you feeling prepared now that you've had more time to study?" + }, + { + "speaker": "B", + "text": "Right, I did. And how are your parents?", + "original_text": "Right, I did. And how are your parents?", + "start_time": 42.936739364090585, + "end_time": 45.189074964997616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_9_B.wav", + "silence_duration": 0.485228613497706, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They're both very well, thanks. By the way, I was about to ask—where are you going now?", + "original_text": "They're both very well, thanks. By the way, I was about to ask—where are you going now?", + "start_time": 47.39156241138403, + "end_time": 53.96280957691691, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_10_A.wav", + "silence_duration": 0.5850877027999312, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm going to do some shopping. Why don't you come with me?", + "original_text": "I'm going to do some shopping. Why don't you come with me?", + "start_time": 54.472932567468185, + "end_time": 57.16644730669721, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--212/temp/line_11_B.wav", + "silence_duration": 0.5101229905512759, + "is_interrupted": false + } + ] + }, + "DialogSum--val--213": { + "original_text": "A: Vince, I think one of your programmers is spying on us for WebTracker.\nB: Pardon?\nA: I won't say who, because I'm not sure yet. But I'll know [interrupt] once I gather more evidence and confirm my suspicions through careful monitoring of their network activity and communication patterns.\nB: Wait, Zina, I hope you're not scheming to make Elvin look bad.\nA: It isn't Elvin. But as I was saying, I'll know soon.\nB: Dave then? Dave is a spy for WebTracker? You can't be serious.", + "cleaned_text": "A: Vince, I think one of your programmers is spying on us for WebTracker.\nB: Pardon?\nA:I won't say who, because I'm not sure yet. But I'll know once I gather more evidence and confirm my suspicions through careful monitoring of their network activity and communication patterns.\nB: Wait, Zina, I hope you're not scheming to make Elvin look bad.\nA: It isn't Elvin. But as I was saying, I'll know soon.\nB: Dave then? Dave is a spy for WebTracker? You can't be serious.", + "total_duration": 26.202857142857145, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Vince, I think one of your programmers is spying on us for WebTracker.", + "original_text": "Vince, I think one of your programmers is spying on us for WebTracker.", + "start_time": 0, + "end_time": 4.179591836734694, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Pardon?", + "original_text": "Pardon?", + "start_time": 4.57486654513905, + "end_time": 4.969605774163993, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/temp/line_1_B.wav", + "silence_duration": 0.39527470840435536, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I won't say who, because I'm not sure yet. But I'll know", + "original_text": "I won't say who, because I'm not sure yet. But I'll know [interrupt] once I gather more evidence and confirm my suspicions through careful monitoring of their network activity and communication patterns.", + "start_time": 5.4145445204666816, + "end_time": 16.908422071487088, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/temp/line_2_A.wav", + "silence_duration": 0.4449387463026886, + "is_interrupted": true, + "text_after_interrupt": "once I gather more evidence and confirm my suspicions through careful monitoring of their network activity and communication patterns." + }, + { + "speaker": "B", + "text": "Wait, Zina, I hope you're not scheming to make Elvin look bad.", + "original_text": "Wait, Zina, I hope you're not scheming to make Elvin look bad.", + "start_time": 9.18778715085217, + "end_time": 12.65917037080682, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/temp/line_3_B.wav", + "silence_duration": 0.4903602938904792, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It isn't Elvin. But as I was saying, I'll know soon.", + "original_text": "It isn't Elvin. But as I was saying, I'll know soon.", + "start_time": 17.403601460580163, + "end_time": 20.816934793913497, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/temp/line_4_A.wav", + "silence_duration": 0.4951793890930753, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Dave then? Dave is a spy for WebTracker? You can't be serious.", + "original_text": "Dave then? Dave is a spy for WebTracker? You can't be serious.", + "start_time": 21.152541600720497, + "end_time": 26.20288173677492, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--213/temp/line_5_B.wav", + "silence_duration": 0.3356068068069998, + "is_interrupted": false + } + ] + }, + "DialogSum--val--214": { + "original_text": "A: Well, it's too bad that we like different kinds of movies. Maybe we're just different kinds of [interrupt] people with distinct preferences and perspectives, but that doesn't mean we can't still have fun together by exploring new experiences and finding creative compromises. \nB: Sorry to cut in, but maybe we're not that different after all. What if we find some common ground? \nA: Yeah, it's too bad. . . but actually I think I know what to do. \nB: What's that? \nA: We can go to a horror movie, and I'll hold your hand so you don't get scared. \nB: You mean. . . like on a second date? \nA: Of course! Or are you still too scared? \nB: Wait, you were saying something about us being different kinds of people. What did you mean by that? \nA: Oh, I just meant that even though we have different tastes, it doesn't mean we can't find ways to enjoy things together.", + "cleaned_text": "A:Well, it's too bad that we like different kinds of movies. Maybe we're just different kinds of people with distinct preferences and perspectives, but that doesn't mean we can't still have fun together by exploring new experiences and finding creative compromises.\nB: Sorry to cut in, but maybe we're not that different after all. What if we find some common ground? \nA: Yeah, it's too bad. . . but actually I think I know what to do. \nB: What's that? \nA: We can go to a horror movie, and I'll hold your hand so you don't get scared. \nB: You mean. . . like on a second date? \nA: Of course! Or are you still too scared? \nB: Wait, you were saying something about us being different kinds of people. What did you mean by that? \nA: Oh, I just meant that even though we have different tastes, it doesn't mean we can't find ways to enjoy things together.", + "total_duration": 44.4362358276644, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, it's too bad that we like different kinds of movies. Maybe we're just different kinds of", + "original_text": "Well, it's too bad that we like different kinds of movies. Maybe we're just different kinds of [interrupt] people with distinct preferences and perspectives, but that doesn't mean we can't still have fun together by exploring new experiences and finding creative compromises.", + "start_time": 0, + "end_time": 15.731519274376417, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "people with distinct preferences and perspectives, but that doesn't mean we can't still have fun together by exploring new experiences and finding creative compromises." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but maybe we're not that different after all. What if we find some common ground?", + "original_text": "Sorry to cut in, but maybe we're not that different after all. What if we find some common ground?", + "start_time": 5.038730158730159, + "end_time": 10.193560090702949, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_1_B.wav", + "silence_duration": 0.5452763048651754, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, it's too bad. . . but actually I think I know what to do.", + "original_text": "Yeah, it's too bad. . . but actually I think I know what to do.", + "start_time": 16.035073507681165, + "end_time": 20.226275321740122, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_2_A.wav", + "silence_duration": 0.3035542333047468, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What's that?", + "original_text": "What's that?", + "start_time": 20.810366657386492, + "end_time": 21.46052538754522, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_3_B.wav", + "silence_duration": 0.58409133564637, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We can go to a horror movie, and I'll hold your hand so you don't get scared.", + "original_text": "We can go to a horror movie, and I'll hold your hand so you don't get scared.", + "start_time": 22.026485864281337, + "end_time": 26.484717156798343, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_4_A.wav", + "silence_duration": 0.5659604767361166, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You mean. . . like on a second date?", + "original_text": "You mean. . . like on a second date?", + "start_time": 26.84952399543804, + "end_time": 28.98575982310244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_5_B.wav", + "silence_duration": 0.36480683863969754, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Of course! Or are you still too scared?", + "original_text": "Of course! Or are you still too scared?", + "start_time": 29.55948644128767, + "end_time": 32.4387608177049, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_6_A.wav", + "silence_duration": 0.5737266181852294, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait, you were saying something about us being different kinds of people. What did you mean by that?", + "original_text": "Wait, you were saying something about us being different kinds of people. What did you mean by that?", + "start_time": 32.97012895344791, + "end_time": 37.103280880885556, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_7_B.wav", + "silence_duration": 0.5313681357430114, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I just meant that even though we have different tastes, it doesn't mean we can't find ways to enjoy things together.", + "original_text": "Oh, I just meant that even though we have different tastes, it doesn't mean we can't find ways to enjoy things together.", + "start_time": 37.59799877701509, + "end_time": 44.43627542100602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--214/temp/line_8_A.wav", + "silence_duration": 0.4947178961295344, + "is_interrupted": false + } + ] + }, + "DialogSum--val--215": { + "original_text": "A: Could we possibly discuss my salary some time? \nB: Sure. \nA: First of all, I want you to know that I really like working for this company. Do you think I'm doing a good [interrupt] job here? I've been putting in a lot of effort to meet the expectations and have consistently received positive feedback from both colleagues and clients about my performance. \nB: Sorry to jump in, but before we go further, I just want to clarify—are you thinking of staying long-term with us? \nA: Absolutely, I see a future here. Now, as I was saying, do you think I'm doing a good job here? \nB: Well, you are a very hard-worker. \nA: I try very hard. The problem is, my salary just isn't enough to live on. Now that I have a wife and a child to support, we hardly have enough money for food and rent. \nB: These are trying times for everyone. What do you propose? \nA: I could really use a 5% rise. \nB: That's quite a bit. If I give you a raise, I'm going to have to give everyone a raise. \nA: Listen, if you give me a raise, I'll take on extra responsibilities. \nB: That sounds reasonable. How about this, from now on, you can be responsible for scheduling. That means that if you can't find someone to cover a shift, then you'll have to step in yourself to ensure the shift is covered. \nA: Wait, just to clarify, if I have to cover a shift myself, do I get overtime for those extra hours? \nB: Of course. It'd be against the law if we didn't.", + "cleaned_text": "A: Could we possibly discuss my salary some time? \nB: Sure. \nA:First of all, I want you to know that I really like working for this company. Do you think I'm doing a good job here? I've been putting in a lot of effort to meet the expectations and have consistently received positive feedback from both colleagues and clients about my performance.\nB: Sorry to jump in, but before we go further, I just want to clarify—are you thinking of staying long-term with us? \nA: Absolutely, I see a future here. Now, as I was saying, do you think I'm doing a good job here? \nB: Well, you are a very hard-worker. \nA: I try very hard. The problem is, my salary just isn't enough to live on. Now that I have a wife and a child to support, we hardly have enough money for food and rent. \nB: These are trying times for everyone. What do you propose? \nA: I could really use a 5% rise. \nB: That's quite a bit. If I give you a raise, I'm going to have to give everyone a raise. \nA: Listen, if you give me a raise, I'll take on extra responsibilities. \nB: That sounds reasonable. How about this, from now on, you can be responsible for scheduling. That means that if you can't find someone to cover a shift, then you'll have to step in yourself to ensure the shift is covered. \nA: Wait, just to clarify, if I have to cover a shift myself, do I get overtime for those extra hours? \nB: Of course. It'd be against the law if we didn't.", + "total_duration": 77.25006802721089, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Could we possibly discuss my salary some time?", + "original_text": "Could we possibly discuss my salary some time?", + "start_time": 0, + "end_time": 2.809614512471655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure.", + "original_text": "Sure.", + "start_time": 3.283641880233768, + "end_time": 3.852530769122657, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_1_B.wav", + "silence_duration": 0.47402736776211296, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "First of all, I want you to know that I really like working for this company. Do you think I'm doing a good", + "original_text": "First of all, I want you to know that I really like working for this company. Do you think I'm doing a good [interrupt] job here? I've been putting in a lot of effort to meet the expectations and have consistently received positive feedback from both colleagues and clients about my performance.", + "start_time": 4.302860067538461, + "end_time": 20.254968911075878, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_2_A.wav", + "silence_duration": 0.45032929841580394, + "is_interrupted": true, + "text_after_interrupt": "job here? I've been putting in a lot of effort to meet the expectations and have consistently received positive feedback from both colleagues and clients about my performance." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but before we go further, I just want to clarify—are you thinking of staying long-term with us?", + "original_text": "Sorry to jump in, but before we go further, I just want to clarify—are you thinking of staying long-term with us?", + "start_time": 10.514197936019187, + "end_time": 16.365626507447757, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_3_B.wav", + "silence_duration": 0.5889807676601932, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely, I see a future here. Now, as I was saying, do you think I'm doing a good job here?", + "original_text": "Absolutely, I see a future here. Now, as I was saying, do you think I'm doing a good job here?", + "start_time": 20.701033246836325, + "end_time": 27.01686091123542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_4_A.wav", + "silence_duration": 0.44606433576044613, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, you are a very hard-worker.", + "original_text": "Well, you are a very hard-worker.", + "start_time": 27.39986758527696, + "end_time": 29.26907393448331, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_5_B.wav", + "silence_duration": 0.38300667404154126, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I try very hard. The problem is, my salary just isn't enough to live on. Now that I have a wife and a child to support, we hardly have enough money for food and rent.", + "original_text": "I try very hard. The problem is, my salary just isn't enough to live on. Now that I have a wife and a child to support, we hardly have enough money for food and rent.", + "start_time": 29.80251882888418, + "end_time": 40.47208798988191, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_6_A.wav", + "silence_duration": 0.5334448944008676, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "These are trying times for everyone. What do you propose?", + "original_text": "These are trying times for everyone. What do you propose?", + "start_time": 40.87270859674652, + "end_time": 43.844862791757855, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_7_B.wav", + "silence_duration": 0.40062060686460876, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I could really use a 5% rise.", + "original_text": "I could really use a 5% rise.", + "start_time": 44.39309445764179, + "end_time": 46.98211940095244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_8_A.wav", + "silence_duration": 0.5482316658839337, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's quite a bit. If I give you a raise, I'm going to have to give everyone a raise.", + "original_text": "That's quite a bit. If I give you a raise, I'm going to have to give everyone a raise.", + "start_time": 47.30285005296029, + "end_time": 51.57532170828909, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_9_B.wav", + "silence_duration": 0.32073065200784556, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Listen, if you give me a raise, I'll take on extra responsibilities.", + "original_text": "Listen, if you give me a raise, I'll take on extra responsibilities.", + "start_time": 51.877473010149565, + "end_time": 55.79003536842621, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_10_A.wav", + "silence_duration": 0.30215130186047945, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds reasonable. How about this, from now on, you can be responsible for scheduling. That means that if you can't find someone to cover a shift, then you'll have to step in yourself to ensure the shift is covered.", + "original_text": "That sounds reasonable. How about this, from now on, you can be responsible for scheduling. That means that if you can't find someone to cover a shift, then you'll have to step in yourself to ensure the shift is covered.", + "start_time": 56.13752977565714, + "end_time": 66.96963861919455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_11_B.wav", + "silence_duration": 0.3474944072309325, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, just to clarify, if I have to cover a shift myself, do I get overtime for those extra hours?", + "original_text": "Wait, just to clarify, if I have to cover a shift myself, do I get overtime for those extra hours?", + "start_time": 67.44585438448523, + "end_time": 74.64404032552831, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_12_A.wav", + "silence_duration": 0.4762157652906705, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course. It'd be against the law if we didn't.", + "original_text": "Of course. It'd be against the law if we didn't.", + "start_time": 75.16030079480412, + "end_time": 77.25009671317146, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--215/temp/line_13_B.wav", + "silence_duration": 0.5162604692758008, + "is_interrupted": false + } + ] + }, + "DialogSum--val--216": { + "original_text": "A: Did you enjoy that new movie? \nB: That movie's just a lot of noise, same as Simon. \nA: Oh, what happened, Carole? \nB: I had to go by myself, he couldn't [interrupt] make it because he had some last-minute work, or so he said, but I suspect he was just making excuses as usual to avoid spending time with me. \nA: What? I met him just before I took off from Kitty's, he said he was coming. \nB: Kitty's? He sure gets around, doesn't he? \nA: Looks like it. So how did he handle the situation when you confronted him about it? \nB: His excuse was familiar. He said his car died again. \nA: I think that's a bunch of nonsense. It seemed ok to me. \nB: I know. Last week he gave me a lie about being too busy. \nA: Wait, what were you saying earlier about how he handled it? \nB: Oh, right. He just brushed it off like it was no big deal. \nA: Doesn't sound promising. \nB: Well, I think it's the time to pull the plug.", + "cleaned_text": "A: Did you enjoy that new movie? \nB: That movie's just a lot of noise, same as Simon. \nA: Oh, what happened, Carole? \nB:I had to go by myself, he couldn't make it because he had some last-minute work, or so he said, but I suspect he was just making excuses as usual to avoid spending time with me.\nA: What? I met him just before I took off from Kitty's, he said he was coming. \nB: Kitty's? He sure gets around, doesn't he? \nA: Looks like it. So how did he handle the situation when you confronted him about it? \nB: His excuse was familiar. He said his car died again. \nA: I think that's a bunch of nonsense. It seemed ok to me. \nB: I know. Last week he gave me a lie about being too busy. \nA: Wait, what were you saying earlier about how he handled it? \nB: Oh, right. He just brushed it off like it was no big deal. \nA: Doesn't sound promising. \nB: Well, I think it's the time to pull the plug.", + "total_duration": 48.038004535147394, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Did you enjoy that new movie?", + "original_text": "Did you enjoy that new movie?", + "start_time": 0, + "end_time": 1.6486167800453515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That movie's just a lot of noise, same as Simon.", + "original_text": "That movie's just a lot of noise, same as Simon.", + "start_time": 2.1755929156089455, + "end_time": 4.834277722865181, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_1_B.wav", + "silence_duration": 0.526976135563594, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, what happened, Carole?", + "original_text": "Oh, what happened, Carole?", + "start_time": 5.391916419271869, + "end_time": 6.843163584804749, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_2_A.wav", + "silence_duration": 0.557638696406688, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I had to go by myself, he couldn't", + "original_text": "I had to go by myself, he couldn't [interrupt] make it because he had some last-minute work, or so he said, but I suspect he was just making excuses as usual to avoid spending time with me.", + "start_time": 7.202265119941618, + "end_time": 16.5366868886491, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_3_B.wav", + "silence_duration": 0.3591015351368689, + "is_interrupted": true, + "text_after_interrupt": "make it because he had some last-minute work, or so he said, but I suspect he was just making excuses as usual to avoid spending time with me." + }, + { + "speaker": "A", + "text": "What? I met him just before I took off from Kitty's, he said he was coming.", + "original_text": "What? I met him just before I took off from Kitty's, he said he was coming.", + "start_time": 9.094691423796494, + "end_time": 13.251063305882662, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_4_A.wav", + "silence_duration": 0.4663450271411933, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Kitty's? He sure gets around, doesn't he?", + "original_text": "Kitty's? He sure gets around, doesn't he?", + "start_time": 16.998508217144582, + "end_time": 19.216013886078823, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_5_B.wav", + "silence_duration": 0.4618213284954822, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Looks like it. So how did he handle the situation when you confronted him about it?", + "original_text": "Looks like it. So how did he handle the situation when you confronted him about it?", + "start_time": 19.594917697978342, + "end_time": 24.308568491629135, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_6_A.wav", + "silence_duration": 0.37890381189952044, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "His excuse was familiar. He said his car died again.", + "original_text": "His excuse was familiar. He said his car died again.", + "start_time": 24.635271729558877, + "end_time": 27.944115266973842, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_7_B.wav", + "silence_duration": 0.3267032379297405, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think that's a bunch of nonsense. It seemed ok to me.", + "original_text": "I think that's a bunch of nonsense. It seemed ok to me.", + "start_time": 28.53170438827114, + "end_time": 32.27011708668384, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_8_A.wav", + "silence_duration": 0.5875891212972996, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know. Last week he gave me a lie about being too busy.", + "original_text": "I know. Last week he gave me a lie about being too busy.", + "start_time": 32.64430322695685, + "end_time": 35.895096877750504, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_9_B.wav", + "silence_duration": 0.37418614027301217, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, what were you saying earlier about how he handled it?", + "original_text": "Wait, what were you saying earlier about how he handled it?", + "start_time": 36.30296441682296, + "end_time": 39.774347636777605, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_10_A.wav", + "silence_duration": 0.40786753907245366, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right. He just brushed it off like it was no big deal.", + "original_text": "Oh, right. He just brushed it off like it was no big deal.", + "start_time": 40.25738864680596, + "end_time": 43.647502025490766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_11_B.wav", + "silence_duration": 0.4830410100283483, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Doesn't sound promising.", + "original_text": "Doesn't sound promising.", + "start_time": 44.07257221644539, + "end_time": 45.46576949535695, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_12_A.wav", + "silence_duration": 0.4250701909546175, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I think it's the time to pull the plug.", + "original_text": "Well, I think it's the time to pull the plug.", + "start_time": 45.86695285190096, + "end_time": 48.03801861153815, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--216/temp/line_13_B.wav", + "silence_duration": 0.40118335654401094, + "is_interrupted": false + } + ] + }, + "DialogSum--val--217": { + "original_text": "A: Excuse me, sir? \nB: Yes? \nA: I'm afraid you can't smoke here. \nB: Why not? \nA: Can't you see the notes [interrupt] posted on the walls clearly indicating this area is smoke-free? They're placed at eye level near all major entrances and exits, and there are even some with braille for visually impaired visitors. \nB: Sorry to interrupt, but I honestly can't see it. What does the note say? \nA: It says 'No smoking'. \nB: Oh, sorry, I'm very near sighted. By the way, where is the note exactly?", + "cleaned_text": "A: Excuse me, sir? \nB: Yes? \nA: I'm afraid you can't smoke here. \nB: Why not? \nA:Can't you see the notes posted on the walls clearly indicating this area is smoke-free? They're placed at eye level near all major entrances and exits, and there are even some with braille for visually impaired visitors.\nB: Sorry to interrupt, but I honestly can't see it. What does the note say? \nA: It says 'No smoking'. \nB: Oh, sorry, I'm very near sighted. By the way, where is the note exactly?", + "total_duration": 25.827891156462584, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, sir?", + "original_text": "Excuse me, sir?", + "start_time": 0, + "end_time": 1.172607709750567, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes?", + "original_text": "Yes?", + "start_time": 1.5502055977080849, + "end_time": 2.1423144412455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_1_B.wav", + "silence_duration": 0.3775978879575178, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm afraid you can't smoke here.", + "original_text": "I'm afraid you can't smoke here.", + "start_time": 2.490393327961252, + "end_time": 4.4060395864646535, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_2_A.wav", + "silence_duration": 0.34807888671575193, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why not?", + "original_text": "Why not?", + "start_time": 4.761516366882671, + "end_time": 5.458115006338454, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_3_B.wav", + "silence_duration": 0.35547678041801783, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can't you see the notes", + "original_text": "Can't you see the notes [interrupt] posted on the walls clearly indicating this area is smoke-free? They're placed at eye level near all major entrances and exits, and there are even some with braille for visually impaired visitors.", + "start_time": 5.895052775936269, + "end_time": 19.08398701629908, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_4_A.wav", + "silence_duration": 0.43693776959781494, + "is_interrupted": true, + "text_after_interrupt": "posted on the walls clearly indicating this area is smoke-free? They're placed at eye level near all major entrances and exits, and there are even some with braille for visually impaired visitors." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I honestly can't see it. What does the note say?", + "original_text": "Sorry to interrupt, but I honestly can't see it. What does the note say?", + "start_time": 7.392739850766201, + "end_time": 11.78131127933763, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_5_B.wav", + "silence_duration": 0.5896382530095197, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It says 'No smoking'.", + "original_text": "It says 'No smoking'.", + "start_time": 19.427627029923812, + "end_time": 20.8440442634839, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_6_A.wav", + "silence_duration": 0.34364001362473334, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, sorry, I'm very near sighted. By the way, where is the note exactly?", + "original_text": "Oh, sorry, I'm very near sighted. By the way, where is the note exactly?", + "start_time": 21.288400817536427, + "end_time": 25.827901951323277, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--217/temp/line_7_B.wav", + "silence_duration": 0.44435655405252644, + "is_interrupted": false + } + ] + }, + "DialogSum--val--218": { + "original_text": "A: I'm so hungry. Shall we go eat now, Rick? \nB: Sure. Where do you want to go? Are you in the mood for anything in [interrupt] particular? Maybe something light or hearty, like a salad or a steak? I know you've been trying to eat healthier lately. \nA: How about some dumplings? I just can't get enough of them. \nB: Dumplings again?! Oh, Amy, let's try something new! \nA: Well, what do you have in mind? \nB: How about the Mongolian hot pot? \nA: Oh, it's too spicy for me. Don't you remember last time when I tasted the lamb? It was so spicy my eyes [interrupt] were watering uncontrollably, and I couldn't finish my meal despite drinking three glasses of milk to cool down the burning sensation. \nB: Maybe we can try Yuanyang pot this time. You can choose the non-spicy soup base. \nA: That sounds great. But I was saying, my eyes teared up last time! Do they serve noodles? I am in the mood for some tasty noodles as well. \nB: Yes. The sliced noodles they offer are among the most authentic Shanti cuisines. \nA: Great. Let's go! \nB: Wait a minute. Let me throw on a sweater.", + "cleaned_text": "A: I'm so hungry. Shall we go eat now, Rick? \nB:Sure. Where do you want to go? Are you in the mood for anything in particular? Maybe something light or hearty, like a salad or a steak? I know you've been trying to eat healthier lately.\nA: How about some dumplings? I just can't get enough of them. \nB: Dumplings again?! Oh, Amy, let's try something new! \nA: Well, what do you have in mind? \nB: How about the Mongolian hot pot? \nA:Oh, it's too spicy for me. Don't you remember last time when I tasted the lamb? It was so spicy my eyes were watering uncontrollably, and I couldn't finish my meal despite drinking three glasses of milk to cool down the burning sensation.\nB: Maybe we can try Yuanyang pot this time. You can choose the non-spicy soup base. \nA: That sounds great. But I was saying, my eyes teared up last time! Do they serve noodles? I am in the mood for some tasty noodles as well. \nB: Yes. The sliced noodles they offer are among the most authentic Shanti cuisines. \nA: Great. Let's go! \nB: Wait a minute. Let me throw on a sweater.", + "total_duration": 57.0815873015873, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm so hungry. Shall we go eat now, Rick?", + "original_text": "I'm so hungry. Shall we go eat now, Rick?", + "start_time": 0, + "end_time": 3.7500226757369615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. Where do you want to go? Are you in the mood for anything in", + "original_text": "Sure. Where do you want to go? Are you in the mood for anything in [interrupt] particular? Maybe something light or hearty, like a salad or a steak? I know you've been trying to eat healthier lately.", + "start_time": 4.170838087478321, + "end_time": 13.667799538725486, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_1_B.wav", + "silence_duration": 0.42081541174135983, + "is_interrupted": true, + "text_after_interrupt": "particular? Maybe something light or hearty, like a salad or a steak? I know you've been trying to eat healthier lately." + }, + { + "speaker": "A", + "text": "How about some dumplings? I just can't get enough of them.", + "original_text": "How about some dumplings? I just can't get enough of them.", + "start_time": 7.410021760947709, + "end_time": 10.92784489019941, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_2_A.wav", + "silence_duration": 0.5919485020008171, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Dumplings again?! Oh, Amy, let's try something new!", + "original_text": "Dumplings again?! Oh, Amy, let's try something new!", + "start_time": 14.08448417445563, + "end_time": 17.21917805200665, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_3_B.wav", + "silence_duration": 0.4166846357301447, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, what do you have in mind?", + "original_text": "Well, what do you have in mind?", + "start_time": 17.673761909172796, + "end_time": 19.53135828105488, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_4_A.wav", + "silence_duration": 0.4545838571661449, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How about the Mongolian hot pot?", + "original_text": "How about the Mongolian hot pot?", + "start_time": 19.871926887883827, + "end_time": 22.066212602169543, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_5_B.wav", + "silence_duration": 0.3405686068289462, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, it's too spicy for me. Don't you remember last time when I tasted the lamb? It was so spicy my eyes", + "original_text": "Oh, it's too spicy for me. Don't you remember last time when I tasted the lamb? It was so spicy my eyes [interrupt] were watering uncontrollably, and I couldn't finish my meal despite drinking three glasses of milk to cool down the burning sensation.", + "start_time": 22.562361838856688, + "end_time": 37.1328833808068, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_6_A.wav", + "silence_duration": 0.49614923668714406, + "is_interrupted": true, + "text_after_interrupt": "were watering uncontrollably, and I couldn't finish my meal despite drinking three glasses of milk to cool down the burning sensation." + }, + { + "speaker": "B", + "text": "Maybe we can try Yuanyang pot this time. You can choose the non-spicy soup base.", + "original_text": "Maybe we can try Yuanyang pot this time. You can choose the non-spicy soup base.", + "start_time": 34.01980398960557, + "end_time": 38.919214420444575, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_7_B.wav", + "silence_duration": 0.4930056220984519, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds great. But I was saying, my eyes teared up last time! Do they serve noodles? I am in the mood for some tasty noodles as well.", + "original_text": "That sounds great. But I was saying, my eyes teared up last time! Do they serve noodles? I am in the mood for some tasty noodles as well.", + "start_time": 39.25675456784559, + "end_time": 47.83652781047598, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_8_A.wav", + "silence_duration": 0.3375401474010115, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. The sliced noodles they offer are among the most authentic Shanti cuisines.", + "original_text": "Yes. The sliced noodles they offer are among the most authentic Shanti cuisines.", + "start_time": 48.27158646384992, + "end_time": 52.86913748425808, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_9_B.wav", + "silence_duration": 0.435058653373945, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Great. Let's go!", + "original_text": "Great. Let's go!", + "start_time": 53.378392014697575, + "end_time": 54.597439633745196, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_10_A.wav", + "silence_duration": 0.5092545304394919, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait a minute. Let me throw on a sweater.", + "original_text": "Wait a minute. Let me throw on a sweater.", + "start_time": 55.02663497040564, + "end_time": 57.081600956800195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--218/temp/line_11_B.wav", + "silence_duration": 0.42919533666044374, + "is_interrupted": false + } + ] + }, + "DialogSum--val--219": { + "original_text": "A: Mom! How can I help with the washing up? \nB: You peel the onions and wash them, then chop [interrupt] them into small pieces for the salad and make sure to keep the pieces uniform so they mix well with the other ingredients. \nA: Should I chop them finely or just roughly? \nB: Just roughly is fine. After that, wash the cabbage over there. \nA: OK, got it. By the way, what is your father doing now? \nB: He's reading the newspaper on the couch. And after you finish with the cabbage, can you get your father and brother? \nA: Sure! Oh, how about Daniel? \nB: Staying with Ultraman, of course. You know he likes it very much. \nA: Yeah, he's always been a fan. I'll be careful with the peeler, don't worry. \nB: I will.", + "cleaned_text": "A: Mom! How can I help with the washing up? \nB:You peel the onions and wash them, then chop them into small pieces for the salad and make sure to keep the pieces uniform so they mix well with the other ingredients.\nA: Should I chop them finely or just roughly? \nB: Just roughly is fine. After that, wash the cabbage over there. \nA: OK, got it. By the way, what is your father doing now? \nB: He's reading the newspaper on the couch. And after you finish with the cabbage, can you get your father and brother? \nA: Sure! Oh, how about Daniel? \nB: Staying with Ultraman, of course. You know he likes it very much. \nA: Yeah, he's always been a fan. I'll be careful with the peeler, don't worry. \nB: I will.", + "total_duration": 39.36589569160998, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Mom! How can I help with the washing up?", + "original_text": "Mom! How can I help with the washing up?", + "start_time": 0, + "end_time": 2.7747845804988662, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You peel the onions and wash them, then chop", + "original_text": "You peel the onions and wash them, then chop [interrupt] them into small pieces for the salad and make sure to keep the pieces uniform so they mix well with the other ingredients.", + "start_time": 3.298314493881731, + "end_time": 11.518178439459962, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_1_B.wav", + "silence_duration": 0.5235299133828649, + "is_interrupted": true, + "text_after_interrupt": "them into small pieces for the salad and make sure to keep the pieces uniform so they mix well with the other ingredients." + }, + { + "speaker": "A", + "text": "Should I chop them finely or just roughly?", + "original_text": "Should I chop them finely or just roughly?", + "start_time": 5.794459618598284, + "end_time": 8.093235128802366, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_2_A.wav", + "silence_duration": 0.5617775600030976, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just roughly is fine. After that, wash the cabbage over there.", + "original_text": "Just roughly is fine. After that, wash the cabbage over there.", + "start_time": 12.028892089116702, + "end_time": 15.662814991611032, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_3_B.wav", + "silence_duration": 0.5107136496567397, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, got it. By the way, what is your father doing now?", + "original_text": "OK, got it. By the way, what is your father doing now?", + "start_time": 15.993798704357895, + "end_time": 20.10373067714701, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_4_A.wav", + "silence_duration": 0.33098371274686295, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "He's reading the newspaper on the couch. And after you finish with the cabbage, can you get your father and brother?", + "original_text": "He's reading the newspaper on the couch. And after you finish with the cabbage, can you get your father and brother?", + "start_time": 20.48391820256439, + "end_time": 25.940607544968017, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_5_B.wav", + "silence_duration": 0.3801875254173783, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure! Oh, how about Daniel?", + "original_text": "Sure! Oh, how about Daniel?", + "start_time": 26.527849978860395, + "end_time": 28.96594521695563, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_6_A.wav", + "silence_duration": 0.5872424338923761, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Staying with Ultraman, of course. You know he likes it very much.", + "original_text": "Staying with Ultraman, of course. You know he likes it very much.", + "start_time": 29.394682388700105, + "end_time": 32.993775359221644, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_7_B.wav", + "silence_duration": 0.428737171744474, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, he's always been a fan. I'll be careful with the peeler, don't worry.", + "original_text": "Yeah, he's always been a fan. I'll be careful with the peeler, don't worry.", + "start_time": 33.48682237522934, + "end_time": 38.281743010149974, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_8_A.wav", + "silence_duration": 0.49304701600769163, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I will.", + "original_text": "I will.", + "start_time": 38.750589693822995, + "end_time": 39.36591849200894, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--219/temp/line_9_B.wav", + "silence_duration": 0.46884668367302307, + "is_interrupted": false + } + ] + }, + "DialogSum--val--220": { + "original_text": "A: Oh, Ralph, I heard it is very dangerous traveling in space. Disasters have happened before. If the spaceship were out of [interrupt] control due to a malfunction, it could lead to catastrophic consequences like complete system failure or even collision with space debris that would endanger the entire crew.\nB: You should be optimistic about this. I just want to clarify, what exactly do you mean by \"out of order\"? Are you referring to technical malfunctions or something else?\nA: Yes, I was thinking about technical malfunctions. But as I was saying, things have taken a good turn. You should remember that less than two centuries ago the dangers of train travel seemed similarly terrible.\nB: But is it possible that travelers could be hit by meteors?\nA: It's once in a blue moon.\nB: What do you think is the real danger man faced in space?\nA: The main one is radiation. There are two sorts of radiation man must fear in space. The first is radiation from the sun, and this is particularly dangerous when the sun is very active and explosions are occurring on its surface. The second, less harmful, comes from the so-called Van Allen Belts, which are regions of trapped radiation around Earth.\nB: Sorry, I didn't catch that last part. What are the Van Allen Belts?\nA: The Van Allen Belts are [interrupt] zones of charged particles around Earth, and while they are less harmful, they still pose a significant risk to astronauts during prolonged exposure and can potentially damage sensitive electronic equipment on spacecraft.", + "cleaned_text": "A:Oh, Ralph, I heard it is very dangerous traveling in space. Disasters have happened before. If the spaceship were out of control due to a malfunction, it could lead to catastrophic consequences like complete system failure or even collision with space debris that would endanger the entire crew.\nB: You should be optimistic about this. I just want to clarify, what exactly do you mean by \"out of order\"? Are you referring to technical malfunctions or something else?\nA: Yes, I was thinking about technical malfunctions. But as I was saying, things have taken a good turn. You should remember that less than two centuries ago the dangers of train travel seemed similarly terrible.\nB: But is it possible that travelers could be hit by meteors?\nA: It's once in a blue moon.\nB: What do you think is the real danger man faced in space?\nA: The main one is radiation. There are two sorts of radiation man must fear in space. The first is radiation from the sun, and this is particularly dangerous when the sun is very active and explosions are occurring on its surface. The second, less harmful, comes from the so-called Van Allen Belts, which are regions of trapped radiation around Earth.\nB: Sorry, I didn't catch that last part. What are the Van Allen Belts?\nA:The Van Allen Belts are zones of charged particles around Earth, and while they are less harmful, they still pose a significant risk to astronauts during prolonged exposure and can potentially damage sensitive electronic equipment on spacecraft.", + "total_duration": 81.02997732426304, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Oh, Ralph, I heard it is very dangerous traveling in space. Disasters have happened before. If the spaceship were out of", + "original_text": "Oh, Ralph, I heard it is very dangerous traveling in space. Disasters have happened before. If the spaceship were out of [interrupt] control due to a malfunction, it could lead to catastrophic consequences like complete system failure or even collision with space debris that would endanger the entire crew.", + "start_time": 0, + "end_time": 17.949024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "control due to a malfunction, it could lead to catastrophic consequences like complete system failure or even collision with space debris that would endanger the entire crew." + }, + { + "speaker": "B", + "text": "You should be optimistic about this. I just want to clarify, what exactly do you mean by \"out of order\"? Are you referring to technical malfunctions or something else?", + "original_text": "You should be optimistic about this. I just want to clarify, what exactly do you mean by \"out of order\"? Are you referring to technical malfunctions or something else?", + "start_time": 7.778684807256236, + "end_time": 16.31201814058957, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_1_B.wav", + "silence_duration": 0.3825845617006096, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I was thinking about technical malfunctions. But as I was saying, things have taken a good turn. You should remember that less than two centuries ago the dangers of train travel seemed similarly terrible.", + "original_text": "Yes, I was thinking about technical malfunctions. But as I was saying, things have taken a good turn. You should remember that less than two centuries ago the dangers of train travel seemed similarly terrible.", + "start_time": 18.41602688865036, + "end_time": 31.314711695906595, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_2_A.wav", + "silence_duration": 0.46700194533970385, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But is it possible that travelers could be hit by meteors?", + "original_text": "But is it possible that travelers could be hit by meteors?", + "start_time": 31.700741403044592, + "end_time": 34.51035591551625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_3_B.wav", + "silence_duration": 0.38602970713799617, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's once in a blue moon.", + "original_text": "It's once in a blue moon.", + "start_time": 35.09247011613148, + "end_time": 36.74108689617683, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_4_A.wav", + "silence_duration": 0.5821142006152279, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What do you think is the real danger man faced in space?", + "original_text": "What do you think is the real danger man faced in space?", + "start_time": 37.15230948730527, + "end_time": 39.89226413583135, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_5_B.wav", + "silence_duration": 0.4112225911284356, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The main one is radiation. There are two sorts of radiation man must fear in space. The first is radiation from the sun, and this is particularly dangerous when the sun is very active and explosions are occurring on its surface. The second, less harmful, comes from the so-called Van Allen Belts, which are regions of trapped radiation around Earth.", + "original_text": "The main one is radiation. There are two sorts of radiation man must fear in space. The first is radiation from the sun, and this is particularly dangerous when the sun is very active and explosions are occurring on its surface. The second, less harmful, comes from the so-called Van Allen Belts, which are regions of trapped radiation around Earth.", + "start_time": 40.37080082451991, + "end_time": 61.709939146515374, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_6_A.wav", + "silence_duration": 0.4785366886885636, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry, I didn't catch that last part. What are the Van Allen Belts?", + "original_text": "Sorry, I didn't catch that last part. What are the Van Allen Belts?", + "start_time": 62.15265978775968, + "end_time": 65.75175275828123, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_7_B.wav", + "silence_duration": 0.442720641244308, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The Van Allen Belts are", + "original_text": "The Van Allen Belts are [interrupt] zones of charged particles around Earth, and while they are less harmful, they still pose a significant risk to astronauts during prolonged exposure and can potentially damage sensitive electronic equipment on spacecraft.", + "start_time": 66.18084605900508, + "end_time": 81.0300070567375, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--220/temp/line_8_A.wav", + "silence_duration": 0.429093300723856, + "is_interrupted": true, + "text_after_interrupt": "zones of charged particles around Earth, and while they are less harmful, they still pose a significant risk to astronauts during prolonged exposure and can potentially damage sensitive electronic equipment on spacecraft." + } + ] + }, + "DialogSum--val--221": { + "original_text": "A: What do you think of this coffee table? \nB: It's nice, but it doesn't match the color of our [interrupt] furniture, and I think that might be an issue because we've been trying to maintain a consistent aesthetic throughout the entire living space. \nA: Wait, before you continue—do you think we should prioritize the color or the size of the table? \nB: Good point, but I was going to say it doesn't match the color of our room. I think color is more important because it sets the tone. \nA: Got it. How about this one? \nB: Oh no, this type gets dirty very easily and it's difficult to clean. \nA: Alright, let's look at some others. Look, this one matches our room and it's made of a material that's easy to maintain. \nB: Sorry, I just realized—did we check if it's within our budget? \nA: Oh, I was going to mention it's inexpensive too. And yes, it's well within our budget.", + "cleaned_text": "A: What do you think of this coffee table? \nB:It's nice, but it doesn't match the color of our furniture, and I think that might be an issue because we've been trying to maintain a consistent aesthetic throughout the entire living space.\nA: Wait, before you continue—do you think we should prioritize the color or the size of the table? \nB: Good point, but I was going to say it doesn't match the color of our room. I think color is more important because it sets the tone. \nA: Got it. How about this one? \nB: Oh no, this type gets dirty very easily and it's difficult to clean. \nA: Alright, let's look at some others. Look, this one matches our room and it's made of a material that's easy to maintain. \nB: Sorry, I just realized—did we check if it's within our budget? \nA: Oh, I was going to mention it's inexpensive too. And yes, it's well within our budget.", + "total_duration": 42.32585034013606, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What do you think of this coffee table?", + "original_text": "What do you think of this coffee table?", + "start_time": 0, + "end_time": 1.8692063492063493, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's nice, but it doesn't match the color of our", + "original_text": "It's nice, but it doesn't match the color of our [interrupt] furniture, and I think that might be an issue because we've been trying to maintain a consistent aesthetic throughout the entire living space.", + "start_time": 2.4575913293734017, + "end_time": 11.211514231867733, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_1_B.wav", + "silence_duration": 0.5883849801670524, + "is_interrupted": true, + "text_after_interrupt": "furniture, and I think that might be an issue because we've been trying to maintain a consistent aesthetic throughout the entire living space." + }, + { + "speaker": "A", + "text": "Wait, before you continue—do you think we should prioritize the color or the size of the table?", + "original_text": "Wait, before you continue—do you think we should prioritize the color or the size of the table?", + "start_time": 5.592285206924422, + "end_time": 10.886434866788367, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_2_A.wav", + "silence_duration": 0.31686160604931396, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good point, but I was going to say it doesn't match the color of our room. I think color is more important because it sets the tone.", + "original_text": "Good point, but I was going to say it doesn't match the color of our room. I think color is more important because it sets the tone.", + "start_time": 11.677805136040426, + "end_time": 18.272272256221832, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_3_B.wav", + "silence_duration": 0.46629090417269314, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. How about this one?", + "original_text": "Got it. How about this one?", + "start_time": 18.70068810643014, + "end_time": 20.279645022529913, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_4_A.wav", + "silence_duration": 0.42841585020830586, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh no, this type gets dirty very easily and it's difficult to clean.", + "original_text": "Oh no, this type gets dirty very easily and it's difficult to clean.", + "start_time": 20.84128286310015, + "end_time": 24.85833501729516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_5_B.wav", + "silence_duration": 0.5616378405702368, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Alright, let's look at some others. Look, this one matches our room and it's made of a material that's easy to maintain.", + "original_text": "Alright, let's look at some others. Look, this one matches our room and it's made of a material that's easy to maintain.", + "start_time": 25.160102766622398, + "end_time": 33.054887347121266, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_6_A.wav", + "silence_duration": 0.3017677493272359, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry, I just realized—did we check if it's within our budget?", + "original_text": "Sorry, I just realized—did we check if it's within our budget?", + "start_time": 33.377836737575784, + "end_time": 36.512530615126806, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_7_B.wav", + "silence_duration": 0.3229493904545169, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was going to mention it's inexpensive too. And yes, it's well within our budget.", + "original_text": "Oh, I was going to mention it's inexpensive too. And yes, it's well within our budget.", + "start_time": 36.99691276839833, + "end_time": 42.325892360235066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--221/temp/line_8_A.wav", + "silence_duration": 0.4843821532715219, + "is_interrupted": false + } + ] + }, + "DialogSum--val--222": { + "original_text": "A: Welcome. May I help you? \nB: Yes, I want an eye-shadow. \nA: We have different colours of eye-shadow. May I know what colour you usually [interrupt] prefer so I can suggest something similar or a bit different if you're looking for a change? I'd also love to know if you have any specific finish preferences like matte or shimmer. \nB: Purple. But today, I'm thinking of buying one in a bright colour. \nA: Yes, I see. How do you like this one? \nB: May I have a try? \nA: Certainly. \nB: It's still too dark. Any brighter colours? \nA: Not from this brand, I'm afraid. \nB: What about other brands? \nA: How about this one? \nB: Oh, that's the very thing I need. By the way, you were asking earlier about the colour I usually wear? \nA: Yes, I was just curious if you often go for purples or if you like to experiment with other shades as well.", + "cleaned_text": "A: Welcome. May I help you? \nB: Yes, I want an eye-shadow. \nA:We have different colours of eye-shadow. May I know what colour you usually prefer so I can suggest something similar or a bit different if you're looking for a change? I'd also love to know if you have any specific finish preferences like matte or shimmer.\nB: Purple. But today, I'm thinking of buying one in a bright colour. \nA: Yes, I see. How do you like this one? \nB: May I have a try? \nA: Certainly. \nB: It's still too dark. Any brighter colours? \nA: Not from this brand, I'm afraid. \nB: What about other brands? \nA: How about this one? \nB: Oh, that's the very thing I need. By the way, you were asking earlier about the colour I usually wear? \nA: Yes, I was just curious if you often go for purples or if you like to experiment with other shades as well.", + "total_duration": 46.5043537414966, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Welcome. May I help you?", + "original_text": "Welcome. May I help you?", + "start_time": 0, + "end_time": 1.4512471655328798, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I want an eye-shadow.", + "original_text": "Yes, I want an eye-shadow.", + "start_time": 1.9486918515458418, + "end_time": 3.5973086315911935, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_1_B.wav", + "silence_duration": 0.49744468601296205, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We have different colours of eye-shadow. May I know what colour you usually", + "original_text": "We have different colours of eye-shadow. May I know what colour you usually [interrupt] prefer so I can suggest something similar or a bit different if you're looking for a change? I'd also love to know if you have any specific finish preferences like matte or shimmer.", + "start_time": 3.993896005419123, + "end_time": 19.19135632287944, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_2_A.wav", + "silence_duration": 0.3965873738279292, + "is_interrupted": true, + "text_after_interrupt": "prefer so I can suggest something similar or a bit different if you're looking for a change? I'd also love to know if you have any specific finish preferences like matte or shimmer." + }, + { + "speaker": "B", + "text": "Purple. But today, I'm thinking of buying one in a bright colour.", + "original_text": "Purple. But today, I'm thinking of buying one in a bright colour.", + "start_time": 8.486957229908919, + "end_time": 12.376299633537037, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_3_B.wav", + "silence_duration": 0.47328060687959894, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I see. How do you like this one?", + "original_text": "Yes, I see. How do you like this one?", + "start_time": 19.754590134603376, + "end_time": 23.33046315047639, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_4_A.wav", + "silence_duration": 0.5632338117239375, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "May I have a try?", + "original_text": "May I have a try?", + "start_time": 23.796908962270074, + "end_time": 24.830196944129483, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_5_B.wav", + "silence_duration": 0.4664458117936844, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Certainly.", + "original_text": "Certainly.", + "start_time": 25.359291115572546, + "end_time": 26.17198952827096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_6_A.wav", + "silence_duration": 0.5290941714430648, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's still too dark. Any brighter colours?", + "original_text": "It's still too dark. Any brighter colours?", + "start_time": 26.68555942408985, + "end_time": 28.961114979645405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_7_B.wav", + "silence_duration": 0.5135698958188905, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not from this brand, I'm afraid.", + "original_text": "Not from this brand, I'm afraid.", + "start_time": 29.341575471116776, + "end_time": 31.315271616241493, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_8_A.wav", + "silence_duration": 0.3804604914713697, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What about other brands?", + "original_text": "What about other brands?", + "start_time": 31.902969398387523, + "end_time": 33.098797062786616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_9_B.wav", + "silence_duration": 0.5876977821460302, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about this one?", + "original_text": "How about this one?", + "start_time": 33.49866687048636, + "end_time": 34.69449453488545, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_10_A.wav", + "silence_duration": 0.3998698076997465, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, that's the very thing I need. By the way, you were asking earlier about the colour I usually wear?", + "original_text": "Oh, that's the very thing I need. By the way, you were asking earlier about the colour I usually wear?", + "start_time": 35.16282033427819, + "end_time": 39.45851194425551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_11_B.wav", + "silence_duration": 0.4683257993927355, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I was just curious if you often go for purples or if you like to experiment with other shades as well.", + "original_text": "Yes, I was just curious if you often go for purples or if you like to experiment with other shades as well.", + "start_time": 39.90991832048933, + "end_time": 46.50438544067074, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--222/temp/line_12_A.wav", + "silence_duration": 0.4514063762338226, + "is_interrupted": false + } + ] + }, + "DialogSum--val--223": { + "original_text": "A: I was really glad to hear about your award, congratulations! \nB: Thanks. Actually, I was really surprised. I mean there were a lot of qualified [interrupt] candidates who could have won, including several senior colleagues with decades of experience and groundbreaking contributions to our field. I didn't expect it to be me. \nA: Sorry to jump in, but I just wanted to say—you've been working there for so long with so much sacrifice. You definitely deserve it. \nB: Thanks a lot. I appreciate that. But I was about to say, there were a lot of qualified people out there. Anyway, I expect to see your name nominated pretty soon too. You've been doing some great work.", + "cleaned_text": "A: I was really glad to hear about your award, congratulations! \nB:Thanks. Actually, I was really surprised. I mean there were a lot of qualified candidates who could have won, including several senior colleagues with decades of experience and groundbreaking contributions to our field. I didn't expect it to be me.\nA: Sorry to jump in, but I just wanted to say—you've been working there for so long with so much sacrifice. You definitely deserve it. \nB: Thanks a lot. I appreciate that. But I was about to say, there were a lot of qualified people out there. Anyway, I expect to see your name nominated pretty soon too. You've been doing some great work.", + "total_duration": 27.55573696145125, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--223/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--223/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--223/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I was really glad to hear about your award, congratulations!", + "original_text": "I was really glad to hear about your award, congratulations!", + "start_time": 0, + "end_time": 3.4946031746031747, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--223/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks. Actually, I was really surprised. I mean there were a lot of qualified", + "original_text": "Thanks. Actually, I was really surprised. I mean there were a lot of qualified [interrupt] candidates who could have won, including several senior colleagues with decades of experience and groundbreaking contributions to our field. I didn't expect it to be me.", + "start_time": 4.011476268397157, + "end_time": 17.13075064481439, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--223/temp/line_1_B.wav", + "silence_duration": 0.5168730937939824, + "is_interrupted": true, + "text_after_interrupt": "candidates who could have won, including several senior colleagues with decades of experience and groundbreaking contributions to our field. I didn't expect it to be me." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I just wanted to say—you've been working there for so long with so much sacrifice. You definitely deserve it.", + "original_text": "Sorry to jump in, but I just wanted to say—you've been working there for so long with so much sacrifice. You definitely deserve it.", + "start_time": 8.365217764995798, + "end_time": 16.004582844360876, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--223/temp/line_2_A.wav", + "silence_duration": 0.3952942849126433, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks a lot. I appreciate that. But I was about to say, there were a lot of qualified people out there. Anyway, I expect to see your name nominated pretty soon too. You've been doing some great work.", + "original_text": "Thanks a lot. I appreciate that. But I was about to say, there were a lot of qualified people out there. Anyway, I expect to see your name nominated pretty soon too. You've been doing some great work.", + "start_time": 17.58279503572008, + "end_time": 27.555765557262028, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--223/temp/line_3_B.wav", + "silence_duration": 0.4520443909056866, + "is_interrupted": false + } + ] + }, + "DialogSum--val--224": { + "original_text": "A: I haven't received my credit card bill yet.\nB: Which credit card are you speaking of?\nA: My Master Card.\nB: We sent that bill out a couple of [interrupt] weeks ago along with all the other monthly statements, so it definitely should have arrived by now unless there was some unexpected delay in the mail delivery system.\nA: Sorry to jump in, but I really haven't seen anything. What am I going to do since I haven't received the bill?\nB: If you haven't gotten it yet, then you should probably take that up with your post office.\nA: I see. But wait, you mentioned you sent the bill out a couple of weeks ago. Could I get an extension on my bill if it does happen to be the post office's fault?\nB: If that's the case, you will need to provide proof of their mistake.\nA: Got it. Thanks for everything.\nB: Don't mention it. Call back if you have any more questions.", + "cleaned_text": "A: I haven't received my credit card bill yet.\nB: Which credit card are you speaking of?\nA: My Master Card.\nB:We sent that bill out a couple of weeks ago along with all the other monthly statements, so it definitely should have arrived by now unless there was some unexpected delay in the mail delivery system.\nA: Sorry to jump in, but I really haven't seen anything. What am I going to do since I haven't received the bill?\nB: If you haven't gotten it yet, then you should probably take that up with your post office.\nA: I see. But wait, you mentioned you sent the bill out a couple of weeks ago. Could I get an extension on my bill if it does happen to be the post office's fault?\nB: If that's the case, you will need to provide proof of their mistake.\nA: Got it. Thanks for everything.\nB: Don't mention it. Call back if you have any more questions.", + "total_duration": 40.39927437641723, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I haven't received my credit card bill yet.", + "original_text": "I haven't received my credit card bill yet.", + "start_time": 0, + "end_time": 2.4380952380952383, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Which credit card are you speaking of?", + "original_text": "Which credit card are you speaking of?", + "start_time": 2.808903593725974, + "end_time": 4.6432800109595345, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_1_B.wav", + "silence_duration": 0.3708083556307357, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "My Master Card.", + "original_text": "My Master Card.", + "start_time": 4.977336397407327, + "end_time": 6.207993993779208, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_2_A.wav", + "silence_duration": 0.33405638644779234, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We sent that bill out a couple of", + "original_text": "We sent that bill out a couple of [interrupt] weeks ago along with all the other monthly statements, so it definitely should have arrived by now unless there was some unexpected delay in the mail delivery system.", + "start_time": 6.652083232879475, + "end_time": 16.26514445736927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_3_B.wav", + "silence_duration": 0.4440892391002663, + "is_interrupted": true, + "text_after_interrupt": "weeks ago along with all the other monthly statements, so it definitely should have arrived by now unless there was some unexpected delay in the mail delivery system." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I really haven't seen anything. What am I going to do since I haven't received the bill?", + "original_text": "Sorry to jump in, but I really haven't seen anything. What am I going to do since I haven't received the bill?", + "start_time": 8.300700012924827, + "end_time": 14.837117246484917, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_4_A.wav", + "silence_duration": 0.3419282711511233, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If you haven't gotten it yet, then you should probably take that up with your post office.", + "original_text": "If you haven't gotten it yet, then you should probably take that up with your post office.", + "start_time": 16.756437423016923, + "end_time": 20.425190257484044, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_5_B.wav", + "silence_duration": 0.49129296564765335, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I see. But wait, you mentioned you sent the bill out a couple of weeks ago. Could I get an extension on my bill if it does happen to be the post office's fault?", + "original_text": "I see. But wait, you mentioned you sent the bill out a couple of weeks ago. Could I get an extension on my bill if it does happen to be the post office's fault?", + "start_time": 20.880141068075883, + "end_time": 30.818281657645045, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_6_A.wav", + "silence_duration": 0.45495081059183773, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If that's the case, you will need to provide proof of their mistake.", + "original_text": "If that's the case, you will need to provide proof of their mistake.", + "start_time": 31.230141519558067, + "end_time": 34.283565555839246, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_7_B.wav", + "silence_duration": 0.41185986191302343, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. Thanks for everything.", + "original_text": "Got it. Thanks for everything.", + "start_time": 34.84227415877587, + "end_time": 37.210709532925534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_8_A.wav", + "silence_duration": 0.5587086029366262, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't mention it. Call back if you have any more questions.", + "original_text": "Don't mention it. Call back if you have any more questions.", + "start_time": 37.5432320137239, + "end_time": 40.39928643549261, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--224/temp/line_9_B.wav", + "silence_duration": 0.3325224807983694, + "is_interrupted": false + } + ] + }, + "DialogSum--val--225": { + "original_text": "A: Excuse me. I want to pay the bill.\nB: Please wait till your name is called. OK. Your bill includes the doctor's fee and the cost for a 3-day supply of medicine. It comes to one hundred yuan.\nA: Here you are.\nB: Good. Here is the receipt. The dispensary is over there. . . By the way, will this be covered by your insurance from [interrupt] work, or do you have a different plan that might offer better coverage? You might want to check with your HR department about the specific benefits included in your employment package.\nA: Sorry, I just realized I have private medical insurance. Will that make a difference?\nB: In that case, I'll give you a certificate, so you can get it reimbursed.\nA: Thanks a lot. Oh, you were asking something about insurance earlier—what was it?\nB: I was just asking if this will be covered by your insurance from work. Don't lose this receipt, because insurance companies are very difficult about helping when they don't have the right paperwork.", + "cleaned_text": "A: Excuse me. I want to pay the bill.\nB: Please wait till your name is called. OK. Your bill includes the doctor's fee and the cost for a 3-day supply of medicine. It comes to one hundred yuan.\nA: Here you are.\nB:Good. Here is the receipt. The dispensary is over there. . . By the way, will this be covered by your insurance from work, or do you have a different plan that might offer better coverage? You might want to check with your HR department about the specific benefits included in your employment package.\nA: Sorry, I just realized I have private medical insurance. Will that make a difference?\nB: In that case, I'll give you a certificate, so you can get it reimbursed.\nA: Thanks a lot. Oh, you were asking something about insurance earlier—what was it?\nB: I was just asking if this will be covered by your insurance from work. Don't lose this receipt, because insurance companies are very difficult about helping when they don't have the right paperwork.", + "total_duration": 46.54403628117914, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. I want to pay the bill.", + "original_text": "Excuse me. I want to pay the bill.", + "start_time": 0, + "end_time": 2.2755555555555556, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Please wait till your name is called. OK. Your bill includes the doctor's fee and the cost for a 3-day supply of medicine. It comes to one hundred yuan.", + "original_text": "Please wait till your name is called. OK. Your bill includes the doctor's fee and the cost for a 3-day supply of medicine. It comes to one hundred yuan.", + "start_time": 2.7497116735373117, + "end_time": 11.782274031813955, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_1_B.wav", + "silence_duration": 0.47415611798175605, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Here you are.", + "original_text": "Here you are.", + "start_time": 12.263319837907199, + "end_time": 13.192118023848241, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_2_A.wav", + "silence_duration": 0.4810458060932442, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good. Here is the receipt. The dispensary is over there. . . By the way, will this be covered by your insurance from", + "original_text": "Good. Here is the receipt. The dispensary is over there. . . By the way, will this be covered by your insurance from [interrupt] work, or do you have a different plan that might offer better coverage? You might want to check with your HR department about the specific benefits included in your employment package.", + "start_time": 13.625539099257482, + "end_time": 28.21928059585612, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_3_B.wav", + "silence_duration": 0.4334210754092409, + "is_interrupted": true, + "text_after_interrupt": "work, or do you have a different plan that might offer better coverage? You might want to check with your HR department about the specific benefits included in your employment package." + }, + { + "speaker": "A", + "text": "Sorry, I just realized I have private medical insurance. Will that make a difference?", + "original_text": "Sorry, I just realized I have private medical insurance. Will that make a difference?", + "start_time": 19.19832821490374, + "end_time": 24.655017557307367, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_4_A.wav", + "silence_duration": 0.5842736085790249, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "In that case, I'll give you a certificate, so you can get it reimbursed.", + "original_text": "In that case, I'll give you a certificate, so you can get it reimbursed.", + "start_time": 28.809927797584294, + "end_time": 32.08394140302647, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_5_B.wav", + "silence_duration": 0.590647201728175, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks a lot. Oh, you were asking something about insurance earlier—what was it?", + "original_text": "Thanks a lot. Oh, you were asking something about insurance earlier—what was it?", + "start_time": 32.420558452032715, + "end_time": 37.27352897357466, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_6_A.wav", + "silence_duration": 0.336617049006245, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was just asking if this will be covered by your insurance from work. Don't lose this receipt, because insurance companies are very difficult about helping when they don't have the right paperwork.", + "original_text": "I was just asking if this will be covered by your insurance from work. Don't lose this receipt, because insurance companies are very difficult about helping when they don't have the right paperwork.", + "start_time": 37.75531426726654, + "end_time": 46.54406710173366, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--225/temp/line_7_B.wav", + "silence_duration": 0.4817852936918747, + "is_interrupted": false + } + ] + }, + "DialogSum--val--226": { + "original_text": "A: I finally found an apartment that I want to rent.\nB: Where did you see it?\nA: I saw it in this ad for apartments in today's [interrupt] newspaper, and it caught my eye right away because the listing had such detailed photos and a floor plan that perfectly matched what I've been looking for.\nB: Wait, you found an apartment in the ads? I thought those were usually overpriced or already taken.\nA: I really did, but what's so great about it is that it's really affordable and in a great neighborhood with easy access to public transportation and local amenities.\nB: Tell me about the apartment.\nA: Well, most importantly, the apartment is beautiful with hardwood floors throughout, large windows that let in plenty of natural light, and a modern kitchen with stainless steel appliances.\nB: How much is the rent for the apartment?\nA: The rent is $725 each month which includes water and trash service, making it an even better deal than I initially thought.\nB: That's pretty cheap for out here. But you mentioned you saw it in today's newspaper. Did you check if it's still available?\nA: Yes, I called right after I saw the ad to make sure it was still on the market. And when I found out how much the rent was, I knew I had to act fast before someone else snatched it up.\nB: Congratulations on the new apartment.", + "cleaned_text": "A: I finally found an apartment that I want to rent.\nB: Where did you see it?\nA:I saw it in this ad for apartments in today's newspaper, and it caught my eye right away because the listing had such detailed photos and a floor plan that perfectly matched what I've been looking for.\nB: Wait, you found an apartment in the ads? I thought those were usually overpriced or already taken.\nA: I really did, but what's so great about it is that it's really affordable and in a great neighborhood with easy access to public transportation and local amenities.\nB: Tell me about the apartment.\nA: Well, most importantly, the apartment is beautiful with hardwood floors throughout, large windows that let in plenty of natural light, and a modern kitchen with stainless steel appliances.\nB: How much is the rent for the apartment?\nA: The rent is $725 each month which includes water and trash service, making it an even better deal than I initially thought.\nB: That's pretty cheap for out here. But you mentioned you saw it in today's newspaper. Did you check if it's still available?\nA: Yes, I called right after I saw the ad to make sure it was still on the market. And when I found out how much the rent was, I knew I had to act fast before someone else snatched it up.\nB: Congratulations on the new apartment.", + "total_duration": 72.43269841269841, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I finally found an apartment that I want to rent.", + "original_text": "I finally found an apartment that I want to rent.", + "start_time": 0, + "end_time": 2.995374149659864, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Where did you see it?", + "original_text": "Where did you see it?", + "start_time": 3.3208433933660224, + "end_time": 4.4586211711438, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_1_B.wav", + "silence_duration": 0.3254692437061584, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I saw it in this ad for apartments in today's", + "original_text": "I saw it in this ad for apartments in today's [interrupt] newspaper, and it caught my eye right away because the listing had such detailed photos and a floor plan that perfectly matched what I've been looking for.", + "start_time": 4.900528055724623, + "end_time": 16.789144835769974, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_2_A.wav", + "silence_duration": 0.44190688458082183, + "is_interrupted": true, + "text_after_interrupt": "newspaper, and it caught my eye right away because the listing had such detailed photos and a floor plan that perfectly matched what I've been looking for." + }, + { + "speaker": "B", + "text": "Wait, you found an apartment in the ads? I thought those were usually overpriced or already taken.", + "original_text": "Wait, you found an apartment in the ads? I thought those were usually overpriced or already taken.", + "start_time": 7.895902205384487, + "end_time": 13.770550731461583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_3_B.wav", + "silence_duration": 0.43585750207766644, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I really did, but what's so great about it is that it's really affordable and in a great neighborhood with easy access to public transportation and local amenities.", + "original_text": "I really did, but what's so great about it is that it's really affordable and in a great neighborhood with easy access to public transportation and local amenities.", + "start_time": 17.16529292438434, + "end_time": 28.276041223704066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_4_A.wav", + "silence_duration": 0.37614808861436555, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Tell me about the apartment.", + "original_text": "Tell me about the apartment.", + "start_time": 28.76703048766026, + "end_time": 29.9164182427623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_5_B.wav", + "silence_duration": 0.49098926395619497, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, most importantly, the apartment is beautiful with hardwood floors throughout, large windows that let in plenty of natural light, and a modern kitchen with stainless steel appliances.", + "original_text": "Well, most importantly, the apartment is beautiful with hardwood floors throughout, large windows that let in plenty of natural light, and a modern kitchen with stainless steel appliances.", + "start_time": 30.28992638972083, + "end_time": 41.36584475706777, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_6_A.wav", + "silence_duration": 0.37350814695852946, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How much is the rent for the apartment?", + "original_text": "How much is the rent for the apartment?", + "start_time": 41.74979451128459, + "end_time": 43.468071155275524, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_7_B.wav", + "silence_duration": 0.3839497542168222, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The rent is $725 each month which includes water and trash service, making it an even better deal than I initially thought.", + "original_text": "The rent is $725 each month which includes water and trash service, making it an even better deal than I initially thought.", + "start_time": 43.933238632139116, + "end_time": 53.20961051422528, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_8_A.wav", + "silence_duration": 0.46516747686359095, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's pretty cheap for out here. But you mentioned you saw it in today's newspaper. Did you check if it's still available?", + "original_text": "That's pretty cheap for out here. But you mentioned you saw it in today's newspaper. Did you check if it's still available?", + "start_time": 53.541598064043846, + "end_time": 59.30014681687831, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_9_B.wav", + "silence_duration": 0.33198754981856654, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I called right after I saw the ad to make sure it was still on the market. And when I found out how much the rent was, I knew I had to act fast before someone else snatched it up.", + "original_text": "Yes, I called right after I saw the ad to make sure it was still on the market. And when I found out how much the rent was, I knew I had to act fast before someone else snatched it up.", + "start_time": 59.712763593221695, + "end_time": 70.10369329843712, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_10_A.wav", + "silence_duration": 0.41261677634338223, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Congratulations on the new apartment.", + "original_text": "Congratulations on the new apartment.", + "start_time": 70.48224176618781, + "end_time": 72.432717956664, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--226/temp/line_11_B.wav", + "silence_duration": 0.3785484677506894, + "is_interrupted": false + } + ] + }, + "DialogSum--val--227": { + "original_text": "A: May I help you? \nB: Yes. I'd like to send this parcel to Changchun. \nA: How do you want to send it? \nB: I guess I'll send it by [interrupt] airmail because it's faster and more reliable for international shipping, though I should probably check the exact delivery times and insurance options available for this particular destination. \nA: Sorry to interrupt, but before you decide, do you know the cost difference between airmail and surface mail? It might be worth considering depending on your budget and urgency. \nB: Oh, that's a good point. I think I'll still go with airmail since it's faster. \nA: Alright. Is there anything valuable in the parcel? \nB: No, there are only some vases. \nA: They are fragile articles. They must be packed in a proper strong box. Your light cardboard box won't provide enough protection during transit, especially if it's going by airmail. \nB: Oh, I see. Do you have any boxes for sale that would work? \nA: Yes, we do. Have you got the forms filled out? \nB: Not yet. I was just about to ask if the box I choose will be alright this time. \nA: Yes, it will be. Now, fill in two customs declarations and one despatch note in English. You'll have to take your parcel to the next window for examination when you have completed the forms. \nB: OK, thanks for the help.", + "cleaned_text": "A: May I help you? \nB: Yes. I'd like to send this parcel to Changchun. \nA: How do you want to send it? \nB:I guess I'll send it by airmail because it's faster and more reliable for international shipping, though I should probably check the exact delivery times and insurance options available for this particular destination.\nA: Sorry to interrupt, but before you decide, do you know the cost difference between airmail and surface mail? It might be worth considering depending on your budget and urgency. \nB: Oh, that's a good point. I think I'll still go with airmail since it's faster. \nA: Alright. Is there anything valuable in the parcel? \nB: No, there are only some vases. \nA: They are fragile articles. They must be packed in a proper strong box. Your light cardboard box won't provide enough protection during transit, especially if it's going by airmail. \nB: Oh, I see. Do you have any boxes for sale that would work? \nA: Yes, we do. Have you got the forms filled out? \nB: Not yet. I was just about to ask if the box I choose will be alright this time. \nA: Yes, it will be. Now, fill in two customs declarations and one despatch note in English. You'll have to take your parcel to the next window for examination when you have completed the forms. \nB: OK, thanks for the help.", + "total_duration": 66.19256235827665, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I help you?", + "original_text": "May I help you?", + "start_time": 0, + "end_time": 0.9520181405895691, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. I'd like to send this parcel to Changchun.", + "original_text": "Yes. I'd like to send this parcel to Changchun.", + "start_time": 1.4978828516997065, + "end_time": 3.9475880671192076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_1_B.wav", + "silence_duration": 0.5458647111101372, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How do you want to send it?", + "original_text": "How do you want to send it?", + "start_time": 4.358009739711503, + "end_time": 5.7512070186230675, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_2_A.wav", + "silence_duration": 0.41042167259229495, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I guess I'll send it by", + "original_text": "I guess I'll send it by [interrupt] airmail because it's faster and more reliable for international shipping, though I should probably check the exact delivery times and insurance options available for this particular destination.", + "start_time": 6.302870415465749, + "end_time": 16.577700347438537, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_3_B.wav", + "silence_duration": 0.5516633968426818, + "is_interrupted": true, + "text_after_interrupt": "airmail because it's faster and more reliable for international shipping, though I should probably check the exact delivery times and insurance options available for this particular destination." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but before you decide, do you know the cost difference between airmail and surface mail? It might be worth considering depending on your budget and urgency.", + "original_text": "Sorry to interrupt, but before you decide, do you know the cost difference between airmail and surface mail? It might be worth considering depending on your budget and urgency.", + "start_time": 7.556747966486157, + "end_time": 18.028947512971417, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_4_A.wav", + "silence_duration": 0.5911627159092466, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, that's a good point. I think I'll still go with airmail since it's faster.", + "original_text": "Oh, that's a good point. I think I'll still go with airmail since it's faster.", + "start_time": 18.62331658944173, + "end_time": 22.617148788988214, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_5_B.wav", + "silence_duration": 0.5943690764703107, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Alright. Is there anything valuable in the parcel?", + "original_text": "Alright. Is there anything valuable in the parcel?", + "start_time": 23.010749357420487, + "end_time": 25.982903552431825, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_6_A.wav", + "silence_duration": 0.3936005684322728, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, there are only some vases.", + "original_text": "No, there are only some vases.", + "start_time": 26.493597853869765, + "end_time": 28.409244112373166, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_7_B.wav", + "silence_duration": 0.5106943014379404, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They are fragile articles. They must be packed in a proper strong box. Your light cardboard box won't provide enough protection during transit, especially if it's going by airmail.", + "original_text": "They are fragile articles. They must be packed in a proper strong box. Your light cardboard box won't provide enough protection during transit, especially if it's going by airmail.", + "start_time": 28.769805585471588, + "end_time": 39.54386454238769, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_8_A.wav", + "silence_duration": 0.36056147309842, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I see. Do you have any boxes for sale that would work?", + "original_text": "Oh, I see. Do you have any boxes for sale that would work?", + "start_time": 40.06412644040458, + "end_time": 43.222040272604126, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_9_B.wav", + "silence_duration": 0.5202618980168893, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, we do. Have you got the forms filled out?", + "original_text": "Yes, we do. Have you got the forms filled out?", + "start_time": 43.67648861420573, + "end_time": 46.72991265048691, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_10_A.wav", + "silence_duration": 0.45444834160160263, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not yet. I was just about to ask if the box I choose will be alright this time.", + "original_text": "Not yet. I was just about to ask if the box I choose will be alright this time.", + "start_time": 47.09994704761179, + "end_time": 52.359266775502945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_11_B.wav", + "silence_duration": 0.3700343971248835, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it will be. Now, fill in two customs declarations and one despatch note in English. You'll have to take your parcel to the next window for examination when you have completed the forms.", + "original_text": "Yes, it will be. Now, fill in two customs declarations and one despatch note in English. You'll have to take your parcel to the next window for examination when you have completed the forms.", + "start_time": 52.84798704372094, + "end_time": 64.28381470812003, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_12_A.wav", + "silence_duration": 0.4887202682179964, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK, thanks for the help.", + "original_text": "OK, thanks for the help.", + "start_time": 64.71811840599435, + "end_time": 66.19258552617575, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--227/temp/line_13_B.wav", + "silence_duration": 0.434303697874311, + "is_interrupted": false + } + ] + }, + "DialogSum--val--228": { + "original_text": "A: What about the working hours? \nB: Working conditions are very relaxed. You may work whatever hours you want, provided you get your job done [interrupt] and meet your deadlines without compromising on the quality of your work, which includes thorough documentation, peer reviews, and maintaining our company's high standards for customer satisfaction. \nA: Sorry to cut in, but does that mean there's no strict monitoring of when we clock in and out? \nB: Exactly, it's more about the results you deliver. But I was going to mention that flexibility also extends to the work location. Would you mind changing the position or working place you've applied for? \nA: Oh, I see. But before we get to that, you were saying something about getting the job done properly—could you clarify what you meant by that?", + "cleaned_text": "A: What about the working hours? \nB:Working conditions are very relaxed. You may work whatever hours you want, provided you get your job done and meet your deadlines without compromising on the quality of your work, which includes thorough documentation, peer reviews, and maintaining our company's high standards for customer satisfaction.\nA: Sorry to cut in, but does that mean there's no strict monitoring of when we clock in and out? \nB: Exactly, it's more about the results you deliver. But I was going to mention that flexibility also extends to the work location. Would you mind changing the position or working place you've applied for? \nA: Oh, I see. But before we get to that, you were saying something about getting the job done properly—could you clarify what you meant by that?", + "total_duration": 38.02009070294785, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What about the working hours?", + "original_text": "What about the working hours?", + "start_time": 0, + "end_time": 1.7763265306122449, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Working conditions are very relaxed. You may work whatever hours you want, provided you get your job done", + "original_text": "Working conditions are very relaxed. You may work whatever hours you want, provided you get your job done [interrupt] and meet your deadlines without compromising on the quality of your work, which includes thorough documentation, peer reviews, and maintaining our company's high standards for customer satisfaction.", + "start_time": 2.2597828384453864, + "end_time": 18.17706175001001, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/temp/line_1_B.wav", + "silence_duration": 0.4834563078331414, + "is_interrupted": true, + "text_after_interrupt": "and meet your deadlines without compromising on the quality of your work, which includes thorough documentation, peer reviews, and maintaining our company's high standards for customer satisfaction." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but does that mean there's no strict monitoring of when we clock in and out?", + "original_text": "Sorry to cut in, but does that mean there's no strict monitoring of when we clock in and out?", + "start_time": 7.913841795361487, + "end_time": 14.392209142300263, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/temp/line_2_A.wav", + "silence_duration": 0.3594707826422153, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Exactly, it's more about the results you deliver. But I was going to mention that flexibility also extends to the work location. Would you mind changing the position or working place you've applied for?", + "original_text": "Exactly, it's more about the results you deliver. But I was going to mention that flexibility also extends to the work location. Would you mind changing the position or working place you've applied for?", + "start_time": 18.68809867638556, + "end_time": 29.07902838160098, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/temp/line_3_B.wav", + "silence_duration": 0.5110369263755479, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. But before we get to that, you were saying something about getting the job done properly—could you clarify what you meant by that?", + "original_text": "Oh, I see. But before we get to that, you were saying something about getting the job done properly—could you clarify what you meant by that?", + "start_time": 29.48679731614892, + "end_time": 38.020130649482255, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--228/temp/line_4_A.wav", + "silence_duration": 0.4077689345479374, + "is_interrupted": false + } + ] + }, + "DialogSum--val--229": { + "original_text": "A: An exhibition of Picasso's paintings is being held. Do you want to go with me? \nB: How can I miss it! But with the bus drivers on strike and taxis so expensive, we have no choice but to [interrupt] take the subway, even though it's going to be crowded during rush hour and we'll probably have to stand the whole way there. \nA: Oh, speaking of the strike, do you know how long it's expected to last? Because if it goes on for much longer, it might affect other plans too. \nB: I heard it might last a week, but back to the subway—if only we had a car, it would make things so much easier. We could even stop for coffee on the way to the exhibition without worrying about parking or schedules.", + "cleaned_text": "A: An exhibition of Picasso's paintings is being held. Do you want to go with me? \nB:How can I miss it! But with the bus drivers on strike and taxis so expensive, we have no choice but to take the subway, even though it's going to be crowded during rush hour and we'll probably have to stand the whole way there.\nA: Oh, speaking of the strike, do you know how long it's expected to last? Because if it goes on for much longer, it might affect other plans too. \nB: I heard it might last a week, but back to the subway—if only we had a car, it would make things so much easier. We could even stop for coffee on the way to the exhibition without worrying about parking or schedules.", + "total_duration": 30.92453514739229, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--229/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--229/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--229/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "An exhibition of Picasso's paintings is being held. Do you want to go with me?", + "original_text": "An exhibition of Picasso's paintings is being held. Do you want to go with me?", + "start_time": 0, + "end_time": 5.038730158730159, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--229/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How can I miss it! But with the bus drivers on strike and taxis so expensive, we have no choice but to", + "original_text": "How can I miss it! But with the bus drivers on strike and taxis so expensive, we have no choice but to [interrupt] take the subway, even though it's going to be crowded during rush hour and we'll probably have to stand the whole way there.", + "start_time": 5.487234801865484, + "end_time": 16.78374273837342, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--229/temp/line_1_B.wav", + "silence_duration": 0.4485046431353254, + "is_interrupted": true, + "text_after_interrupt": "take the subway, even though it's going to be crowded during rush hour and we'll probably have to stand the whole way there." + }, + { + "speaker": "A", + "text": "Oh, speaking of the strike, do you know how long it's expected to last? Because if it goes on for much longer, it might affect other plans too.", + "original_text": "Oh, speaking of the strike, do you know how long it's expected to last? Because if it goes on for much longer, it might affect other plans too.", + "start_time": 10.885874257647796, + "end_time": 20.255125958328065, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--229/temp/line_2_A.wav", + "silence_duration": 0.37850214449249164, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I heard it might last a week, but back to the subway—if only we had a car, it would make things so much easier. We could even stop for coffee on the way to the exhibition without worrying about parking or schedules.", + "original_text": "I heard it might last a week, but back to the subway—if only we had a car, it would make things so much easier. We could even stop for coffee on the way to the exhibition without worrying about parking or schedules.", + "start_time": 20.614887678327648, + "end_time": 30.924547542273224, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--229/temp/line_3_B.wav", + "silence_duration": 0.3597617199995819, + "is_interrupted": false + } + ] + }, + "DialogSum--val--230": { + "original_text": "A: The day I turned thirty, I turned on the computer. I went into the over-thirty room for a joke. And he was there. And we started [interrupt] chatting about random things, just to kill some time, but surprisingly we ended up talking for hours about everything from favorite movies to childhood memories. \nB: Wait, who is \"he\"? Is it someone you knew before or just a random person in the chat room? \nA: Just a random person in the chat room. We started chatting about books, music, how much we both love New York. Nothing really [interrupt] deep or personal, just light conversation that somehow felt refreshing and comforting during that particular phase of my life. \nB: Speaking of New York, have you ever met up with him in person, considering you both love the city? \nA: No, we never met in person. But I was going to say that our conversations weren't really meaningful, just a good way to pass time. \nB: Got it, so it was more of a casual connection than anything serious.", + "cleaned_text": "A:The day I turned thirty, I turned on the computer. I went into the over-thirty room for a joke. And he was there. And we started chatting about random things, just to kill some time, but surprisingly we ended up talking for hours about everything from favorite movies to childhood memories.\nB: Wait, who is \"he\"? Is it someone you knew before or just a random person in the chat room? \nA:Just a random person in the chat room. We started chatting about books, music, how much we both love New York. Nothing really deep or personal, just light conversation that somehow felt refreshing and comforting during that particular phase of my life.\nB: Speaking of New York, have you ever met up with him in person, considering you both love the city? \nA: No, we never met in person. But I was going to say that our conversations weren't really meaningful, just a good way to pass time. \nB: Got it, so it was more of a casual connection than anything serious.", + "total_duration": 50.571020408163264, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The day I turned thirty, I turned on the computer. I went into the over-thirty room for a joke. And he was there. And we started", + "original_text": "The day I turned thirty, I turned on the computer. I went into the over-thirty room for a joke. And he was there. And we started [interrupt] chatting about random things, just to kill some time, but surprisingly we ended up talking for hours about everything from favorite movies to childhood memories.", + "start_time": 0, + "end_time": 16.973786848072564, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "chatting about random things, just to kill some time, but surprisingly we ended up talking for hours about everything from favorite movies to childhood memories." + }, + { + "speaker": "B", + "text": "Wait, who is \"he\"? Is it someone you knew before or just a random person in the chat room?", + "original_text": "Wait, who is \"he\"? Is it someone you knew before or just a random person in the chat room?", + "start_time": 7.534875283446712, + "end_time": 12.933514739229025, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/temp/line_1_B.wav", + "silence_duration": 0.5493736561572191, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Just a random person in the chat room. We started chatting about books, music, how much we both love New York. Nothing really", + "original_text": "Just a random person in the chat room. We started chatting about books, music, how much we both love New York. Nothing really [interrupt] deep or personal, just light conversation that somehow felt refreshing and comforting during that particular phase of my life.", + "start_time": 17.5066623324259, + "end_time": 32.8666623324259, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/temp/line_2_A.wav", + "silence_duration": 0.5328754843533352, + "is_interrupted": true, + "text_after_interrupt": "deep or personal, just light conversation that somehow felt refreshing and comforting during that particular phase of my life." + }, + { + "speaker": "B", + "text": "Speaking of New York, have you ever met up with him in person, considering you both love the city?", + "original_text": "Speaking of New York, have you ever met up with him in person, considering you both love the city?", + "start_time": 32.81115401606307, + "end_time": 38.302673290439486, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/temp/line_3_B.wav", + "silence_duration": 0.4908339798161294, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, we never met in person. But I was going to say that our conversations weren't really meaningful, just a good way to pass time.", + "original_text": "No, we never met in person. But I was going to say that our conversations weren't really meaningful, just a good way to pass time.", + "start_time": 38.67322907483018, + "end_time": 46.46352385941068, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/temp/line_4_A.wav", + "silence_duration": 0.37055578439069875, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it, so it was more of a casual connection than anything serious.", + "original_text": "Got it, so it was more of a casual connection than anything serious.", + "start_time": 47.05323511808865, + "end_time": 50.57105824734035, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--230/temp/line_5_B.wav", + "silence_duration": 0.5897112586779698, + "is_interrupted": false + } + ] + }, + "DialogSum--val--231": { + "original_text": "A: I understand how you feel, sir. But there simply isn't any room. The person who received your reservation call must have forgotten to write it down. She is new, you [interrupt] might want to speak with the manager about this issue to ensure proper training procedures are followed and similar mistakes are prevented in the future.\nB: Just a mistake? Do you realize that I've invited some very important people to dinner? It could cause me to lose an important business partner.\nA: I'm really sorry, sir. I suggest you call them and explain the problem. I'm sure you'll find several other very good restaurants around here. But as I was saying, the person who took your reservation is new [interrupt] and still going through our comprehensive training program, which includes shadowing experienced staff members and practicing our reservation system extensively before handling calls independently.\nB: I can't get in touch with them now. They are probably on their way at this very minute. Surely you could fit one more table in.\nA: Not unless you'd like me to put you in the hall, sir.\nB: Well, that's better than nothing.", + "cleaned_text": "A:I understand how you feel, sir. But there simply isn't any room. The person who received your reservation call must have forgotten to write it down. She is new, you might want to speak with the manager about this issue to ensure proper training procedures are followed and similar mistakes are prevented in the future.\nB: Just a mistake? Do you realize that I've invited some very important people to dinner? It could cause me to lose an important business partner.\nA:I'm really sorry, sir. I suggest you call them and explain the problem. I'm sure you'll find several other very good restaurants around here. But as I was saying, the person who took your reservation is new and still going through our comprehensive training program, which includes shadowing experienced staff members and practicing our reservation system extensively before handling calls independently.\nB: I can't get in touch with them now. They are probably on their way at this very minute. Surely you could fit one more table in.\nA: Not unless you'd like me to put you in the hall, sir.\nB: Well, that's better than nothing.", + "total_duration": 50.51070294784581, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I understand how you feel, sir. But there simply isn't any room. The person who received your reservation call must have forgotten to write it down. She is new, you", + "original_text": "I understand how you feel, sir. But there simply isn't any room. The person who received your reservation call must have forgotten to write it down. She is new, you [interrupt] might want to speak with the manager about this issue to ensure proper training procedures are followed and similar mistakes are prevented in the future.", + "start_time": 0, + "end_time": 18.715283446712018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "might want to speak with the manager about this issue to ensure proper training procedures are followed and similar mistakes are prevented in the future." + }, + { + "speaker": "B", + "text": "Just a mistake? Do you realize that I've invited some very important people to dinner? It could cause me to lose an important business partner.", + "original_text": "Just a mistake? Do you realize that I've invited some very important people to dinner? It could cause me to lose an important business partner.", + "start_time": 10.634739229024943, + "end_time": 18.030294784580498, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/temp/line_1_B.wav", + "silence_duration": 0.5369039303288646, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm really sorry, sir. I suggest you call them and explain the problem. I'm sure you'll find several other very good restaurants around here. But as I was saying, the person who took your reservation is new", + "original_text": "I'm really sorry, sir. I suggest you call them and explain the problem. I'm sure you'll find several other very good restaurants around here. But as I was saying, the person who took your reservation is new [interrupt] and still going through our comprehensive training program, which includes shadowing experienced staff members and practicing our reservation system extensively before handling calls independently.", + "start_time": 19.23857396489348, + "end_time": 42.60945831863498, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/temp/line_2_A.wav", + "silence_duration": 0.5232905181814623, + "is_interrupted": true, + "text_after_interrupt": "and still going through our comprehensive training program, which includes shadowing experienced staff members and practicing our reservation system extensively before handling calls independently." + }, + { + "speaker": "B", + "text": "I can't get in touch with them now. They are probably on their way at this very minute. Surely you could fit one more table in.", + "original_text": "I can't get in touch with them now. They are probably on their way at this very minute. Surely you could fit one more table in.", + "start_time": 39.49392931421484, + "end_time": 45.4730676362103, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/temp/line_3_B.wav", + "silence_duration": 0.3207564881541131, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not unless you'd like me to put you in the hall, sir.", + "original_text": "Not unless you'd like me to put you in the hall, sir.", + "start_time": 45.80630919698661, + "end_time": 48.499823936215634, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/temp/line_4_A.wav", + "silence_duration": 0.33324156077630573, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, that's better than nothing.", + "original_text": "Well, that's better than nothing.", + "start_time": 48.838885888250545, + "end_time": 50.51072262294442, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--231/temp/line_5_B.wav", + "silence_duration": 0.3390619520349105, + "is_interrupted": false + } + ] + }, + "DialogSum--val--232": { + "original_text": "A: So, what seems to be the problem, Bobby? \nB: Dr. Cardano, I woke up in the middle of the night with a terrible pain in my right foot. \nA: Did you cut yourself or knock it against [interrupt] something while you were sleeping? I'm asking because sometimes even minor injuries can cause significant discomfort if they happen during sleep when we're not fully aware of our movements. \nB: No, it just started hurting all of a sudden. Could it be something serious? \nA: It's hard to say right now. Can you describe the pain for me? Is it a sharp pain that comes and goes? Or is it a constant, dull pain that doesn't really ever go away? \nB: I suppose it's more like the first one. But it's definitely difficult to walk, so it's not really going away, either. \nA: Let me see those feet, Bobby. \nB: Do you want me to take off both socks? \nA: Yes, I'd like to compare your right and left foot. Ah, the right foot is pretty red, and it looks bigger than the left one. It also feels warmer. \nB: What does it mean, doctor? \nA: Well, I don't know for sure. It could be one of a couple of things. I'm going to send you up to the lab to get some blood tests. Check in to the lab on the [interrupt] third floor; they'll be expecting you and will run a complete blood count along with inflammation markers to help us determine the exact cause of your symptoms. \nB: Wait, before I go, I need to use the restroom first. Can you tell me where that is? \nA: Sure, it's just down the hall to your left. But remember to check in to the lab on the third floor afterward. I'm sending them some instructions. Come back down here as soon as it's finished. \nB: Got it. Thanks, doctor.", + "cleaned_text": "A: So, what seems to be the problem, Bobby? \nB: Dr. Cardano, I woke up in the middle of the night with a terrible pain in my right foot. \nA:Did you cut yourself or knock it against something while you were sleeping? I'm asking because sometimes even minor injuries can cause significant discomfort if they happen during sleep when we're not fully aware of our movements.\nB: No, it just started hurting all of a sudden. Could it be something serious? \nA: It's hard to say right now. Can you describe the pain for me? Is it a sharp pain that comes and goes? Or is it a constant, dull pain that doesn't really ever go away? \nB: I suppose it's more like the first one. But it's definitely difficult to walk, so it's not really going away, either. \nA: Let me see those feet, Bobby. \nB: Do you want me to take off both socks? \nA: Yes, I'd like to compare your right and left foot. Ah, the right foot is pretty red, and it looks bigger than the left one. It also feels warmer. \nB: What does it mean, doctor? \nA:Well, I don't know for sure. It could be one of a couple of things. I'm going to send you up to the lab to get some blood tests. Check in to the lab on the third floor; they'll be expecting you and will run a complete blood count along with inflammation markers to help us determine the exact cause of your symptoms.\nB: Wait, before I go, I need to use the restroom first. Can you tell me where that is? \nA: Sure, it's just down the hall to your left. But remember to check in to the lab on the third floor afterward. I'm sending them some instructions. Come back down here as soon as it's finished. \nB: Got it. Thanks, doctor.", + "total_duration": 86.13718820861678, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So, what seems to be the problem, Bobby?", + "original_text": "So, what seems to be the problem, Bobby?", + "start_time": 0, + "end_time": 2.089795918367347, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Dr. Cardano, I woke up in the middle of the night with a terrible pain in my right foot.", + "original_text": "Dr. Cardano, I woke up in the middle of the night with a terrible pain in my right foot.", + "start_time": 2.6054088177873633, + "end_time": 7.202959838195527, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_1_B.wav", + "silence_duration": 0.5156128994200163, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Did you cut yourself or knock it against", + "original_text": "Did you cut yourself or knock it against [interrupt] something while you were sleeping? I'm asking because sometimes even minor injuries can cause significant discomfort if they happen during sleep when we're not fully aware of our movements.", + "start_time": 7.67154503258859, + "end_time": 20.8604792729514, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_2_A.wav", + "silence_duration": 0.4685851943930626, + "is_interrupted": true, + "text_after_interrupt": "something while you were sleeping? I'm asking because sometimes even minor injuries can cause significant discomfort if they happen during sleep when we're not fully aware of our movements." + }, + { + "speaker": "B", + "text": "No, it just started hurting all of a sudden. Could it be something serious?", + "original_text": "No, it just started hurting all of a sudden. Could it be something serious?", + "start_time": 10.028370429413986, + "end_time": 13.848052969096525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_3_B.wav", + "silence_duration": 0.407842252320199, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's hard to say right now. Can you describe the pain for me? Is it a sharp pain that comes and goes? Or is it a constant, dull pain that doesn't really ever go away?", + "original_text": "It's hard to say right now. Can you describe the pain for me? Is it a sharp pain that comes and goes? Or is it a constant, dull pain that doesn't really ever go away?", + "start_time": 21.198429377449337, + "end_time": 31.79833867450149, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_4_A.wav", + "silence_duration": 0.3379501044979362, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I suppose it's more like the first one. But it's definitely difficult to walk, so it's not really going away, either.", + "original_text": "I suppose it's more like the first one. But it's definitely difficult to walk, so it's not really going away, either.", + "start_time": 32.371378612109666, + "end_time": 38.02543756902577, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_5_B.wav", + "silence_duration": 0.5730399376081783, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let me see those feet, Bobby.", + "original_text": "Let me see those feet, Bobby.", + "start_time": 38.48652616661589, + "end_time": 40.158362901309765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_6_A.wav", + "silence_duration": 0.4610885975901179, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you want me to take off both socks?", + "original_text": "Do you want me to take off both socks?", + "start_time": 40.51394336039267, + "end_time": 42.34831977762623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_7_B.wav", + "silence_duration": 0.35558045908290714, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I'd like to compare your right and left foot. Ah, the right foot is pretty red, and it looks bigger than the left one. It also feels warmer.", + "original_text": "Yes, I'd like to compare your right and left foot. Ah, the right foot is pretty red, and it looks bigger than the left one. It also feels warmer.", + "start_time": 42.91024972631135, + "end_time": 52.00086197120931, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_8_A.wav", + "silence_duration": 0.5619299486851185, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What does it mean, doctor?", + "original_text": "What does it mean, doctor?", + "start_time": 52.35127850268139, + "end_time": 53.523886212431954, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_9_B.wav", + "silence_duration": 0.3504165314720773, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I don't know for sure. It could be one of a couple of things. I'm going to send you up to the lab to get some blood tests. Check in to the lab on the", + "original_text": "Well, I don't know for sure. It could be one of a couple of things. I'm going to send you up to the lab to get some blood tests. Check in to the lab on the [interrupt] third floor; they'll be expecting you and will run a complete blood count along with inflammation markers to help us determine the exact cause of your symptoms.", + "start_time": 53.97896203575658, + "end_time": 72.41560602668629, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_10_A.wav", + "silence_duration": 0.45507582332462854, + "is_interrupted": true, + "text_after_interrupt": "third floor; they'll be expecting you and will run a complete blood count along with inflammation markers to help us determine the exact cause of your symptoms." + }, + { + "speaker": "B", + "text": "Wait, before I go, I need to use the restroom first. Can you tell me where that is?", + "original_text": "Wait, before I go, I need to use the restroom first. Can you tell me where that is?", + "start_time": 68.46691357540736, + "end_time": 72.62328545749352, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_11_B.wav", + "silence_duration": 0.5922949914587196, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, it's just down the hall to your left. But remember to check in to the lab on the third floor afterward. I'm sending them some instructions. Come back down here as soon as it's finished.", + "original_text": "Sure, it's just down the hall to your left. But remember to check in to the lab on the third floor afterward. I'm sending them some instructions. Come back down here as soon as it's finished.", + "start_time": 73.07297355528182, + "end_time": 84.3230415824927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_12_A.wav", + "silence_duration": 0.4496880977882961, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. Thanks, doctor.", + "original_text": "Got it. Thanks, doctor.", + "start_time": 84.80204425998281, + "end_time": 86.13719165227306, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--232/temp/line_13_B.wav", + "silence_duration": 0.4790026774901064, + "is_interrupted": false + } + ] + }, + "DialogSum--val--234": { + "original_text": "A: Susan, Did you know the four ugliest women in ancient China? \nB: No, I only know the four great beauties of China. \nA: There were some famous ugly women in history who were actually celebrated [interrupt] for their remarkable wisdom, moral character, and significant contributions to their communities despite societal prejudices about appearance. \nB: Yeah? Were they famous because of their unique contributions to society, or was it something else? \nA: Sorry, let me clarify—they were famous not just for their appearance but because of their virtue and contributions. \nB: Oh, I see. Then who were they? \nA: Mo Mu, Zhong Lichun, Meng Guang, and Ruan Nv. They were well respected. \nB: It seems that inner beauty is also important. By the way, you mentioned they were famous for their virtue—could you tell me more about what made them so respected?", + "cleaned_text": "A: Susan, Did you know the four ugliest women in ancient China? \nB: No, I only know the four great beauties of China. \nA:There were some famous ugly women in history who were actually celebrated for their remarkable wisdom, moral character, and significant contributions to their communities despite societal prejudices about appearance.\nB: Yeah? Were they famous because of their unique contributions to society, or was it something else? \nA: Sorry, let me clarify—they were famous not just for their appearance but because of their virtue and contributions. \nB: Oh, I see. Then who were they? \nA: Mo Mu, Zhong Lichun, Meng Guang, and Ruan Nv. They were well respected. \nB: It seems that inner beauty is also important. By the way, you mentioned they were famous for their virtue—could you tell me more about what made them so respected?", + "total_duration": 43.41963718820862, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Susan, Did you know the four ugliest women in ancient China?", + "original_text": "Susan, Did you know the four ugliest women in ancient China?", + "start_time": 0, + "end_time": 4.156371882086168, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, I only know the four great beauties of China.", + "original_text": "No, I only know the four great beauties of China.", + "start_time": 4.487296031223398, + "end_time": 7.459450226234736, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_1_B.wav", + "silence_duration": 0.33092414913723056, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There were some famous ugly women in history who were actually celebrated", + "original_text": "There were some famous ugly women in history who were actually celebrated [interrupt] for their remarkable wisdom, moral character, and significant contributions to their communities despite societal prejudices about appearance.", + "start_time": 8.039076526422077, + "end_time": 20.554632081977633, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_2_A.wav", + "silence_duration": 0.5796263001873413, + "is_interrupted": true, + "text_after_interrupt": "for their remarkable wisdom, moral character, and significant contributions to their communities despite societal prejudices about appearance." + }, + { + "speaker": "B", + "text": "Yeah? Were they famous because of their unique contributions to society, or was it something else?", + "original_text": "Yeah? Were they famous because of their unique contributions to society, or was it something else?", + "start_time": 12.427647954993507, + "end_time": 17.582477886966295, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_3_B.wav", + "silence_duration": 0.33524358583494457, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, let me clarify—they were famous not just for their appearance but because of their virtue and contributions.", + "original_text": "Sorry, let me clarify—they were famous not just for their appearance but because of their virtue and contributions.", + "start_time": 21.11264308134332, + "end_time": 28.241169158440826, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_4_A.wav", + "silence_duration": 0.5580109993656877, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I see. Then who were they?", + "original_text": "Oh, I see. Then who were they?", + "start_time": 28.729423936298165, + "end_time": 30.528970421558935, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_5_B.wav", + "silence_duration": 0.48825477785733795, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Mo Mu, Zhong Lichun, Meng Guang, and Ruan Nv. They were well respected.", + "original_text": "Mo Mu, Zhong Lichun, Meng Guang, and Ruan Nv. They were well respected.", + "start_time": 30.84814620180126, + "end_time": 35.16705776642711, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_6_A.wav", + "silence_duration": 0.3191757802423245, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It seems that inner beauty is also important. By the way, you mentioned they were famous for their virtue—could you tell me more about what made them so respected?", + "original_text": "It seems that inner beauty is also important. By the way, you mentioned they were famous for their virtue—could you tell me more about what made them so respected?", + "start_time": 35.640985917850514, + "end_time": 43.41967072510675, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--234/temp/line_7_B.wav", + "silence_duration": 0.4739281514234067, + "is_interrupted": false + } + ] + }, + "DialogSum--val--236": { + "original_text": "A: Ghost will be on at six thirty. It's already six fifteen now. Hurry [interrupt] up, or we might miss the beginning of the movie which would be such a shame since we've been looking forward to watching it together all week!\nB: You'd been hanging around before we left home. Well, now, you are urging me for the movie. This has been fun!\nA: Don't be upset. I am just afraid of missing the movie. It is your favorite.\nB: In short, you become more and more impatient with me after the wedding.\nA: Why do you think [interrupt] that? I haven't noticed any change in how I treat you, and I genuinely believe our relationship has only grown stronger since we got married.\nB: Every time I complain about the domestic chores with you, you just don't listen.\nA: Nothing of the sort!\nB: Don't interrupt me! In addition, every time I need your advice, you just say, it's up to you.\nA: Maybe I was busy with my work at that time, so I felt a little bored. But wait, can we go back to what you said earlier? Why do you think I'm more impatient with you since the wedding?\nB: You mean, I am not busy with my work?\nA: Honey, don't get me wrong. I don't know how to explain. But I really have eyes only for you and our children.\nB: Do you still love me?", + "cleaned_text": "A:Ghost will be on at six thirty. It's already six fifteen now. Hurry up, or we might miss the beginning of the movie which would be such a shame since we've been looking forward to watching it together all week!\nB: You'd been hanging around before we left home. Well, now, you are urging me for the movie. This has been fun!\nA: Don't be upset. I am just afraid of missing the movie. It is your favorite.\nB: In short, you become more and more impatient with me after the wedding.\nA:Why do you think that? I haven't noticed any change in how I treat you, and I genuinely believe our relationship has only grown stronger since we got married.\nB: Every time I complain about the domestic chores with you, you just don't listen.\nA: Nothing of the sort!\nB: Don't interrupt me! In addition, every time I need your advice, you just say, it's up to you.\nA: Maybe I was busy with my work at that time, so I felt a little bored. But wait, can we go back to what you said earlier? Why do you think I'm more impatient with you since the wedding?\nB: You mean, I am not busy with my work?\nA: Honey, don't get me wrong. I don't know how to explain. But I really have eyes only for you and our children.\nB: Do you still love me?", + "total_duration": 61.68344671201814, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Ghost will be on at six thirty. It's already six fifteen now. Hurry", + "original_text": "Ghost will be on at six thirty. It's already six fifteen now. Hurry [interrupt] up, or we might miss the beginning of the movie which would be such a shame since we've been looking forward to watching it together all week!", + "start_time": 0, + "end_time": 12.236916099773243, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "up, or we might miss the beginning of the movie which would be such a shame since we've been looking forward to watching it together all week!" + }, + { + "speaker": "B", + "text": "You'd been hanging around before we left home. Well, now, you are urging me for the movie. This has been fun!", + "original_text": "You'd been hanging around before we left home. Well, now, you are urging me for the movie. This has been fun!", + "start_time": 4.690430839002268, + "end_time": 10.483809523809523, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_1_B.wav", + "silence_duration": 0.5029263927812233, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Don't be upset. I am just afraid of missing the movie. It is your favorite.", + "original_text": "Don't be upset. I am just afraid of missing the movie. It is your favorite.", + "start_time": 12.584900784733147, + "end_time": 17.043132077250153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_2_A.wav", + "silence_duration": 0.34798468495990353, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "In short, you become more and more impatient with me after the wedding.", + "original_text": "In short, you become more and more impatient with me after the wedding.", + "start_time": 17.626649006506973, + "end_time": 21.260571909001303, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_3_B.wav", + "silence_duration": 0.5835169292568212, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why do you think", + "original_text": "Why do you think [interrupt] that? I haven't noticed any change in how I treat you, and I genuinely believe our relationship has only grown stronger since we got married.", + "start_time": 21.596148436557122, + "end_time": 30.570660908212453, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_4_A.wav", + "silence_duration": 0.33557652755581896, + "is_interrupted": true, + "text_after_interrupt": "that? I haven't noticed any change in how I treat you, and I genuinely believe our relationship has only grown stronger since we got married." + }, + { + "speaker": "B", + "text": "Every time I complain about the domestic chores with you, you just don't listen.", + "original_text": "Every time I complain about the domestic chores with you, you just don't listen.", + "start_time": 29.271336365722075, + "end_time": 33.10262888272888, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_5_B.wav", + "silence_duration": 0.36175781227248216, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Nothing of the sort!", + "original_text": "Nothing of the sort!", + "start_time": 33.68002529588033, + "end_time": 34.933902846900736, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_6_A.wav", + "silence_duration": 0.5773964131514469, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't interrupt me! In addition, every time I need your advice, you just say, it's up to you.", + "original_text": "Don't interrupt me! In addition, every time I need your advice, you just say, it's up to you.", + "start_time": 35.38650385850239, + "end_time": 39.856345128343655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_7_B.wav", + "silence_duration": 0.45260101160164845, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Maybe I was busy with my work at that time, so I felt a little bored. But wait, can we go back to what you said earlier? Why do you think I'm more impatient with you since the wedding?", + "original_text": "Maybe I was busy with my work at that time, so I felt a little bored. But wait, can we go back to what you said earlier? Why do you think I'm more impatient with you since the wedding?", + "start_time": 40.38428383710806, + "end_time": 51.04224302078153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_8_A.wav", + "silence_duration": 0.5279387087644009, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You mean, I am not busy with my work?", + "original_text": "You mean, I am not busy with my work?", + "start_time": 51.55945440690883, + "end_time": 53.393830824142384, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_9_B.wav", + "silence_duration": 0.5172113861272969, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Honey, don't get me wrong. I don't know how to explain. But I really have eyes only for you and our children.", + "original_text": "Honey, don't get me wrong. I don't know how to explain. But I really have eyes only for you and our children.", + "start_time": 53.69652074944332, + "end_time": 60.23293798300341, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_10_A.wav", + "silence_duration": 0.30268992530094146, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you still love me?", + "original_text": "Do you still love me?", + "start_time": 60.60373428303051, + "end_time": 61.68346217418697, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--236/temp/line_11_B.wav", + "silence_duration": 0.37079630002709946, + "is_interrupted": false + } + ] + }, + "DialogSum--val--238": { + "original_text": "A: Lily, do you know Lizzy? \nB: Lizzy who? \nA: Lizzy Smith. \nB: Of course I do. \nA: Then, do you know her younger sister? \nB: You mean Mary? \nA: Yes. \nB: Sure. I know her elder sister Sue and younger sister Mary. \nA: Oh, not bad. Then do you know her mother? \nB: Yes, certainly. I know her mother and father, and brother and sisters, [interrupt] and I even met her grandparents once during a family reunion last summer where we had a wonderful time sharing stories and getting to know each other better. \nA: Hold on, you mentioned her brother—what's his name again? \nB: Oh, her brother? His name is Tom. But as I was saying, I know her mother and father, and brother and sisters, too. \nA: That sounds terrific. \nB: Why do you ask me these questions?", + "cleaned_text": "A: Lily, do you know Lizzy? \nB: Lizzy who? \nA: Lizzy Smith. \nB: Of course I do. \nA: Then, do you know her younger sister? \nB: You mean Mary? \nA: Yes. \nB: Sure. I know her elder sister Sue and younger sister Mary. \nA: Oh, not bad. Then do you know her mother? \nB:Yes, certainly. I know her mother and father, and brother and sisters, and I even met her grandparents once during a family reunion last summer where we had a wonderful time sharing stories and getting to know each other better.\nA: Hold on, you mentioned her brother—what's his name again? \nB: Oh, her brother? His name is Tom. But as I was saying, I know her mother and father, and brother and sisters, too. \nA: That sounds terrific. \nB: Why do you ask me these questions?", + "total_duration": 39.64512471655329, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Lily, do you know Lizzy?", + "original_text": "Lily, do you know Lizzy?", + "start_time": 0, + "end_time": 1.9736961451247166, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Lizzy who?", + "original_text": "Lizzy who?", + "start_time": 2.3918824887882066, + "end_time": 3.3206806747292497, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_1_B.wav", + "silence_duration": 0.41818634366348995, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Lizzy Smith.", + "original_text": "Lizzy Smith.", + "start_time": 3.640927280372205, + "end_time": 4.65099530758309, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_2_A.wav", + "silence_duration": 0.32024660564295515, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course I do.", + "original_text": "Of course I do.", + "start_time": 4.983561789352, + "end_time": 6.0400697258599365, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_3_B.wav", + "silence_duration": 0.3325664817689102, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Then, do you know her younger sister?", + "original_text": "Then, do you know her younger sister?", + "start_time": 6.3968320262083855, + "end_time": 8.09188871555079, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_4_A.wav", + "silence_duration": 0.35676230034844886, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You mean Mary?", + "original_text": "You mean Mary?", + "start_time": 8.68938305718034, + "end_time": 9.641401197769909, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_5_B.wav", + "silence_duration": 0.5974943416295504, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes.", + "original_text": "Yes.", + "start_time": 9.986796170665485, + "end_time": 10.660174855472741, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_6_A.wav", + "silence_duration": 0.34539497289557636, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. I know her elder sister Sue and younger sister Mary.", + "original_text": "Sure. I know her elder sister Sue and younger sister Mary.", + "start_time": 11.002740091208532, + "end_time": 14.497343265811706, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_7_B.wav", + "silence_duration": 0.3425652357357907, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, not bad. Then do you know her mother?", + "original_text": "Oh, not bad. Then do you know her mother?", + "start_time": 14.996886538506608, + "end_time": 17.806501050978262, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_8_A.wav", + "silence_duration": 0.49954327269490195, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, certainly. I know her mother and father, and brother and sisters,", + "original_text": "Yes, certainly. I know her mother and father, and brother and sisters, [interrupt] and I even met her grandparents once during a family reunion last summer where we had a wonderful time sharing stories and getting to know each other better.", + "start_time": 18.191739539961606, + "end_time": 28.965798496877706, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_9_B.wav", + "silence_duration": 0.38523848898334334, + "is_interrupted": true, + "text_after_interrupt": "and I even met her grandparents once during a family reunion last summer where we had a wonderful time sharing stories and getting to know each other better." + }, + { + "speaker": "A", + "text": "Hold on, you mentioned her brother—what's his name again?", + "original_text": "Hold on, you mentioned her brother—what's his name again?", + "start_time": 21.76761255583462, + "end_time": 25.262215730437795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_10_A.wav", + "silence_duration": 0.5816206176675103, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, her brother? His name is Tom. But as I was saying, I know her mother and father, and brother and sisters, too.", + "original_text": "Oh, her brother? His name is Tom. But as I was saying, I know her mother and father, and brother and sisters, too.", + "start_time": 29.414454177682597, + "end_time": 35.81155168335153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_11_B.wav", + "silence_duration": 0.44865568080489127, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds terrific.", + "original_text": "That sounds terrific.", + "start_time": 36.22415249271846, + "end_time": 37.733449544872656, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_12_A.wav", + "silence_duration": 0.41260080936692567, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why do you ask me these questions?", + "original_text": "Why do you ask me these questions?", + "start_time": 38.06618130205615, + "end_time": 39.64513821815592, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--238/temp/line_13_B.wav", + "silence_duration": 0.3327317571834961, + "is_interrupted": false + } + ] + }, + "DialogSum--val--239": { + "original_text": "A: The Johnsons are on their way back. You remember them, don't you? \nB: Johnson? I can't place them. \nA: We met them in Bermuda last [interrupt] year, during that trip we took for our anniversary when we stayed at that beautiful resort with the infinity pool overlooking the ocean. \nB: Wait, Bermuda? Did we meet them at that beach party or was it during the boat trip? \nA: No, it was last May, at that dinner we had by the shore. They were the couple with the dogs—think back. \nB: Oh, right! The couple with the dogs. But I still can't quite picture them... \nA: Well, I've invited them for brunch. \nB: Hmm, I must be getting absent-minded. By the way, what were you saying about Bermuda? Did we do anything else with them there?", + "cleaned_text": "A: The Johnsons are on their way back. You remember them, don't you? \nB: Johnson? I can't place them. \nA:We met them in Bermuda last year, during that trip we took for our anniversary when we stayed at that beautiful resort with the infinity pool overlooking the ocean.\nB: Wait, Bermuda? Did we meet them at that beach party or was it during the boat trip? \nA: No, it was last May, at that dinner we had by the shore. They were the couple with the dogs—think back. \nB: Oh, right! The couple with the dogs. But I still can't quite picture them... \nA: Well, I've invited them for brunch. \nB: Hmm, I must be getting absent-minded. By the way, what were you saying about Bermuda? Did we do anything else with them there?", + "total_duration": 35.25120181405896, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The Johnsons are on their way back. You remember them, don't you?", + "original_text": "The Johnsons are on their way back. You remember them, don't you?", + "start_time": 0, + "end_time": 3.657142857142857, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Johnson? I can't place them.", + "original_text": "Johnson? I can't place them.", + "start_time": 4.070774978729583, + "end_time": 5.742611713423461, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_1_B.wav", + "silence_duration": 0.41363212158672613, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We met them in Bermuda last", + "original_text": "We met them in Bermuda last [interrupt] year, during that trip we took for our anniversary when we stayed at that beautiful resort with the infinity pool overlooking the ocean.", + "start_time": 6.145336309916465, + "end_time": 16.0602569448371, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_2_A.wav", + "silence_duration": 0.40272459649300413, + "is_interrupted": true, + "text_after_interrupt": "year, during that trip we took for our anniversary when we stayed at that beautiful resort with the infinity pool overlooking the ocean." + }, + { + "speaker": "B", + "text": "Wait, Bermuda? Did we meet them at that beach party or was it during the boat trip?", + "original_text": "Wait, Bermuda? Did we meet them at that beach party or was it during the boat trip?", + "start_time": 8.060982568419867, + "end_time": 12.414724065018508, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_3_B.wav", + "silence_duration": 0.41805326774738605, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, it was last May, at that dinner we had by the shore. They were the couple with the dogs—think back.", + "original_text": "No, it was last May, at that dinner we had by the shore. They were the couple with the dogs—think back.", + "start_time": 16.55361055435332, + "end_time": 22.544358853673046, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_4_A.wav", + "silence_duration": 0.4933536095162189, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! The couple with the dogs. But I still can't quite picture them...", + "original_text": "Oh, right! The couple with the dogs. But I still can't quite picture them...", + "start_time": 22.930777341687016, + "end_time": 26.785289813342345, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_5_B.wav", + "silence_duration": 0.3864184880139687, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I've invited them for brunch.", + "original_text": "Well, I've invited them for brunch.", + "start_time": 27.20714164126764, + "end_time": 29.296937559634987, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_6_A.wav", + "silence_duration": 0.4218518279252952, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hmm, I must be getting absent-minded. By the way, what were you saying about Bermuda? Did we do anything else with them there?", + "original_text": "Hmm, I must be getting absent-minded. By the way, what were you saying about Bermuda? Did we do anything else with them there?", + "start_time": 29.85256926042291, + "end_time": 35.25120871620523, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--239/temp/line_7_B.wav", + "silence_duration": 0.5556317007879252, + "is_interrupted": false + } + ] + }, + "DialogSum--val--240": { + "original_text": "A: Hello. Capital Hotel. May I help you? \nB: Yes, unlikely my flight will be on time as it's delayed by 2 hours due to the fog. Would you please [interrupt] let the front desk know that I might be late and ask them to prepare my room in advance so it's ready when I arrive? \nA: Sorry, did you mean your flight is delayed by 2 hours? \nB: Oh yes, it's delayed. Could you please keep my reservation? \nA: Sure. May I have your name please? \nB: Lincoln. That's L-I-N-C-O-L-N. Thank you. \nA: Just to confirm, Mr. Lincoln, your reservation is safe. By the way, did you mention what time you expect to arrive? \nB: Oh, I didn't mention that. I should be arriving around 8 PM now.", + "cleaned_text": "A: Hello. Capital Hotel. May I help you? \nB:Yes, unlikely my flight will be on time as it's delayed by 2 hours due to the fog. Would you please let the front desk know that I might be late and ask them to prepare my room in advance so it's ready when I arrive?\nA: Sorry, did you mean your flight is delayed by 2 hours? \nB: Oh yes, it's delayed. Could you please keep my reservation? \nA: Sure. May I have your name please? \nB: Lincoln. That's L-I-N-C-O-L-N. Thank you. \nA: Just to confirm, Mr. Lincoln, your reservation is safe. By the way, did you mention what time you expect to arrive? \nB: Oh, I didn't mention that. I should be arriving around 8 PM now.", + "total_duration": 40.64585034013606, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello. Capital Hotel. May I help you?", + "original_text": "Hello. Capital Hotel. May I help you?", + "start_time": 0, + "end_time": 3.7151927437641725, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, unlikely my flight will be on time as it's delayed by 2 hours due to the fog. Would you please", + "original_text": "Yes, unlikely my flight will be on time as it's delayed by 2 hours due to the fog. Would you please [interrupt] let the front desk know that I might be late and ask them to prepare my room in advance so it's ready when I arrive?", + "start_time": 4.301805088713903, + "end_time": 15.41255338803363, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_1_B.wav", + "silence_duration": 0.5866123449497305, + "is_interrupted": true, + "text_after_interrupt": "let the front desk know that I might be late and ask them to prepare my room in advance so it's ready when I arrive?" + }, + { + "speaker": "A", + "text": "Sorry, did you mean your flight is delayed by 2 hours?", + "original_text": "Sorry, did you mean your flight is delayed by 2 hours?", + "start_time": 9.29409533814701, + "end_time": 12.8467483993715, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_2_A.wav", + "silence_duration": 0.46213031176663133, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh yes, it's delayed. Could you please keep my reservation?", + "original_text": "Oh yes, it's delayed. Could you please keep my reservation?", + "start_time": 15.761010237431151, + "end_time": 19.069853774846116, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_3_B.wav", + "silence_duration": 0.3484568493975218, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure. May I have your name please?", + "original_text": "Sure. May I have your name please?", + "start_time": 19.47620220418118, + "end_time": 21.670487918466897, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_4_A.wav", + "silence_duration": 0.40634842933506377, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Lincoln. That's L-I-N-C-O-L-N. Thank you.", + "original_text": "Lincoln. That's L-I-N-C-O-L-N. Thank you.", + "start_time": 22.071610813293358, + "end_time": 28.642857978826235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_5_B.wav", + "silence_duration": 0.40112289482646124, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Just to confirm, Mr. Lincoln, your reservation is safe. By the way, did you mention what time you expect to arrive?", + "original_text": "Just to confirm, Mr. Lincoln, your reservation is safe. By the way, did you mention what time you expect to arrive?", + "start_time": 29.123297608286567, + "end_time": 36.681392846381804, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_6_A.wav", + "silence_duration": 0.48043962946033136, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I didn't mention that. I should be arriving around 8 PM now.", + "original_text": "Oh, I didn't mention that. I should be arriving around 8 PM now.", + "start_time": 37.232526900501334, + "end_time": 40.64586023383467, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--240/temp/line_7_B.wav", + "silence_duration": 0.5511340541195269, + "is_interrupted": false + } + ] + }, + "DialogSum--val--241": { + "original_text": "A: May I take your order now, sir? \nB: Yes, please. I'd like to start with a chef's salad. \nA: Chef's salad for starter. And what would you like to have for the main [interrupt] course? We have some excellent options including grilled salmon, roasted chicken, or perhaps something from our specials today that feature seasonal ingredients? \nB: Sorry, I just realized—does the chef's salad come with any dressing options? \nA: Yes, it does. We have several dressings available. Now, for the main course, what would you like? \nB: I'll have steak. \nA: How would you like your steak done? \nB: Medium. \nA: And what would you like to go with your steak? \nB: Peas and carrots. \nA: Potatoes? \nB: Boiled. By the way, what dressings do you have for the chef's salad? I forgot to ask earlier. \nA: We have ranch, blue cheese, balsamic, and Italian dressing. Which one would you prefer? \nB: I'll go with balsamic, please. \nA: Excellent choice. Your order will be ready shortly.", + "cleaned_text": "A: May I take your order now, sir? \nB: Yes, please. I'd like to start with a chef's salad. \nA:Chef's salad for starter. And what would you like to have for the main course? We have some excellent options including grilled salmon, roasted chicken, or perhaps something from our specials today that feature seasonal ingredients?\nB: Sorry, I just realized—does the chef's salad come with any dressing options? \nA: Yes, it does. We have several dressings available. Now, for the main course, what would you like? \nB: I'll have steak. \nA: How would you like your steak done? \nB: Medium. \nA: And what would you like to go with your steak? \nB: Peas and carrots. \nA: Potatoes? \nB: Boiled. By the way, what dressings do you have for the chef's salad? I forgot to ask earlier. \nA: We have ranch, blue cheese, balsamic, and Italian dressing. Which one would you prefer? \nB: I'll go with balsamic, please. \nA: Excellent choice. Your order will be ready shortly.", + "total_duration": 52.57714285714286, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I take your order now, sir?", + "original_text": "May I take your order now, sir?", + "start_time": 0, + "end_time": 1.7531065759637188, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, please. I'd like to start with a chef's salad.", + "original_text": "Yes, please. I'd like to start with a chef's salad.", + "start_time": 2.2770012826193824, + "end_time": 4.8544162486057765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_1_B.wav", + "silence_duration": 0.5238947066556638, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Chef's salad for starter. And what would you like to have for the main", + "original_text": "Chef's salad for starter. And what would you like to have for the main [interrupt] course? We have some excellent options including grilled salmon, roasted chicken, or perhaps something from our specials today that feature seasonal ingredients?", + "start_time": 5.188288307253744, + "end_time": 19.143481051017915, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_2_A.wav", + "silence_duration": 0.3338720586479682, + "is_interrupted": true, + "text_after_interrupt": "course? We have some excellent options including grilled salmon, roasted chicken, or perhaps something from our specials today that feature seasonal ingredients?" + }, + { + "speaker": "B", + "text": "Sorry, I just realized—does the chef's salad come with any dressing options?", + "original_text": "Sorry, I just realized—does the chef's salad come with any dressing options?", + "start_time": 9.019580824260547, + "end_time": 13.454592162129028, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_3_B.wav", + "silence_duration": 0.47999956087850804, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it does. We have several dressings available. Now, for the main course, what would you like?", + "original_text": "Yes, it does. We have several dressings available. Now, for the main course, what would you like?", + "start_time": 19.45262261046594, + "end_time": 25.60591059232535, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_4_A.wav", + "silence_duration": 0.30914155944802474, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll have steak.", + "original_text": "I'll have steak.", + "start_time": 26.135617189948196, + "end_time": 27.052805398564974, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_5_B.wav", + "silence_duration": 0.5297065976228441, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How would you like your steak done?", + "original_text": "How would you like your steak done?", + "start_time": 27.530900011878508, + "end_time": 29.2607866331937, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_6_A.wav", + "silence_duration": 0.4780946133135333, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Medium.", + "original_text": "Medium.", + "start_time": 29.56591397245129, + "end_time": 30.23929265725855, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_7_B.wav", + "silence_duration": 0.3051273392575926, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And what would you like to go with your steak?", + "original_text": "And what would you like to go with your steak?", + "start_time": 30.790411931061957, + "end_time": 32.86859787210504, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_8_A.wav", + "silence_duration": 0.551119273803409, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Peas and carrots.", + "original_text": "Peas and carrots.", + "start_time": 33.21750053055265, + "end_time": 34.29722842170911, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_9_B.wav", + "silence_duration": 0.34890265844760987, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Potatoes?", + "original_text": "Potatoes?", + "start_time": 34.80215874021045, + "end_time": 35.83544672206986, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_10_A.wav", + "silence_duration": 0.5049303185013468, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Boiled. By the way, what dressings do you have for the chef's salad? I forgot to ask earlier.", + "original_text": "Boiled. By the way, what dressings do you have for the chef's salad? I forgot to ask earlier.", + "start_time": 36.26474106070661, + "end_time": 41.477620879300716, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_11_B.wav", + "silence_duration": 0.4292943386367511, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We have ranch, blue cheese, balsamic, and Italian dressing. Which one would you prefer?", + "original_text": "We have ranch, blue cheese, balsamic, and Italian dressing. Which one would you prefer?", + "start_time": 41.97526681171449, + "end_time": 46.71213756001381, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_12_A.wav", + "silence_duration": 0.49764593241377797, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll go with balsamic, please.", + "original_text": "I'll go with balsamic, please.", + "start_time": 47.20341156899347, + "end_time": 48.75914853044471, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_13_B.wav", + "silence_duration": 0.4912740089796569, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Excellent choice. Your order will be ready shortly.", + "original_text": "Excellent choice. Your order will be ready shortly.", + "start_time": 49.2683221978474, + "end_time": 52.57716573526236, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--241/temp/line_14_A.wav", + "silence_duration": 0.5091736674026867, + "is_interrupted": false + } + ] + }, + "DialogSum--val--242": { + "original_text": "A: Would you hurry up? We're late. \nB: I know, I'm coming. \nA: Our flight leaves in less than 2 hours. Come on. \nB: But I can't find my wallet. \nA: If you hadn't overslept, we wouldn't be so stressed out right [interrupt] now. We could have had a calm morning with plenty of time to double-check everything and maybe even grab breakfast before heading to the airport. \nB: I know, I know, but I really can't find my wallet. Can you help me look for it? \nA: Damn it. I can't find it. Do you see my wallet anywhere? It's made of brown leather. \nB: Did you check your pockets? \nA: Of course I did. I'm not that dumb. Oh, wait a second. Oh, here it is. \nB: Why am I not surprised? OK, put on your shoes and let's get out of here. \nA: Yeah, yeah. Say why don't we take the express train to the airport? It will be faster than a regular taxi, especially with the traffic right now. \nB: Wait, before we rush out, you mentioned something about being stressed because I overslept. I just want to say I really didn't hear the alarm. But yeah, the express train sounds like a good idea. Let's go!", + "cleaned_text": "A: Would you hurry up? We're late. \nB: I know, I'm coming. \nA: Our flight leaves in less than 2 hours. Come on. \nB: But I can't find my wallet. \nA:If you hadn't overslept, we wouldn't be so stressed out right now. We could have had a calm morning with plenty of time to double-check everything and maybe even grab breakfast before heading to the airport.\nB: I know, I know, but I really can't find my wallet. Can you help me look for it? \nA: Damn it. I can't find it. Do you see my wallet anywhere? It's made of brown leather. \nB: Did you check your pockets? \nA: Of course I did. I'm not that dumb. Oh, wait a second. Oh, here it is. \nB: Why am I not surprised? OK, put on your shoes and let's get out of here. \nA: Yeah, yeah. Say why don't we take the express train to the airport? It will be faster than a regular taxi, especially with the traffic right now. \nB: Wait, before we rush out, you mentioned something about being stressed because I overslept. I just want to say I really didn't hear the alarm. But yeah, the express train sounds like a good idea. Let's go!", + "total_duration": 60.503628117913834, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Would you hurry up? We're late.", + "original_text": "Would you hurry up? We're late.", + "start_time": 0, + "end_time": 2.0085260770975055, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know, I'm coming.", + "original_text": "I know, I'm coming.", + "start_time": 2.52487623909205, + "end_time": 3.5581642209514603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_1_B.wav", + "silence_duration": 0.5163501619945448, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Our flight leaves in less than 2 hours. Come on.", + "original_text": "Our flight leaves in less than 2 hours. Come on.", + "start_time": 4.003768696622503, + "end_time": 7.219732415443365, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_2_A.wav", + "silence_duration": 0.445604475671042, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But I can't find my wallet.", + "original_text": "But I can't find my wallet.", + "start_time": 7.635724573193, + "end_time": 9.08697173872588, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_3_B.wav", + "silence_duration": 0.4159921577496358, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "If you hadn't overslept, we wouldn't be so stressed out right", + "original_text": "If you hadn't overslept, we wouldn't be so stressed out right [interrupt] now. We could have had a calm morning with plenty of time to double-check everything and maybe even grab breakfast before heading to the airport.", + "start_time": 9.50074844063149, + "end_time": 21.15716567419158, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_4_A.wav", + "silence_duration": 0.4137767019056095, + "is_interrupted": true, + "text_after_interrupt": "now. We could have had a calm morning with plenty of time to double-check everything and maybe even grab breakfast before heading to the airport." + }, + { + "speaker": "B", + "text": "I know, I know, but I really can't find my wallet. Can you help me look for it?", + "original_text": "I know, I know, but I really can't find my wallet. Can you help me look for it?", + "start_time": 12.832811932694982, + "end_time": 16.80342417759294, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_5_B.wav", + "silence_duration": 0.38577471277933, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Damn it. I can't find it. Do you see my wallet anywhere? It's made of brown leather.", + "original_text": "Damn it. I can't find it. Do you see my wallet anywhere? It's made of brown leather.", + "start_time": 21.57770784216522, + "end_time": 27.41752643626953, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_6_A.wav", + "silence_duration": 0.42054216797364, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Did you check your pockets?", + "original_text": "Did you check your pockets?", + "start_time": 28.011339998284203, + "end_time": 29.265217549304612, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_7_B.wav", + "silence_duration": 0.5938135620146725, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Of course I did. I'm not that dumb. Oh, wait a second. Oh, here it is.", + "original_text": "Of course I did. I'm not that dumb. Oh, wait a second. Oh, here it is.", + "start_time": 29.623883096650253, + "end_time": 34.63939330073188, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_8_A.wav", + "silence_duration": 0.35866554734564254, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why am I not surprised? OK, put on your shoes and let's get out of here.", + "original_text": "Why am I not surprised? OK, put on your shoes and let's get out of here.", + "start_time": 35.05748420483017, + "end_time": 38.87716674451271, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_9_B.wav", + "silence_duration": 0.41809090409828675, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, yeah. Say why don't we take the express train to the airport? It will be faster than a regular taxi, especially with the traffic right now.", + "original_text": "Yeah, yeah. Say why don't we take the express train to the airport? It will be faster than a regular taxi, especially with the traffic right now.", + "start_time": 39.394212272922594, + "end_time": 48.76346397360287, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_10_A.wav", + "silence_duration": 0.5170455284098858, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait, before we rush out, you mentioned something about being stressed because I overslept. I just want to say I really didn't hear the alarm. But yeah, the express train sounds like a good idea. Let's go!", + "original_text": "Wait, before we rush out, you mentioned something about being stressed because I overslept. I just want to say I really didn't hear the alarm. But yeah, the express train sounds like a good idea. Let's go!", + "start_time": 49.14909309162487, + "end_time": 60.50365091475412, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--242/temp/line_11_B.wav", + "silence_duration": 0.3856291180220036, + "is_interrupted": false + } + ] + }, + "DialogSum--val--243": { + "original_text": "A: Have you been watching the Euro 2012 football tournament? \nB: Just a bit. Have you? \nA: Of course. I really started to like football since I came to London. Just think a year ago I was still in Montreal and didn't know a thing about [interrupt] football culture here, but now I can't imagine not following the games, especially with how passionate the fans are and how the entire city comes alive during major matches. \nB: Sorry to cut in, but I'm curious—what made you start liking football after moving to London? Was it the atmosphere or something specific? \nA: It was definitely the atmosphere! The energy here is contagious. But I was about to say that when I was in Montreal, I didn't know a thing about it. How about you? Do you feel the same way about any sport since moving to London? \nB: Well, I'm from New Jersey. Americans aren't so into football, either. Actually, we call it soccer. When Americans say football, what we mean is American rules football. I've been here 2 years now, and I still get confused when people call soccer [interrupt] football, especially when I watch the news or talk to locals about upcoming matches and have to mentally switch between the two sports in my head. \nA: Soccer? Yeah, I can imagine. It must be tricky adjusting to all the different terminologies. Do you think you'll ever get used to it? \nB: Maybe, but it's still odd to me. For us, football means the sport where those big guys wear helmets and violently run into each other.", + "cleaned_text": "A: Have you been watching the Euro 2012 football tournament? \nB: Just a bit. Have you? \nA:Of course. I really started to like football since I came to London. Just think a year ago I was still in Montreal and didn't know a thing about football culture here, but now I can't imagine not following the games, especially with how passionate the fans are and how the entire city comes alive during major matches.\nB: Sorry to cut in, but I'm curious—what made you start liking football after moving to London? Was it the atmosphere or something specific? \nA: It was definitely the atmosphere! The energy here is contagious. But I was about to say that when I was in Montreal, I didn't know a thing about it. How about you? Do you feel the same way about any sport since moving to London? \nB:Well, I'm from New Jersey. Americans aren't so into football, either. Actually, we call it soccer. When Americans say football, what we mean is American rules football. I've been here 2 years now, and I still get confused when people call soccer football, especially when I watch the news or talk to locals about upcoming matches and have to mentally switch between the two sports in my head.\nA: Soccer? Yeah, I can imagine. It must be tricky adjusting to all the different terminologies. Do you think you'll ever get used to it? \nB: Maybe, but it's still odd to me. For us, football means the sport where those big guys wear helmets and violently run into each other.", + "total_duration": 75.33097505668934, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you been watching the Euro 2012 football tournament?", + "original_text": "Have you been watching the Euro 2012 football tournament?", + "start_time": 0, + "end_time": 3.215963718820862, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just a bit. Have you?", + "original_text": "Just a bit. Have you?", + "start_time": 3.5346863412807417, + "end_time": 4.730514005679835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_1_B.wav", + "silence_duration": 0.31872262245987965, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Of course. I really started to like football since I came to London. Just think a year ago I was still in Montreal and didn't know a thing about", + "original_text": "Of course. I really started to like football since I came to London. Just think a year ago I was still in Montreal and didn't know a thing about [interrupt] football culture here, but now I can't imagine not following the games, especially with how passionate the fans are and how the entire city comes alive during major matches.", + "start_time": 5.0976147731864, + "end_time": 23.17434946706395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_2_A.wav", + "silence_duration": 0.36710076750656534, + "is_interrupted": true, + "text_after_interrupt": "football culture here, but now I can't imagine not following the games, especially with how passionate the fans are and how the entire city comes alive during major matches." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but I'm curious—what made you start liking football after moving to London? Was it the atmosphere or something specific?", + "original_text": "Sorry to cut in, but I'm curious—what made you start liking football after moving to London? Was it the atmosphere or something specific?", + "start_time": 13.410358537358736, + "end_time": 20.480834727834925, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_3_B.wav", + "silence_duration": 0.3599255531308145, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It was definitely the atmosphere! The energy here is contagious. But I was about to say that when I was in Montreal, I didn't know a thing about it. How about you? Do you feel the same way about any sport since moving to London?", + "original_text": "It was definitely the atmosphere! The energy here is contagious. But I was about to say that when I was in Montreal, I didn't know a thing about it. How about you? Do you feel the same way about any sport since moving to London?", + "start_time": 23.618813963603582, + "end_time": 37.67849650328612, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_4_A.wav", + "silence_duration": 0.44446449653963066, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I'm from New Jersey. Americans aren't so into football, either. Actually, we call it soccer. When Americans say football, what we mean is American rules football. I've been here 2 years now, and I still get confused when people call soccer", + "original_text": "Well, I'm from New Jersey. Americans aren't so into football, either. Actually, we call it soccer. When Americans say football, what we mean is American rules football. I've been here 2 years now, and I still get confused when people call soccer [interrupt] football, especially when I watch the news or talk to locals about upcoming matches and have to mentally switch between the two sports in my head.", + "start_time": 37.998186790273294, + "end_time": 57.5958285136293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_5_B.wav", + "silence_duration": 0.319690286987177, + "is_interrupted": true, + "text_after_interrupt": "football, especially when I watch the news or talk to locals about upcoming matches and have to mentally switch between the two sports in my head." + }, + { + "speaker": "A", + "text": "Soccer? Yeah, I can imagine. It must be tricky adjusting to all the different terminologies. Do you think you'll ever get used to it?", + "original_text": "Soccer? Yeah, I can imagine. It must be tricky adjusting to all the different terminologies. Do you think you'll ever get used to it?", + "start_time": 58.648197793080456, + "end_time": 67.18153112641379, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_6_A.wav", + "silence_duration": 0.3556332849149016, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Maybe, but it's still odd to me. For us, football means the sport where those big guys wear helmets and violently run into each other.", + "original_text": "Maybe, but it's still odd to me. For us, football means the sport where those big guys wear helmets and violently run into each other.", + "start_time": 67.5987452251743, + "end_time": 75.33099012313349, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--243/temp/line_7_B.wav", + "silence_duration": 0.41721409876051196, + "is_interrupted": false + } + ] + }, + "DialogSum--val--244": { + "original_text": "A: Is that the Park Hotel? Reservation desk, please. \nB: Reservation desk. May I help you? \nA: Yes, please. I'm phoning from the airport here in Los Angeles. I'd like to reserve a single room for [interrupt] tonight with a queen-sized bed if possible, as I've had a long flight and would appreciate some extra comfort after my journey. I should be arriving in a few hours. \nB: Sorry to interrupt, sir. Just to confirm, will you be needing any special amenities or services during your stay? \nA: Oh, no special amenities needed, just a single room for tonight. \nB: Alright, sir. That's a single room with a bath? \nA: That's right. How much will that be? \nB: Our singles begin at 45 per night, sir. \nA: Good. In that case, I'll take a room, please. \nB: Your name, please. \nA: My name is Tony Chan. T-O-N-Y. \nB: Thank you, Mr. Chan. When will you be arriving? \nA: Sorry, I forgot to ask earlier—does that rate include breakfast? \nB: No, sir, breakfast is an additional charge. Now, when will you be arriving? \nA: I'm arriving very soon. I'm waiting for a taxi to the hotel. \nB: Right, sir. We'll hold your room for you until 9:00 PM.", + "cleaned_text": "A: Is that the Park Hotel? Reservation desk, please. \nB: Reservation desk. May I help you? \nA:Yes, please. I'm phoning from the airport here in Los Angeles. I'd like to reserve a single room for tonight with a queen-sized bed if possible, as I've had a long flight and would appreciate some extra comfort after my journey. I should be arriving in a few hours.\nB: Sorry to interrupt, sir. Just to confirm, will you be needing any special amenities or services during your stay? \nA: Oh, no special amenities needed, just a single room for tonight. \nB: Alright, sir. That's a single room with a bath? \nA: That's right. How much will that be? \nB: Our singles begin at 45 per night, sir. \nA: Good. In that case, I'll take a room, please. \nB: Your name, please. \nA: My name is Tony Chan. T-O-N-Y. \nB: Thank you, Mr. Chan. When will you be arriving? \nA: Sorry, I forgot to ask earlier—does that rate include breakfast? \nB: No, sir, breakfast is an additional charge. Now, when will you be arriving? \nA: I'm arriving very soon. I'm waiting for a taxi to the hotel. \nB: Right, sir. We'll hold your room for you until 9:00 PM.", + "total_duration": 63.72897959183673, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is that the Park Hotel? Reservation desk, please.", + "original_text": "Is that the Park Hotel? Reservation desk, please.", + "start_time": 0, + "end_time": 3.5294331065759637, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Reservation desk. May I help you?", + "original_text": "Reservation desk. May I help you?", + "start_time": 4.043625615626087, + "end_time": 5.843172100886857, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_1_B.wav", + "silence_duration": 0.5141925090501226, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, please. I'm phoning from the airport here in Los Angeles. I'd like to reserve a single room for", + "original_text": "Yes, please. I'm phoning from the airport here in Los Angeles. I'd like to reserve a single room for [interrupt] tonight with a queen-sized bed if possible, as I've had a long flight and would appreciate some extra comfort after my journey. I should be arriving in a few hours.", + "start_time": 6.221687472349919, + "end_time": 23.090984524504115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_2_A.wav", + "silence_duration": 0.37851537146306247, + "is_interrupted": true, + "text_after_interrupt": "tonight with a queen-sized bed if possible, as I've had a long flight and would appreciate some extra comfort after my journey. I should be arriving in a few hours." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, sir. Just to confirm, will you be needing any special amenities or services during your stay?", + "original_text": "Sorry to interrupt, sir. Just to confirm, will you be needing any special amenities or services during your stay?", + "start_time": 12.711664796612958, + "end_time": 18.551483390717266, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_3_B.wav", + "silence_duration": 0.4928716737261539, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, no special amenities needed, just a single room for tonight.", + "original_text": "Oh, no special amenities needed, just a single room for tonight.", + "start_time": 23.673739092996584, + "end_time": 27.86494090705554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_4_A.wav", + "silence_duration": 0.5827545684924677, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Alright, sir. That's a single room with a bath?", + "original_text": "Alright, sir. That's a single room with a bath?", + "start_time": 28.37450639705325, + "end_time": 30.626841997960277, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_5_B.wav", + "silence_duration": 0.5095654899977086, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's right. How much will that be?", + "original_text": "That's right. How much will that be?", + "start_time": 31.099786176332923, + "end_time": 33.13153220807895, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_6_A.wav", + "silence_duration": 0.4729441783726457, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Our singles begin at 45 per night, sir.", + "original_text": "Our singles begin at 45 per night, sir.", + "start_time": 33.65593425289131, + "end_time": 36.10563946831081, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_7_B.wav", + "silence_duration": 0.5244020448123626, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good. In that case, I'll take a room, please.", + "original_text": "Good. In that case, I'll take a room, please.", + "start_time": 36.658772241837084, + "end_time": 39.32906702641758, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_8_A.wav", + "silence_duration": 0.5531327735262725, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Your name, please.", + "original_text": "Your name, please.", + "start_time": 39.64621866579779, + "end_time": 40.6795066476572, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_9_B.wav", + "silence_duration": 0.31715163938020524, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "My name is Tony Chan. T-O-N-Y.", + "original_text": "My name is Tony Chan. T-O-N-Y.", + "start_time": 41.141061434828586, + "end_time": 44.43829499491929, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_10_A.wav", + "silence_duration": 0.4615547871713849, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you, Mr. Chan. When will you be arriving?", + "original_text": "Thank you, Mr. Chan. When will you be arriving?", + "start_time": 44.97940667258513, + "end_time": 47.196912341519365, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_11_B.wav", + "silence_duration": 0.5411116776658387, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, I forgot to ask earlier—does that rate include breakfast?", + "original_text": "Sorry, I forgot to ask earlier—does that rate include breakfast?", + "start_time": 47.55024540970499, + "end_time": 51.40475788136032, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_12_A.wav", + "silence_duration": 0.35333306818562366, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, sir, breakfast is an additional charge. Now, when will you be arriving?", + "original_text": "No, sir, breakfast is an additional charge. Now, when will you be arriving?", + "start_time": 51.998380966705476, + "end_time": 56.0734830075218, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_13_B.wav", + "silence_duration": 0.5936230853451563, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm arriving very soon. I'm waiting for a taxi to the hotel.", + "original_text": "I'm arriving very soon. I'm waiting for a taxi to the hotel.", + "start_time": 56.455496241245456, + "end_time": 60.47254839544047, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_14_A.wav", + "silence_duration": 0.38201323372365725, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right, sir. We'll hold your room for you until 9:00 PM.", + "original_text": "Right, sir. We'll hold your room for you until 9:00 PM.", + "start_time": 60.89617919170385, + "end_time": 63.72901365882403, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--244/temp/line_15_B.wav", + "silence_duration": 0.4236307962633782, + "is_interrupted": false + } + ] + }, + "DialogSum--val--245": { + "original_text": "A: Hello is that Phil Taylor? \nB: Speaking. \nA: Hi Phil. I'm a Reporter for the Sun. I'm calling to ask you a few questions about the fire. Can you tell me how it happened? \nB: Sure. Well it was 2 days ago on November the tenth about 11:00 PM. I decided to fry some chips so I used quite a lot of oil. I was deep frying. Uhm the oil finally got hot enough, so I put the chips in and then my mom [interrupt] called me on the phone just as I was about to check on the food, and we ended up having a long conversation about family matters that distracted me completely. \nA: Sorry to interrupt, Phil. Did you say you were alone at home when this happened? \nB: Yes, I was. My mom rang me, and we started talking. I completely forgot about the chips. After the call, I just went back to my living room. \nA: Oh no. \nB: Yes, I watched TV for about 20 minutes and the next thing I knew there was the smell of smoke and someone was shouting fire fire. I immediately realized it was my chips. I rushed out of the room. The kitchen was next door. Well, there were flames all over one wall. \nA: What did you do? \nB: Well, I grabbed some blankets from my bed and ran to the kitchen to throw them over the flames. By that time, my neighbors had already called the fire Department. The firefighters arrived, I think within about 10 minutes and put the fire out very quickly. \nA: So what was the damage? \nB: Well. I'll have to replace the cooker completely. Besides, I have to have 2 kitchen units and one wall repaired. Oh, and I didn't mention—my mom was still on the line when I realized the fire had started. She was so worried.", + "cleaned_text": "A: Hello is that Phil Taylor? \nB: Speaking. \nA: Hi Phil. I'm a Reporter for the Sun. I'm calling to ask you a few questions about the fire. Can you tell me how it happened? \nB:Sure. Well it was 2 days ago on November the tenth about 11:00 PM. I decided to fry some chips so I used quite a lot of oil. I was deep frying. Uhm the oil finally got hot enough, so I put the chips in and then my mom called me on the phone just as I was about to check on the food, and we ended up having a long conversation about family matters that distracted me completely.\nA: Sorry to interrupt, Phil. Did you say you were alone at home when this happened? \nB: Yes, I was. My mom rang me, and we started talking. I completely forgot about the chips. After the call, I just went back to my living room. \nA: Oh no. \nB: Yes, I watched TV for about 20 minutes and the next thing I knew there was the smell of smoke and someone was shouting fire fire. I immediately realized it was my chips. I rushed out of the room. The kitchen was next door. Well, there were flames all over one wall. \nA: What did you do? \nB: Well, I grabbed some blankets from my bed and ran to the kitchen to throw them over the flames. By that time, my neighbors had already called the fire Department. The firefighters arrived, I think within about 10 minutes and put the fire out very quickly. \nA: So what was the damage? \nB: Well. I'll have to replace the cooker completely. Besides, I have to have 2 kitchen units and one wall repaired. Oh, and I didn't mention—my mom was still on the line when I realized the fire had started. She was so worried.", + "total_duration": 85.46408163265306, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello is that Phil Taylor?", + "original_text": "Hello is that Phil Taylor?", + "start_time": 0, + "end_time": 1.6137868480725623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Speaking.", + "original_text": "Speaking.", + "start_time": 1.993500120893113, + "end_time": 2.6900987603488953, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_1_B.wav", + "silence_duration": 0.3797132728205506, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hi Phil. I'm a Reporter for the Sun. I'm calling to ask you a few questions about the fire. Can you tell me how it happened?", + "original_text": "Hi Phil. I'm a Reporter for the Sun. I'm calling to ask you a few questions about the fire. Can you tell me how it happened?", + "start_time": 3.2667903790001165, + "end_time": 11.358944574011455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_2_A.wav", + "silence_duration": 0.5766916186512212, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. Well it was 2 days ago on November the tenth about 11:00 PM. I decided to fry some chips so I used quite a lot of oil. I was deep frying. Uhm the oil finally got hot enough, so I put the chips in and then my mom", + "original_text": "Sure. Well it was 2 days ago on November the tenth about 11:00 PM. I decided to fry some chips so I used quite a lot of oil. I was deep frying. Uhm the oil finally got hot enough, so I put the chips in and then my mom [interrupt] called me on the phone just as I was about to check on the food, and we ended up having a long conversation about family matters that distracted me completely.", + "start_time": 11.788188312055626, + "end_time": 31.94310894697626, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_3_B.wav", + "silence_duration": 0.42924373804417115, + "is_interrupted": true, + "text_after_interrupt": "called me on the phone just as I was about to check on the food, and we ended up having a long conversation about family matters that distracted me completely." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, Phil. Did you say you were alone at home when this happened?", + "original_text": "Sorry to interrupt, Phil. Did you say you were alone at home when this happened?", + "start_time": 24.001884457180342, + "end_time": 28.11181642996946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_4_A.wav", + "silence_duration": 0.33627215628342805, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I was. My mom rang me, and we started talking. I completely forgot about the chips. After the call, I just went back to my living room.", + "original_text": "Yes, I was. My mom rang me, and we started talking. I completely forgot about the chips. After the call, I just went back to my living room.", + "start_time": 32.40025331825732, + "end_time": 40.0396183976224, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_5_B.wav", + "silence_duration": 0.45714437128106244, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh no.", + "original_text": "Oh no.", + "start_time": 40.47257293677694, + "end_time": 41.22722146285404, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_6_A.wav", + "silence_duration": 0.43295453915454646, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I watched TV for about 20 minutes and the next thing I knew there was the smell of smoke and someone was shouting fire fire. I immediately realized it was my chips. I rushed out of the room. The kitchen was next door. Well, there were flames all over one wall.", + "original_text": "Yes, I watched TV for about 20 minutes and the next thing I knew there was the smell of smoke and someone was shouting fire fire. I immediately realized it was my chips. I rushed out of the room. The kitchen was next door. Well, there were flames all over one wall.", + "start_time": 41.728945613384056, + "end_time": 56.71742633900764, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_7_B.wav", + "silence_duration": 0.501724150530016, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What did you do?", + "original_text": "What did you do?", + "start_time": 57.117853370009875, + "end_time": 58.17436130651781, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_8_A.wav", + "silence_duration": 0.400427031002237, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I grabbed some blankets from my bed and ran to the kitchen to throw them over the flames. By that time, my neighbors had already called the fire Department. The firefighters arrived, I think within about 10 minutes and put the fire out very quickly.", + "original_text": "Well, I grabbed some blankets from my bed and ran to the kitchen to throw them over the flames. By that time, my neighbors had already called the fire Department. The firefighters arrived, I think within about 10 minutes and put the fire out very quickly.", + "start_time": 58.76413996858243, + "end_time": 71.16359575089535, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_9_B.wav", + "silence_duration": 0.5897786620646182, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So what was the damage?", + "original_text": "So what was the damage?", + "start_time": 71.73163876947746, + "end_time": 73.22932584430738, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_10_A.wav", + "silence_duration": 0.5680430185820968, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well. I'll have to replace the cooker completely. Besides, I have to have 2 kitchen units and one wall repaired. Oh, and I didn't mention—my mom was still on the line when I realized the fire had started. She was so worried.", + "original_text": "Well. I'll have to replace the cooker completely. Besides, I have to have 2 kitchen units and one wall repaired. Oh, and I didn't mention—my mom was still on the line when I realized the fire had started. She was so worried.", + "start_time": 73.726399550401, + "end_time": 85.46408662523093, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--245/temp/line_11_B.wav", + "silence_duration": 0.49707370609361223, + "is_interrupted": false + } + ] + }, + "DialogSum--val--248": { + "original_text": "A: Oh, what a beautiful cat! What do you [interrupt] think about adopting one like this? I've heard they're relatively low-maintenance compared to other pets and can be just as affectionate when they want to be.\nB: Sorry to interrupt, but I just want to say, I think I'd rather get a dog. Dogs are more faithful than cats.\nA: Yes, but they require so much work. Would you be willing to walk it every single day and clean up after it?\nB: We'd have to invest a lot of money in a cage or a fish tank, and I don't really know how to take care of a bird or [interrupt] other pets that need special equipment like temperature-controlled environments and specific dietary requirements that might be difficult to maintain consistently.\nA: Hold on, I was asking about walking the dog every day. Are you okay with that?\nB: Oh, right. Walking the dog every day might be tough. Maybe you're right, we're obviously not ready to get a pet yet.\nA: Yeah, you're right. Let's go grab some coffee and talk about it.", + "cleaned_text": "A:Oh, what a beautiful cat! What do you think about adopting one like this? I've heard they're relatively low-maintenance compared to other pets and can be just as affectionate when they want to be.\nB: Sorry to interrupt, but I just want to say, I think I'd rather get a dog. Dogs are more faithful than cats.\nA: Yes, but they require so much work. Would you be willing to walk it every single day and clean up after it?\nB:We'd have to invest a lot of money in a cage or a fish tank, and I don't really know how to take care of a bird or other pets that need special equipment like temperature-controlled environments and specific dietary requirements that might be difficult to maintain consistently.\nA: Hold on, I was asking about walking the dog every day. Are you okay with that?\nB: Oh, right. Walking the dog every day might be tough. Maybe you're right, we're obviously not ready to get a pet yet.\nA: Yeah, you're right. Let's go grab some coffee and talk about it.", + "total_duration": 47.000952380952384, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Oh, what a beautiful cat! What do you", + "original_text": "Oh, what a beautiful cat! What do you [interrupt] think about adopting one like this? I've heard they're relatively low-maintenance compared to other pets and can be just as affectionate when they want to be.", + "start_time": 0, + "end_time": 11.168798185941043, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "think about adopting one like this? I've heard they're relatively low-maintenance compared to other pets and can be just as affectionate when they want to be." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I just want to say, I think I'd rather get a dog. Dogs are more faithful than cats.", + "original_text": "Sorry to interrupt, but I just want to say, I think I'd rather get a dog. Dogs are more faithful than cats.", + "start_time": 2.809614512471655, + "end_time": 8.823582766439909, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/temp/line_1_B.wav", + "silence_duration": 0.41973055163177897, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, but they require so much work. Would you be willing to walk it every single day and clean up after it?", + "original_text": "Yes, but they require so much work. Would you be willing to walk it every single day and clean up after it?", + "start_time": 11.534366903274766, + "end_time": 18.070784136834856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/temp/line_2_A.wav", + "silence_duration": 0.36556871733372337, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We'd have to invest a lot of money in a cage or a fish tank, and I don't really know how to take care of a bird or", + "original_text": "We'd have to invest a lot of money in a cage or a fish tank, and I don't really know how to take care of a bird or [interrupt] other pets that need special equipment like temperature-controlled environments and specific dietary requirements that might be difficult to maintain consistently.", + "start_time": 18.584773257132966, + "end_time": 32.957925184570605, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/temp/line_3_B.wav", + "silence_duration": 0.5139891202981115, + "is_interrupted": true, + "text_after_interrupt": "other pets that need special equipment like temperature-controlled environments and specific dietary requirements that might be difficult to maintain consistently." + }, + { + "speaker": "A", + "text": "Hold on, I was asking about walking the dog every day. Are you okay with that?", + "original_text": "Hold on, I was asking about walking the dog every day. Are you okay with that?", + "start_time": 30.690406678963548, + "end_time": 35.380837517965816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/temp/line_4_A.wav", + "silence_duration": 0.49773607992381685, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right. Walking the dog every day might be tough. Maybe you're right, we're obviously not ready to get a pet yet.", + "original_text": "Oh, right. Walking the dog every day might be tough. Maybe you're right, we're obviously not ready to get a pet yet.", + "start_time": 35.71993944802251, + "end_time": 42.23313672693407, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/temp/line_5_B.wav", + "silence_duration": 0.33910193005669503, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, you're right. Let's go grab some coffee and talk about it.", + "original_text": "Yeah, you're right. Let's go grab some coffee and talk about it.", + "start_time": 42.82140258408058, + "end_time": 47.000994420815275, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--248/temp/line_6_A.wav", + "silence_duration": 0.5882658571465122, + "is_interrupted": false + } + ] + }, + "DialogSum--val--249": { + "original_text": "A: Darling, has our TV set been repaired? \nB: Not yet. They say they are still working on [interrupt] fixing the main circuit board, which apparently has some complex wiring issues that require specialized tools and replacement parts that aren't readily available in their workshop. \nA: Oh, it's a long day without any TV. Have you paid the internet bill? \nB: Sorry, I totally forgot. I will do it tomorrow. \nA: Oh dear. Think up something for us to do tonight, will you? \nB: Is there anything good on at the cinema tonight? \nA: Pass me the newspaper. Thanks. There is a Western on at the Maple Theater. \nB: John Wayne again? No. What else? \nA: There is a war movie on at the Silver Star Theater. But you don't usually like war movies, do you? \nB: No. Not really. But wait, you were saying something about the Silver Star Theater? \nA: Yes, I was just saying that you don't usually like war movies. Anyway, there's also a film at the Globe Theatre named *The Killer*. \nB: You know, I'd like to see a film that will cheer me up and help me relax. I don't want to see something frightening.", + "cleaned_text": "A: Darling, has our TV set been repaired? \nB:Not yet. They say they are still working on fixing the main circuit board, which apparently has some complex wiring issues that require specialized tools and replacement parts that aren't readily available in their workshop.\nA: Oh, it's a long day without any TV. Have you paid the internet bill? \nB: Sorry, I totally forgot. I will do it tomorrow. \nA: Oh dear. Think up something for us to do tonight, will you? \nB: Is there anything good on at the cinema tonight? \nA: Pass me the newspaper. Thanks. There is a Western on at the Maple Theater. \nB: John Wayne again? No. What else? \nA: There is a war movie on at the Silver Star Theater. But you don't usually like war movies, do you? \nB: No. Not really. But wait, you were saying something about the Silver Star Theater? \nA: Yes, I was just saying that you don't usually like war movies. Anyway, there's also a film at the Globe Theatre named *The Killer*. \nB: You know, I'd like to see a film that will cheer me up and help me relax. I don't want to see something frightening.", + "total_duration": 57.55546485260771, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Darling, has our TV set been repaired?", + "original_text": "Darling, has our TV set been repaired?", + "start_time": 0, + "end_time": 2.391655328798186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not yet. They say they are still working on", + "original_text": "Not yet. They say they are still working on [interrupt] fixing the main circuit board, which apparently has some complex wiring issues that require specialized tools and replacement parts that aren't readily available in their workshop.", + "start_time": 2.913802632889172, + "end_time": 14.187090614748582, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_1_B.wav", + "silence_duration": 0.522147304090986, + "is_interrupted": true, + "text_after_interrupt": "fixing the main circuit board, which apparently has some complex wiring issues that require specialized tools and replacement parts that aren't readily available in their workshop." + }, + { + "speaker": "A", + "text": "Oh, it's a long day without any TV. Have you paid the internet bill?", + "original_text": "Oh, it's a long day without any TV. Have you paid the internet bill?", + "start_time": 5.3867278029572, + "end_time": 10.158428483229308, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_2_A.wav", + "silence_duration": 0.5986760906148358, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry, I totally forgot. I will do it tomorrow.", + "original_text": "Sorry, I totally forgot. I will do it tomorrow.", + "start_time": 14.612245938448114, + "end_time": 17.77015977064766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_3_B.wav", + "silence_duration": 0.42515532369953196, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh dear. Think up something for us to do tonight, will you?", + "original_text": "Oh dear. Think up something for us to do tonight, will you?", + "start_time": 18.204495449318827, + "end_time": 21.339189326869846, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_4_A.wav", + "silence_duration": 0.43433567867116907, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is there anything good on at the cinema tonight?", + "original_text": "Is there anything good on at the cinema tonight?", + "start_time": 21.6445396438443, + "end_time": 23.838825358130016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_5_B.wav", + "silence_duration": 0.3053503169744538, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Pass me the newspaper. Thanks. There is a Western on at the Maple Theater.", + "original_text": "Pass me the newspaper. Thanks. There is a Western on at the Maple Theater.", + "start_time": 24.332140640345152, + "end_time": 28.790371932862158, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_6_A.wav", + "silence_duration": 0.4933152822151359, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "John Wayne again? No. What else?", + "original_text": "John Wayne again? No. What else?", + "start_time": 29.19918693534493, + "end_time": 31.3122028083608, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_7_B.wav", + "silence_duration": 0.40881500248277153, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There is a war movie on at the Silver Star Theater. But you don't usually like war movies, do you?", + "original_text": "There is a war movie on at the Silver Star Theater. But you don't usually like war movies, do you?", + "start_time": 31.78962378279126, + "end_time": 37.47851267168015, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_8_A.wav", + "silence_duration": 0.47742097443045994, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. Not really. But wait, you were saying something about the Silver Star Theater?", + "original_text": "No. Not really. But wait, you were saying something about the Silver Star Theater?", + "start_time": 37.952013191413116, + "end_time": 42.13160502814781, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_9_B.wav", + "silence_duration": 0.4735005197329627, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I was just saying that you don't usually like war movies. Anyway, there's also a film at the Globe Theatre named *The Killer*.", + "original_text": "Yes, I was just saying that you don't usually like war movies. Anyway, there's also a film at the Globe Theatre named *The Killer*.", + "start_time": 42.64181775364536, + "end_time": 51.86013974911022, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_10_A.wav", + "silence_duration": 0.5102127254975527, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You know, I'd like to see a film that will cheer me up and help me relax. I don't want to see something frightening.", + "original_text": "You know, I'd like to see a film that will cheer me up and help me relax. I don't want to see something frightening.", + "start_time": 52.423876617059804, + "end_time": 57.555486594384064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--249/temp/line_11_B.wav", + "silence_duration": 0.5637368679495898, + "is_interrupted": false + } + ] + }, + "DialogSum--val--252": { + "original_text": "A: There are many art craft items in this shop. I suggest you take your time, and you might find something you [interrupt] really like if you explore each section carefully, especially the hand-painted ceramics and embroidered silk pieces that showcase our local artisans' finest craftsmanship.\nB: Oh, actually, before I start browsing, could you tell me if there's anything particularly unique or rare here that I shouldn't miss?\nA: Certainly! That wood carving you're holding is very rare. But I'm so sorry, it is not for sale. [interrupt] It's actually a piece from a limited collection created by a master carver who only produced 10 such pieces before retiring, each featuring intricate details of mythical creatures from our local folklore.\nB: That's OK. Is there anything else you would recommend?\nA: Do you have any special request?\nB: I'd like to see some traditional arts.\nA: So that means you are shopping for presents?\nB: Yes, I'm just here to pick out some special presents for my foreign friends.\nA: Actually, I think the paper-cuts are a great option because they are easy to carry, and foreign friends are also interested in them. They think it's a miracle.\nB: Sounds good. I'll take the paper-cut. By the way, you mentioned something about the wood carving earlier—what makes it so rare?", + "cleaned_text": "A:There are many art craft items in this shop. I suggest you take your time, and you might find something you really like if you explore each section carefully, especially the hand-painted ceramics and embroidered silk pieces that showcase our local artisans' finest craftsmanship.\nB: Oh, actually, before I start browsing, could you tell me if there's anything particularly unique or rare here that I shouldn't miss?\nA:Certainly! That wood carving you're holding is very rare. But I'm so sorry, it is not for sale. It's actually a piece from a limited collection created by a master carver who only produced 10 such pieces before retiring, each featuring intricate details of mythical creatures from our local folklore.\nB: That's OK. Is there anything else you would recommend?\nA: Do you have any special request?\nB: I'd like to see some traditional arts.\nA: So that means you are shopping for presents?\nB: Yes, I'm just here to pick out some special presents for my foreign friends.\nA: Actually, I think the paper-cuts are a great option because they are easy to carry, and foreign friends are also interested in them. They think it's a miracle.\nB: Sounds good. I'll take the paper-cut. By the way, you mentioned something about the wood carving earlier—what makes it so rare?", + "total_duration": 62.729886621315195, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "There are many art craft items in this shop. I suggest you take your time, and you might find something you", + "original_text": "There are many art craft items in this shop. I suggest you take your time, and you might find something you [interrupt] really like if you explore each section carefully, especially the hand-painted ceramics and embroidered silk pieces that showcase our local artisans' finest craftsmanship.", + "start_time": 0, + "end_time": 15.731519274376417, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "really like if you explore each section carefully, especially the hand-painted ceramics and embroidered silk pieces that showcase our local artisans' finest craftsmanship." + }, + { + "speaker": "B", + "text": "Oh, actually, before I start browsing, could you tell me if there's anything particularly unique or rare here that I shouldn't miss?", + "original_text": "Oh, actually, before I start browsing, could you tell me if there's anything particularly unique or rare here that I shouldn't miss?", + "start_time": 6.931156462585034, + "end_time": 14.767891156462586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_1_B.wav", + "silence_duration": 0.5763813807760105, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Certainly! That wood carving you're holding is very rare. But I'm so sorry, it is not for sale.", + "original_text": "Certainly! That wood carving you're holding is very rare. But I'm so sorry, it is not for sale. [interrupt] It's actually a piece from a limited collection created by a master carver who only produced 10 such pieces before retiring, each featuring intricate details of mythical creatures from our local folklore.", + "start_time": 16.311022303399287, + "end_time": 34.747666294328994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_2_A.wav", + "silence_duration": 0.5795030290228711, + "is_interrupted": true, + "text_after_interrupt": "It's actually a piece from a limited collection created by a master carver who only produced 10 such pieces before retiring, each featuring intricate details of mythical creatures from our local folklore." + }, + { + "speaker": "B", + "text": "That's OK. Is there anything else you would recommend?", + "original_text": "That's OK. Is there anything else you would recommend?", + "start_time": 30.756197158706296, + "end_time": 33.91411099090584, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_3_B.wav", + "silence_duration": 0.5642822838872205, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you have any special request?", + "original_text": "Do you have any special request?", + "start_time": 35.27126252851378, + "end_time": 37.14046887772013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_4_A.wav", + "silence_duration": 0.5235962341847877, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like to see some traditional arts.", + "original_text": "I'd like to see some traditional arts.", + "start_time": 37.44154176920415, + "end_time": 39.380407982356076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_5_B.wav", + "silence_duration": 0.30107289148401795, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So that means you are shopping for presents?", + "original_text": "So that means you are shopping for presents?", + "start_time": 39.71867324085115, + "end_time": 42.07549863767655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_6_A.wav", + "silence_duration": 0.33826525849507527, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'm just here to pick out some special presents for my foreign friends.", + "original_text": "Yes, I'm just here to pick out some special presents for my foreign friends.", + "start_time": 42.48052570919165, + "end_time": 46.532407795359454, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_7_B.wav", + "silence_duration": 0.40502707151510164, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, I think the paper-cuts are a great option because they are easy to carry, and foreign friends are also interested in them. They think it's a miracle.", + "original_text": "Actually, I think the paper-cuts are a great option because they are easy to carry, and foreign friends are also interested in them. They think it's a miracle.", + "start_time": 46.97767444551292, + "end_time": 56.254046327599085, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_8_A.wav", + "silence_duration": 0.44526665015346534, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sounds good. I'll take the paper-cut. By the way, you mentioned something about the wood carving earlier—what makes it so rare?", + "original_text": "Sounds good. I'll take the paper-cut. By the way, you mentioned something about the wood carving earlier—what makes it so rare?", + "start_time": 56.75076313905078, + "end_time": 62.729901461046246, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--252/temp/line_9_B.wav", + "silence_duration": 0.49671681145169677, + "is_interrupted": false + } + ] + }, + "DialogSum--val--253": { + "original_text": "A: Can you squeeze me in sometime today? \nB: That's a big order, Jane. I am really swamped. \nA: I know what you're saying, but I have to go over the books with you before I go see our tax [interrupt] advisor tomorrow morning. There are several complex financial transactions from last quarter that need careful review, and I've identified at least three major discrepancies I need your input on before I finalize everything. \nB: Wait, you're seeing the tax guy today? That's cutting it close. \nA: Yes, I am. That's why it's urgent. Can you make it happen? \nB: Right. Okay, let me see what I can do. How about 1:30 right after my lunch meeting? It won't take more than a half hour, will it? \nA: No, it shouldn't. And I was going to say, it's important I review everything before the tax guy sees it. I want to make sure we're not missing anything critical that could trigger an audit or cause problems with our quarterly filings.", + "cleaned_text": "A: Can you squeeze me in sometime today? \nB: That's a big order, Jane. I am really swamped. \nA:I know what you're saying, but I have to go over the books with you before I go see our tax advisor tomorrow morning. There are several complex financial transactions from last quarter that need careful review, and I've identified at least three major discrepancies I need your input on before I finalize everything.\nB: Wait, you're seeing the tax guy today? That's cutting it close. \nA: Yes, I am. That's why it's urgent. Can you make it happen? \nB: Right. Okay, let me see what I can do. How about 1:30 right after my lunch meeting? It won't take more than a half hour, will it? \nA: No, it shouldn't. And I was going to say, it's important I review everything before the tax guy sees it. I want to make sure we're not missing anything critical that could trigger an audit or cause problems with our quarterly filings.", + "total_duration": 50.31895691609977, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can you squeeze me in sometime today?", + "original_text": "Can you squeeze me in sometime today?", + "start_time": 0, + "end_time": 2.0549659863945577, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a big order, Jane. I am really swamped.", + "original_text": "That's a big order, Jane. I am really swamped.", + "start_time": 2.5655230334014822, + "end_time": 4.933958407551142, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/temp/line_1_B.wav", + "silence_duration": 0.5105570470069247, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I know what you're saying, but I have to go over the books with you before I go see our tax", + "original_text": "I know what you're saying, but I have to go over the books with you before I go see our tax [interrupt] advisor tomorrow morning. There are several complex financial transactions from last quarter that need careful review, and I've identified at least three major discrepancies I need your input on before I finalize everything.", + "start_time": 5.270500876794938, + "end_time": 23.38206550264528, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/temp/line_2_A.wav", + "silence_duration": 0.3365424692437965, + "is_interrupted": true, + "text_after_interrupt": "advisor tomorrow morning. There are several complex financial transactions from last quarter that need careful review, and I've identified at least three major discrepancies I need your input on before I finalize everything." + }, + { + "speaker": "B", + "text": "Wait, you're seeing the tax guy today? That's cutting it close.", + "original_text": "Wait, you're seeing the tax guy today? That's cutting it close.", + "start_time": 10.367280922146412, + "end_time": 13.943153938019428, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/temp/line_3_B.wav", + "silence_duration": 0.553921089343794, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I am. That's why it's urgent. Can you make it happen?", + "original_text": "Yes, I am. That's why it's urgent. Can you make it happen?", + "start_time": 23.90648228289468, + "end_time": 28.097684096953635, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/temp/line_4_A.wav", + "silence_duration": 0.5244167802493995, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right. Okay, let me see what I can do. How about 1:30 right after my lunch meeting? It won't take more than a half hour, will it?", + "original_text": "Right. Okay, let me see what I can do. How about 1:30 right after my lunch meeting? It won't take more than a half hour, will it?", + "start_time": 28.658256776929974, + "end_time": 36.471771516159, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/temp/line_5_B.wav", + "silence_duration": 0.56057267997634, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, it shouldn't. And I was going to say, it's important I review everything before the tax guy sees it. I want to make sure we're not missing anything critical that could trigger an audit or cause problems with our quarterly filings.", + "original_text": "No, it shouldn't. And I was going to say, it's important I review everything before the tax guy sees it. I want to make sure we're not missing anything critical that could trigger an audit or cause problems with our quarterly filings.", + "start_time": 37.02554736476665, + "end_time": 50.31897140104783, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--253/temp/line_6_A.wav", + "silence_duration": 0.5537758486076463, + "is_interrupted": false + } + ] + }, + "DialogSum--val--254": { + "original_text": "A: What can I do for you today? \nB: I need to buy a new refrigerator today. \nA: Were you looking at a particular refrigerator? \nB: I like that Kenmore [interrupt] model over there. It looks like it would fit perfectly in my kitchen and has the modern stainless steel finish that matches my other appliances. \nA: Sorry to jump in, but are you looking for any specific features like an ice maker or a water dispenser? \nB: Yes, I do want those features. Does the Kenmore have them? \nA: This particular refrigerator is a very good choice. Not only is it affordable, but it comes with all the [interrupt] features you might need, including an ice maker, water dispenser, adjustable shelves, and even a smart temperature control system that helps keep your food fresher for longer. \nB: Just to clarify, when you say \"all the appliances,\" do you mean it includes an ice maker and a water dispenser? \nA: Yes, it has an ice maker, water dispenser, and plenty of room on the inside. I was also going to mention that it has a really efficient cooling system. \nB: I'd like to see it for myself. \nA: Go right ahead. \nB: I like what I see.", + "cleaned_text": "A: What can I do for you today? \nB: I need to buy a new refrigerator today. \nA: Were you looking at a particular refrigerator? \nB:I like that Kenmore model over there. It looks like it would fit perfectly in my kitchen and has the modern stainless steel finish that matches my other appliances.\nA: Sorry to jump in, but are you looking for any specific features like an ice maker or a water dispenser? \nB: Yes, I do want those features. Does the Kenmore have them? \nA:This particular refrigerator is a very good choice. Not only is it affordable, but it comes with all the features you might need, including an ice maker, water dispenser, adjustable shelves, and even a smart temperature control system that helps keep your food fresher for longer.\nB: Just to clarify, when you say \"all the appliances,\" do you mean it includes an ice maker and a water dispenser? \nA: Yes, it has an ice maker, water dispenser, and plenty of room on the inside. I was also going to mention that it has a really efficient cooling system. \nB: I'd like to see it for myself. \nA: Go right ahead. \nB: I like what I see.", + "total_duration": 55.0340589569161, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What can I do for you today?", + "original_text": "What can I do for you today?", + "start_time": 0, + "end_time": 1.7763265306122449, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I need to buy a new refrigerator today.", + "original_text": "I need to buy a new refrigerator today.", + "start_time": 2.3697487400416106, + "end_time": 4.598864386300114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_1_B.wav", + "silence_duration": 0.5934222094293656, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Were you looking at a particular refrigerator?", + "original_text": "Were you looking at a particular refrigerator?", + "start_time": 4.96319086933126, + "end_time": 7.273576356859605, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_2_A.wav", + "silence_duration": 0.36432648303114634, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like that Kenmore", + "original_text": "I like that Kenmore [interrupt] model over there. It looks like it would fit perfectly in my kitchen and has the modern stainless steel finish that matches my other appliances.", + "start_time": 7.683839684502996, + "end_time": 15.79921383416286, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_3_B.wav", + "silence_duration": 0.41026332764339124, + "is_interrupted": true, + "text_after_interrupt": "model over there. It looks like it would fit perfectly in my kitchen and has the modern stainless steel finish that matches my other appliances." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but are you looking for any specific features like an ice maker or a water dispenser?", + "original_text": "Sorry to jump in, but are you looking for any specific features like an ice maker or a water dispenser?", + "start_time": 8.972547167496193, + "end_time": 15.38125465048939, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_4_A.wav", + "silence_duration": 0.3722611681235535, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I do want those features. Does the Kenmore have them?", + "original_text": "Yes, I do want those features. Does the Kenmore have them?", + "start_time": 16.283967191822594, + "end_time": 19.755350411777243, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_5_B.wav", + "silence_duration": 0.48475335765973393, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "This particular refrigerator is a very good choice. Not only is it affordable, but it comes with all the", + "original_text": "This particular refrigerator is a very good choice. Not only is it affordable, but it comes with all the [interrupt] features you might need, including an ice maker, water dispenser, adjustable shelves, and even a smart temperature control system that helps keep your food fresher for longer.", + "start_time": 20.149698180656166, + "end_time": 37.320854643241205, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_6_A.wav", + "silence_duration": 0.3943477688789241, + "is_interrupted": true, + "text_after_interrupt": "features you might need, including an ice maker, water dispenser, adjustable shelves, and even a smart temperature control system that helps keep your food fresher for longer." + }, + { + "speaker": "B", + "text": "Just to clarify, when you say \"all the appliances,\" do you mean it includes an ice maker and a water dispenser?", + "original_text": "Just to clarify, when you say \"all the appliances,\" do you mean it includes an ice maker and a water dispenser?", + "start_time": 34.30534183150098, + "end_time": 40.07550056165971, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_7_B.wav", + "silence_duration": 0.5384575726736353, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it has an ice maker, water dispenser, and plenty of room on the inside. I was also going to mention that it has a really efficient cooling system.", + "original_text": "Yes, it has an ice maker, water dispenser, and plenty of room on the inside. I was also going to mention that it has a really efficient cooling system.", + "start_time": 40.5396382865592, + "end_time": 49.87406005526668, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_8_A.wav", + "silence_duration": 0.46413772489949356, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like to see it for myself.", + "original_text": "I'd like to see it for myself.", + "start_time": 50.19516326924105, + "end_time": 51.8437800492864, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_9_B.wav", + "silence_duration": 0.3211032139743685, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Go right ahead.", + "original_text": "Go right ahead.", + "start_time": 52.40706518035276, + "end_time": 53.463573116860694, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_10_A.wav", + "silence_duration": 0.5632851310663549, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like what I see.", + "original_text": "I like what I see.", + "start_time": 53.91952966914304, + "end_time": 55.03408749227229, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--254/temp/line_11_B.wav", + "silence_duration": 0.45595655228234644, + "is_interrupted": false + } + ] + }, + "DialogSum--val--255": { + "original_text": "A: Well, known, Jim, I'm... I'm pretty much in favour of your computers, I think computers teach kids to think, because they require logical [interrupt] sequences and structured approaches to problem-solving which help develop critical thinking abilities and foster creativity in unexpected ways.\nB: Sorry to jump in, but when you say logical thoughts, are you referring to problem-solving skills or something more specific?\nA: I was actually about to mention logical thoughts in terms of problem-solving, yes. But I... I don't agree with that because computers weaken kids' ability to think because kids don't learn basic skills.\nB: What do you mean by basic skills? Are you talking about things like spelling and arithmetic?\nA: Exactly. They can't spell, they can't add, they can't subtract, they even don't remember any more. That's because they rely on gadgets.", + "cleaned_text": "A:Well, known, Jim, I'm... I'm pretty much in favour of your computers, I think computers teach kids to think, because they require logical sequences and structured approaches to problem-solving which help develop critical thinking abilities and foster creativity in unexpected ways.\nB: Sorry to jump in, but when you say logical thoughts, are you referring to problem-solving skills or something more specific?\nA: I was actually about to mention logical thoughts in terms of problem-solving, yes. But I... I don't agree with that because computers weaken kids' ability to think because kids don't learn basic skills.\nB: What do you mean by basic skills? Are you talking about things like spelling and arithmetic?\nA: Exactly. They can't spell, they can't add, they can't subtract, they even don't remember any more. That's because they rely on gadgets.", + "total_duration": 45.26136054421769, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, known, Jim, I'm... I'm pretty much in favour of your computers, I think computers teach kids to think, because they require logical", + "original_text": "Well, known, Jim, I'm... I'm pretty much in favour of your computers, I think computers teach kids to think, because they require logical [interrupt] sequences and structured approaches to problem-solving which help develop critical thinking abilities and foster creativity in unexpected ways.", + "start_time": 0, + "end_time": 17.171156462585035, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "sequences and structured approaches to problem-solving which help develop critical thinking abilities and foster creativity in unexpected ways." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but when you say logical thoughts, are you referring to problem-solving skills or something more specific?", + "original_text": "Sorry to jump in, but when you say logical thoughts, are you referring to problem-solving skills or something more specific?", + "start_time": 9.1718820861678, + "end_time": 15.290340136054422, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/temp/line_1_B.wav", + "silence_duration": 0.5813810839862088, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was actually about to mention logical thoughts in terms of problem-solving, yes. But I... I don't agree with that because computers weaken kids' ability to think because kids don't learn basic skills.", + "original_text": "I was actually about to mention logical thoughts in terms of problem-solving, yes. But I... I don't agree with that because computers weaken kids' ability to think because kids don't learn basic skills.", + "start_time": 17.597680060388722, + "end_time": 31.146523597803686, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/temp/line_2_A.wav", + "silence_duration": 0.42652359780368687, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What do you mean by basic skills? Are you talking about things like spelling and arithmetic?", + "original_text": "What do you mean by basic skills? Are you talking about things like spelling and arithmetic?", + "start_time": 31.74643160573855, + "end_time": 36.10017310233719, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/temp/line_3_B.wav", + "silence_duration": 0.5999080079348653, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Exactly. They can't spell, they can't add, they can't subtract, they even don't remember any more. That's because they rely on gadgets.", + "original_text": "Exactly. They can't spell, they can't add, they can't subtract, they even don't remember any more. That's because they rely on gadgets.", + "start_time": 36.61194200155982, + "end_time": 45.26137510813578, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--255/temp/line_4_A.wav", + "silence_duration": 0.5117688992226295, + "is_interrupted": false + } + ] + }, + "DialogSum--val--256": { + "original_text": "A: Look, George, There's the Great Wall. \nB: I see. It's on top of the [interrupt] hills, and it stretches over the mountains for miles with such impressive architectural precision that it's hard to believe it was constructed centuries ago without modern technology. \nA: Sorry to jump in, but do you know where we can actually climb it? \nB: Oh, right! I was just about to say it's on top of the hills. And yes, we do have some choices. \nA: Do we have any choices? \nB: Well, we could take the cable car. \nA: Ah. . . let's just climb. It's more fun, I think. \nB: Okay. Let's go. \nA: Well, that was tough. \nB: But we made it. \nA: This looks great. When was it built?", + "cleaned_text": "A: Look, George, There's the Great Wall. \nB:I see. It's on top of the hills, and it stretches over the mountains for miles with such impressive architectural precision that it's hard to believe it was constructed centuries ago without modern technology.\nA: Sorry to jump in, but do you know where we can actually climb it? \nB: Oh, right! I was just about to say it's on top of the hills. And yes, we do have some choices. \nA: Do we have any choices? \nB: Well, we could take the cable car. \nA: Ah. . . let's just climb. It's more fun, I think. \nB: Okay. Let's go. \nA: Well, that was tough. \nB: But we made it. \nA: This looks great. When was it built?", + "total_duration": 35.689297052154195, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Look, George, There's the Great Wall.", + "original_text": "Look, George, There's the Great Wall.", + "start_time": 0, + "end_time": 2.6586848072562357, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see. It's on top of the", + "original_text": "I see. It's on top of the [interrupt] hills, and it stretches over the mountains for miles with such impressive architectural precision that it's hard to believe it was constructed centuries ago without modern technology.", + "start_time": 3.2137872468841264, + "end_time": 14.127165931691383, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_1_B.wav", + "silence_duration": 0.5551024396278906, + "is_interrupted": true, + "text_after_interrupt": "hills, and it stretches over the mountains for miles with such impressive architectural precision that it's hard to believe it was constructed centuries ago without modern technology." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but do you know where we can actually climb it?", + "original_text": "Sorry to jump in, but do you know where we can actually climb it?", + "start_time": 5.210703346657369, + "end_time": 9.22775550085238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_2_A.wav", + "silence_duration": 0.3036464467754378, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! I was just about to say it's on top of the hills. And yes, we do have some choices.", + "original_text": "Oh, right! I was just about to say it's on top of the hills. And yes, we do have some choices.", + "start_time": 14.654145871084452, + "end_time": 19.669656075166085, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_3_B.wav", + "silence_duration": 0.5269799393930692, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do we have any choices?", + "original_text": "Do we have any choices?", + "start_time": 20.218815815830816, + "end_time": 21.751332822633536, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_4_A.wav", + "silence_duration": 0.5491597406647294, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, we could take the cable car.", + "original_text": "Well, we could take the cable car.", + "start_time": 22.1909465177515, + "end_time": 23.94405309371522, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_5_B.wav", + "silence_duration": 0.4396136951179618, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah. . . let's just climb. It's more fun, I think.", + "original_text": "Ah. . . let's just climb. It's more fun, I think.", + "start_time": 24.363336019392836, + "end_time": 27.532859828916646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_6_A.wav", + "silence_duration": 0.4192829256776168, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Okay. Let's go.", + "original_text": "Okay. Let's go.", + "start_time": 27.976863694931332, + "end_time": 29.39328092849142, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_7_B.wav", + "silence_duration": 0.444003866014685, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, that was tough.", + "original_text": "Well, that was tough.", + "start_time": 29.761423998351436, + "end_time": 31.07335143599316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_8_A.wav", + "silence_duration": 0.3681430698600141, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But we made it.", + "original_text": "But we made it.", + "start_time": 31.588330358525436, + "end_time": 32.48229861249369, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_9_B.wav", + "silence_duration": 0.5149789225322765, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "This looks great. When was it built?", + "original_text": "This looks great. When was it built?", + "start_time": 32.94935782102896, + "end_time": 35.68931246955504, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--256/temp/line_10_A.wav", + "silence_duration": 0.46705920853526595, + "is_interrupted": false + } + ] + }, + "DialogSum--val--257": { + "original_text": "A: Hi, is this the Bread and Cheese Deli? \nB: Yes, ma'am. How may I help you? \nA: I need to place an order for a couple of sandwiches and drinks. Can you [interrupt] tell me if you have any vegetarian options available? I'm particularly interested in plant-based proteins and fresh vegetable combinations that might be on your seasonal menu. \nB: Sorry to jump in, but do you need this order delivered right away, or is there a specific time you'd prefer? \nA: Oh, I was just about to ask if you deliver. Yes, I would like it delivered around noon. \nB: We do deliveries for orders over $15, ma'am. Would you like to go ahead and place your order now?", + "cleaned_text": "A: Hi, is this the Bread and Cheese Deli? \nB: Yes, ma'am. How may I help you? \nA:I need to place an order for a couple of sandwiches and drinks. Can you tell me if you have any vegetarian options available? I'm particularly interested in plant-based proteins and fresh vegetable combinations that might be on your seasonal menu.\nB: Sorry to jump in, but do you need this order delivered right away, or is there a specific time you'd prefer? \nA: Oh, I was just about to ask if you deliver. Yes, I would like it delivered around noon. \nB: We do deliveries for orders over $15, ma'am. Would you like to go ahead and place your order now?", + "total_duration": 32.03333333333333, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, is this the Bread and Cheese Deli?", + "original_text": "Hi, is this the Bread and Cheese Deli?", + "start_time": 0, + "end_time": 2.948934240362812, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, ma'am. How may I help you?", + "original_text": "Yes, ma'am. How may I help you?", + "start_time": 3.3608069458559418, + "end_time": 5.009423725901293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/temp/line_1_B.wav", + "silence_duration": 0.4118727054931299, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I need to place an order for a couple of sandwiches and drinks. Can you", + "original_text": "I need to place an order for a couple of sandwiches and drinks. Can you [interrupt] tell me if you have any vegetarian options available? I'm particularly interested in plant-based proteins and fresh vegetable combinations that might be on your seasonal menu.", + "start_time": 5.571997190601267, + "end_time": 20.351498324388114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/temp/line_2_A.wav", + "silence_duration": 0.562573464699974, + "is_interrupted": true, + "text_after_interrupt": "tell me if you have any vegetarian options available? I'm particularly interested in plant-based proteins and fresh vegetable combinations that might be on your seasonal menu." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you need this order delivered right away, or is there a specific time you'd prefer?", + "original_text": "Sorry to jump in, but do you need this order delivered right away, or is there a specific time you'd prefer?", + "start_time": 9.403289707608069, + "end_time": 15.02251873255138, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/temp/line_3_B.wav", + "silence_duration": 0.40670773766659646, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was just about to ask if you deliver. Yes, I would like it delivered around noon.", + "original_text": "Oh, I was just about to ask if you deliver. Yes, I would like it delivered around noon.", + "start_time": 20.86633577259651, + "end_time": 26.125655500487667, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/temp/line_4_A.wav", + "silence_duration": 0.5148374482083956, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We do deliveries for orders over $15, ma'am. Would you like to go ahead and place your order now?", + "original_text": "We do deliveries for orders over $15, ma'am. Would you like to go ahead and place your order now?", + "start_time": 26.54183894491241, + "end_time": 32.03335821928883, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--257/temp/line_5_B.wav", + "silence_duration": 0.41618344442474164, + "is_interrupted": false + } + ] + }, + "DialogSum--val--258": { + "original_text": "A: Good morning. Could you tell me the times of trains to London, please? \nB: Yes. There are trains at 7:59, 9:18, and [interrupt] 10:32, which is actually the last morning express service that makes fewer stops and gets you to London in just under an hour and a half. These are the main morning departures. \nA: Sorry to interrupt, but could you also tell me what time the first train gets to London? \nB: Sure, the 7:59 train gets to London at 9:36. The other times I mentioned were 9:18 and 10:32. What about coming back? I'd like to come back at about 7 p.m. \nA: There's one at 7:10 p.m. and the next one is at 7:40 p.m. \nB: Mmm, how much is a return ticket? \nA: If you get on before 4 p.m. or after 6 p.m., there is a saver return which is 9 pounds. It's a good option if you're flexible with your travel times. \nB: Oh, and what about the ordinary return? I might need to travel during peak hours. \nA: The ordinary return is 16 pounds [interrupt] and includes unlimited travel on all services throughout the day, including the faster express trains during busy commuting hours.", + "cleaned_text": "A: Good morning. Could you tell me the times of trains to London, please? \nB:Yes. There are trains at 7:59, 9:18, and 10:32, which is actually the last morning express service that makes fewer stops and gets you to London in just under an hour and a half. These are the main morning departures.\nA: Sorry to interrupt, but could you also tell me what time the first train gets to London? \nB: Sure, the 7:59 train gets to London at 9:36. The other times I mentioned were 9:18 and 10:32. What about coming back? I'd like to come back at about 7 p.m. \nA: There's one at 7:10 p.m. and the next one is at 7:40 p.m. \nB: Mmm, how much is a return ticket? \nA: If you get on before 4 p.m. or after 6 p.m., there is a saver return which is 9 pounds. It's a good option if you're flexible with your travel times. \nB: Oh, and what about the ordinary return? I might need to travel during peak hours. \nA:The ordinary return is 16 pounds and includes unlimited travel on all services throughout the day, including the faster express trains during busy commuting hours.", + "total_duration": 62.09972789115646, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good morning. Could you tell me the times of trains to London, please?", + "original_text": "Good morning. Could you tell me the times of trains to London, please?", + "start_time": 0, + "end_time": 3.657142857142857, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. There are trains at 7:59, 9:18, and", + "original_text": "Yes. There are trains at 7:59, 9:18, and [interrupt] 10:32, which is actually the last morning express service that makes fewer stops and gets you to London in just under an hour and a half. These are the main morning departures.", + "start_time": 4.194484774475562, + "end_time": 16.95384985384064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_1_B.wav", + "silence_duration": 0.5373419173327046, + "is_interrupted": true, + "text_after_interrupt": "10:32, which is actually the last morning express service that makes fewer stops and gets you to London in just under an hour and a half. These are the main morning departures." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but could you also tell me what time the first train gets to London?", + "original_text": "Sorry to interrupt, but could you also tell me what time the first train gets to London?", + "start_time": 8.408906543183045, + "end_time": 13.50568658853452, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_2_A.wav", + "silence_duration": 0.43966824784254815, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, the 7:59 train gets to London at 9:36. The other times I mentioned were 9:18 and 10:32. What about coming back? I'd like to come back at about 7 p.m.", + "original_text": "Sure, the 7:59 train gets to London at 9:36. The other times I mentioned were 9:18 and 10:32. What about coming back? I'd like to come back at about 7 p.m.", + "start_time": 17.26202934911955, + "end_time": 28.07091823800844, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_3_B.wav", + "silence_duration": 0.3081794952789119, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There's one at 7:10 p.m. and the next one is at 7:40 p.m.", + "original_text": "There's one at 7:10 p.m. and the next one is at 7:40 p.m.", + "start_time": 28.44829966848897, + "end_time": 33.19678039411255, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_4_A.wav", + "silence_duration": 0.37738143048053163, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Mmm, how much is a return ticket?", + "original_text": "Mmm, how much is a return ticket?", + "start_time": 33.74944360227045, + "end_time": 35.90889938458338, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_5_B.wav", + "silence_duration": 0.5526632081579016, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "If you get on before 4 p.m. or after 6 p.m., there is a saver return which is 9 pounds. It's a good option if you're flexible with your travel times.", + "original_text": "If you get on before 4 p.m. or after 6 p.m., there is a saver return which is 9 pounds. It's a good option if you're flexible with your travel times.", + "start_time": 36.37736166734929, + "end_time": 46.512871871430924, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_6_A.wav", + "silence_duration": 0.46846228276591484, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, and what about the ordinary return? I might need to travel during peak hours.", + "original_text": "Oh, and what about the ordinary return? I might need to travel during peak hours.", + "start_time": 46.89032357557172, + "end_time": 51.348554868088726, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_7_B.wav", + "silence_duration": 0.3774517041407949, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The ordinary return is 16 pounds", + "original_text": "The ordinary return is 16 pounds [interrupt] and includes unlimited travel on all services throughout the day, including the faster express trains during busy commuting hours.", + "start_time": 51.68558058166173, + "end_time": 62.09973024152568, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--258/temp/line_8_A.wav", + "silence_duration": 0.3370257135730058, + "is_interrupted": true, + "text_after_interrupt": "and includes unlimited travel on all services throughout the day, including the faster express trains during busy commuting hours." + } + ] + }, + "DialogSum--val--260": { + "original_text": "A: But how did you know I was working for WebTracker? \nB: When I was in LA, I met the WebTracker sales rep. \nA: He couldn't have told you. Only a few people at WebTracker know about [interrupt] the confidential project I've been working on, which involves developing advanced tracking algorithms for government surveillance programs. \nB: The sales rep had a green notepad just like yours. He said everybody at WebTracker used them. \nA: Wait, the notepad? That's how you figured it out? I can't believe it. I can't believe I fell into your trap. \nB: We both may be snakes, Dave, but I'm just better at it. Among the snakes, I'm the sneakiest. \nA: But what was it you were going to say earlier? Only a few people at WebTracker know about what? \nB: Oh, right. I was going to say, only a few people at WebTracker know about the special project you were assigned to.", + "cleaned_text": "A: But how did you know I was working for WebTracker? \nB: When I was in LA, I met the WebTracker sales rep. \nA:He couldn't have told you. Only a few people at WebTracker know about the confidential project I've been working on, which involves developing advanced tracking algorithms for government surveillance programs.\nB: The sales rep had a green notepad just like yours. He said everybody at WebTracker used them. \nA: Wait, the notepad? That's how you figured it out? I can't believe it. I can't believe I fell into your trap. \nB: We both may be snakes, Dave, but I'm just better at it. Among the snakes, I'm the sneakiest. \nA: But what was it you were going to say earlier? Only a few people at WebTracker know about what? \nB: Oh, right. I was going to say, only a few people at WebTracker know about the special project you were assigned to.", + "total_duration": 44.58829931972789, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "But how did you know I was working for WebTracker?", + "original_text": "But how did you know I was working for WebTracker?", + "start_time": 0, + "end_time": 2.5774149659863945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "When I was in LA, I met the WebTracker sales rep.", + "original_text": "When I was in LA, I met the WebTracker sales rep.", + "start_time": 3.04124174823305, + "end_time": 6.094665784514229, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_1_B.wav", + "silence_duration": 0.4638267822466553, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "He couldn't have told you. Only a few people at WebTracker know about", + "original_text": "He couldn't have told you. Only a few people at WebTracker know about [interrupt] the confidential project I've been working on, which involves developing advanced tracking algorithms for government surveillance programs.", + "start_time": 6.566295132106829, + "end_time": 17.95568288720887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_2_A.wav", + "silence_duration": 0.47162934759259983, + "is_interrupted": true, + "text_after_interrupt": "the confidential project I've been working on, which involves developing advanced tracking algorithms for government surveillance programs." + }, + { + "speaker": "B", + "text": "The sales rep had a green notepad just like yours. He said everybody at WebTracker used them.", + "original_text": "The sales rep had a green notepad just like yours. He said everybody at WebTracker used them.", + "start_time": 10.502077445031999, + "end_time": 15.81944705954447, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_3_B.wav", + "silence_duration": 0.5738385819233394, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, the notepad? That's how you figured it out? I can't believe it. I can't believe I fell into your trap.", + "original_text": "Wait, the notepad? That's how you figured it out? I can't believe it. I can't believe I fell into your trap.", + "start_time": 18.431280639632938, + "end_time": 25.710736421945864, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_4_A.wav", + "silence_duration": 0.4755977524240692, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We both may be snakes, Dave, but I'm just better at it. Among the snakes, I'm the sneakiest.", + "original_text": "We both may be snakes, Dave, but I'm just better at it. Among the snakes, I'm the sneakiest.", + "start_time": 26.306195559743497, + "end_time": 31.40297560509497, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_5_B.wav", + "silence_duration": 0.5954591377976339, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But what was it you were going to say earlier? Only a few people at WebTracker know about what?", + "original_text": "But what was it you were going to say earlier? Only a few people at WebTracker know about what?", + "start_time": 31.96843926187639, + "end_time": 37.785037901332174, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_6_A.wav", + "silence_duration": 0.5654636567814222, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right. I was going to say, only a few people at WebTracker know about the special project you were assigned to.", + "original_text": "Oh, right. I was going to say, only a few people at WebTracker know about the special project you were assigned to.", + "start_time": 38.33054168691799, + "end_time": 44.588319464695765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--260/temp/line_7_B.wav", + "silence_duration": 0.5455037855858147, + "is_interrupted": false + } + ] + }, + "DialogSum--val--261": { + "original_text": "A: Last weekend I didn't want to go out either, so I stayed at home and played video games by myself. It was really [interrupt] relaxing to just unwind and immerse myself in the game for hours without any distractions or responsibilities weighing on my mind. \nB: Sorry to cut in, but what game were you playing? I'm curious because I might have played it too. \nA: Oh, I was playing \"The Legend of Eldoria.\" It's an RPG that I've been hooked on lately. Anyway, I was saying it was really fun! \nB: Oh yeah, that sounds pretty cool, I guess. . . \nA: Yeah, I'm really into video games. In fact, all my friends are on the Internet. I've never met any of them in the real [interrupt] world, but we've known each other for years through gaming and have developed deep friendships despite the physical distance between us. \nB: Wait, you've never met any of them? How do you manage to maintain those friendships without ever meeting in person? \nA: It's surprisingly easy! We chat a lot and play games together, which helps build a strong connection. But I was going to say, I've never met them in the real world, but we're planning to have a meetup soon.", + "cleaned_text": "A:Last weekend I didn't want to go out either, so I stayed at home and played video games by myself. It was really relaxing to just unwind and immerse myself in the game for hours without any distractions or responsibilities weighing on my mind.\nB: Sorry to cut in, but what game were you playing? I'm curious because I might have played it too. \nA: Oh, I was playing \"The Legend of Eldoria.\" It's an RPG that I've been hooked on lately. Anyway, I was saying it was really fun! \nB: Oh yeah, that sounds pretty cool, I guess. . . \nA:Yeah, I'm really into video games. In fact, all my friends are on the Internet. I've never met any of them in the real world, but we've known each other for years through gaming and have developed deep friendships despite the physical distance between us.\nB: Wait, you've never met any of them? How do you manage to maintain those friendships without ever meeting in person? \nA: It's surprisingly easy! We chat a lot and play games together, which helps build a strong connection. But I was going to say, I've never met them in the real world, but we're planning to have a meetup soon.", + "total_duration": 59.12965986394558, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Last weekend I didn't want to go out either, so I stayed at home and played video games by myself. It was really", + "original_text": "Last weekend I didn't want to go out either, so I stayed at home and played video games by myself. It was really [interrupt] relaxing to just unwind and immerse myself in the game for hours without any distractions or responsibilities weighing on my mind.", + "start_time": 0, + "end_time": 15.452879818594104, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "relaxing to just unwind and immerse myself in the game for hours without any distractions or responsibilities weighing on my mind." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but what game were you playing? I'm curious because I might have played it too.", + "original_text": "Sorry to cut in, but what game were you playing? I'm curious because I might have played it too.", + "start_time": 7.592925170068027, + "end_time": 12.852244897959185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/temp/line_1_B.wav", + "silence_duration": 0.5602114673367538, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was playing \"The Legend of Eldoria.\" It's an RPG that I've been hooked on lately. Anyway, I was saying it was really fun!", + "original_text": "Oh, I was playing \"The Legend of Eldoria.\" It's an RPG that I've been hooked on lately. Anyway, I was saying it was really fun!", + "start_time": 15.795540449132544, + "end_time": 23.4116855738491, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/temp/line_2_A.wav", + "silence_duration": 0.3426606305384391, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh yeah, that sounds pretty cool, I guess. . .", + "original_text": "Oh yeah, that sounds pretty cool, I guess. . .", + "start_time": 23.77177198307535, + "end_time": 25.849957924118435, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/temp/line_3_B.wav", + "silence_duration": 0.36008640922625257, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, I'm really into video games. In fact, all my friends are on the Internet. I've never met any of them in the real", + "original_text": "Yeah, I'm really into video games. In fact, all my friends are on the Internet. I've never met any of them in the real [interrupt] world, but we've known each other for years through gaming and have developed deep friendships despite the physical distance between us.", + "start_time": 26.37248855629073, + "end_time": 41.32613934994153, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/temp/line_4_A.wav", + "silence_duration": 0.5225306321722955, + "is_interrupted": true, + "text_after_interrupt": "world, but we've known each other for years through gaming and have developed deep friendships despite the physical distance between us." + }, + { + "speaker": "B", + "text": "Wait, you've never met any of them? How do you manage to maintain those friendships without ever meeting in person?", + "original_text": "Wait, you've never met any of them? How do you manage to maintain those friendships without ever meeting in person?", + "start_time": 40.16346427674719, + "end_time": 46.293532303958074, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/temp/line_5_B.wav", + "silence_duration": 0.4343222639011635, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's surprisingly easy! We chat a lot and play games together, which helps build a strong connection. But I was going to say, I've never met them in the real world, but we're planning to have a meetup soon.", + "original_text": "It's surprisingly easy! We chat a lot and play games together, which helps build a strong connection. But I was going to say, I've never met them in the real world, but we're planning to have a meetup soon.", + "start_time": 46.79989320040499, + "end_time": 59.12968911877233, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--261/temp/line_6_A.wav", + "silence_duration": 0.5063608964469108, + "is_interrupted": false + } + ] + }, + "DialogSum--val--262": { + "original_text": "A: The summers are so great here! Not hot at all. I love the cooling breezes, the clear air, all the green [interrupt] and the way the landscape just feels so peaceful with its rolling hills and vibrant wildflowers that seem to stretch endlessly towards the horizon.\n\nB: Sorry to cut in, but I just realized—are we in any kind of rush today? I mean, do we have plans later that we need to stick to?\n\nA: No, not really. I had thought we'd stay in Hamburg tonight, but we can't unless we rush it. Let's stay in Bremen instead. Tomorrow we can have lunch in Hamburg, then check into a hostel in Copenhagen and have dinner there.\n\nB: Sounds fine to me. Whatever, let's enjoy this pond first. You were saying something about the greenery?\n\nA: Oh, right! I was just saying how much I love the greenery here. We can walk around to that path that leads into the woods there. Hey, look! There are some wild ducks over there in the reeds.\n\nB: I see them! Wow! How do you know they're wild?\n\nA: I used to go hunting with my uncle, that's how. He taught me how to spot them by their distinctive markings and the way they move differently from domesticated ducks.", + "cleaned_text": "A:The summers are so great here! Not hot at all. I love the cooling breezes, the clear air, all the green and the way the landscape just feels so peaceful with its rolling hills and vibrant wildflowers that seem to stretch endlessly towards the horizon.\n\nB: Sorry to cut in, but I just realized—are we in any kind of rush today? I mean, do we have plans later that we need to stick to?\n\nA: No, not really. I had thought we'd stay in Hamburg tonight, but we can't unless we rush it. Let's stay in Bremen instead. Tomorrow we can have lunch in Hamburg, then check into a hostel in Copenhagen and have dinner there.\n\nB: Sounds fine to me. Whatever, let's enjoy this pond first. You were saying something about the greenery?\n\nA: Oh, right! I was just saying how much I love the greenery here. We can walk around to that path that leads into the woods there. Hey, look! There are some wild ducks over there in the reeds.\n\nB: I see them! Wow! How do you know they're wild?\n\nA: I used to go hunting with my uncle, that's how. He taught me how to spot them by their distinctive markings and the way they move differently from domesticated ducks.", + "total_duration": 59.819818594104305, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The summers are so great here! Not hot at all. I love the cooling breezes, the clear air, all the green", + "original_text": "The summers are so great here! Not hot at all. I love the cooling breezes, the clear air, all the green [interrupt] and the way the landscape just feels so peaceful with its rolling hills and vibrant wildflowers that seem to stretch endlessly towards the horizon.", + "start_time": 0, + "end_time": 14.97687074829932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "and the way the landscape just feels so peaceful with its rolling hills and vibrant wildflowers that seem to stretch endlessly towards the horizon." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but I just realized—are we in any kind of rush today? I mean, do we have plans later that we need to stick to?", + "original_text": "Sorry to cut in, but I just realized—are we in any kind of rush today? I mean, do we have plans later that we need to stick to?", + "start_time": 6.675736961451247, + "end_time": 14.315102040816328, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/temp/line_1_B.wav", + "silence_duration": 0.3201447363397254, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, not really. I had thought we'd stay in Hamburg tonight, but we can't unless we rush it. Let's stay in Bremen instead. Tomorrow we can have lunch in Hamburg, then check into a hostel in Copenhagen and have dinner there.", + "original_text": "No, not really. I had thought we'd stay in Hamburg tonight, but we can't unless we rush it. Let's stay in Bremen instead. Tomorrow we can have lunch in Hamburg, then check into a hostel in Copenhagen and have dinner there.", + "start_time": 15.33429764592593, + "end_time": 28.592891750234323, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/temp/line_2_A.wav", + "silence_duration": 0.3574268976266119, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sounds fine to me. Whatever, let's enjoy this pond first. You were saying something about the greenery?", + "original_text": "Sounds fine to me. Whatever, let's enjoy this pond first. You were saying something about the greenery?", + "start_time": 29.130725523035263, + "end_time": 35.086643890382206, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/temp/line_3_B.wav", + "silence_duration": 0.5378337728009422, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right! I was just saying how much I love the greenery here. We can walk around to that path that leads into the woods there. Hey, look! There are some wild ducks over there in the reeds.", + "original_text": "Oh, right! I was just saying how much I love the greenery here. We can walk around to that path that leads into the woods there. Hey, look! There are some wild ducks over there in the reeds.", + "start_time": 35.63346364637863, + "end_time": 46.66294210442852, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/temp/line_4_A.wav", + "silence_duration": 0.5468197559964207, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see them! Wow! How do you know they're wild?", + "original_text": "I see them! Wow! How do you know they're wild?", + "start_time": 46.96524556493872, + "end_time": 50.0186696012199, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/temp/line_5_B.wav", + "silence_duration": 0.3023034605102032, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I used to go hunting with my uncle, that's how. He taught me how to spot them by their distinctive markings and the way they move differently from domesticated ducks.", + "original_text": "I used to go hunting with my uncle, that's how. He taught me how to spot them by their distinctive markings and the way they move differently from domesticated ducks.", + "start_time": 50.58991517123529, + "end_time": 59.81984714402441, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--262/temp/line_6_A.wav", + "silence_duration": 0.5712455700153924, + "is_interrupted": false + } + ] + }, + "DialogSum--val--264": { + "original_text": "A: You look tired. \nB: Yeah, I've been working so much overtime lately. \nA: Really? How come? \nB: My boss gave me a big project. I had to have it finished by this morning. It was so [interrupt] stressful, and I barely had any time to relax because the project involved coordinating with multiple departments and meeting extremely tight deadlines that kept changing at the last minute. \nA: Wait, did you manage to finish it on time? \nB: Yes, I did, but it was so difficult. I had to stay up all night. \nA: You shouldn't work so hard. \nB: I know, but hard work pays off. You [interrupt] know how much I've been wanting that promotion, so I felt I needed to go the extra mile and prove my dedication to the company by delivering exceptional results under pressure. \nA: Sorry, but do you think it's worth it if it affects your health? \nB: I get your point, but I was hoping maybe now I'll get that promotion I was talking about.", + "cleaned_text": "A: You look tired. \nB: Yeah, I've been working so much overtime lately. \nA: Really? How come? \nB:My boss gave me a big project. I had to have it finished by this morning. It was so stressful, and I barely had any time to relax because the project involved coordinating with multiple departments and meeting extremely tight deadlines that kept changing at the last minute.\nA: Wait, did you manage to finish it on time? \nB: Yes, I did, but it was so difficult. I had to stay up all night. \nA: You shouldn't work so hard. \nB:I know, but hard work pays off. You know how much I've been wanting that promotion, so I felt I needed to go the extra mile and prove my dedication to the company by delivering exceptional results under pressure.\nA: Sorry, but do you think it's worth it if it affects your health? \nB: I get your point, but I was hoping maybe now I'll get that promotion I was talking about.", + "total_duration": 42.48707482993197, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You look tired.", + "original_text": "You look tired.", + "start_time": 0, + "end_time": 1.1145578231292517, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I've been working so much overtime lately.", + "original_text": "Yeah, I've been working so much overtime lately.", + "start_time": 1.680755728582348, + "end_time": 4.5135901957025295, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_1_B.wav", + "silence_duration": 0.5661979054530963, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Really? How come?", + "original_text": "Really? How come?", + "start_time": 4.996629859541089, + "end_time": 6.215677478588709, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_2_A.wav", + "silence_duration": 0.48303966383856034, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My boss gave me a big project. I had to have it finished by this morning. It was so", + "original_text": "My boss gave me a big project. I had to have it finished by this morning. It was so [interrupt] stressful, and I barely had any time to relax because the project involved coordinating with multiple departments and meeting extremely tight deadlines that kept changing at the last minute.", + "start_time": 6.70687945692814, + "end_time": 21.080031384365782, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_3_B.wav", + "silence_duration": 0.49120197833943124, + "is_interrupted": true, + "text_after_interrupt": "stressful, and I barely had any time to relax because the project involved coordinating with multiple departments and meeting extremely tight deadlines that kept changing at the last minute." + }, + { + "speaker": "A", + "text": "Wait, did you manage to finish it on time?", + "original_text": "Wait, did you manage to finish it on time?", + "start_time": 11.664339774388457, + "end_time": 14.543614150805691, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_4_A.wav", + "silence_duration": 0.577426143829526, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I did, but it was so difficult. I had to stay up all night.", + "original_text": "Yes, I did, but it was so difficult. I had to stay up all night.", + "start_time": 21.521086044313797, + "end_time": 25.178228901456656, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_5_B.wav", + "silence_duration": 0.44105465994801696, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You shouldn't work so hard.", + "original_text": "You shouldn't work so hard.", + "start_time": 25.62220006804717, + "end_time": 27.212766961471207, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_6_A.wav", + "silence_duration": 0.44397116659051533, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know, but hard work pays off. You", + "original_text": "I know, but hard work pays off. You [interrupt] know how much I've been wanting that promotion, so I felt I needed to go the extra mile and prove my dedication to the company by delivering exceptional results under pressure.", + "start_time": 27.765914873824183, + "end_time": 38.0639647604455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_7_B.wav", + "silence_duration": 0.5531479123529768, + "is_interrupted": true, + "text_after_interrupt": "know how much I've been wanting that promotion, so I felt I needed to go the extra mile and prove my dedication to the company by delivering exceptional results under pressure." + }, + { + "speaker": "A", + "text": "Sorry, but do you think it's worth it if it affects your health?", + "original_text": "Sorry, but do you think it's worth it if it affects your health?", + "start_time": 33.04749140889509, + "end_time": 36.70463426603795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_8_A.wav", + "silence_duration": 0.31097847029443887, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I get your point, but I was hoping maybe now I'll get that promotion I was talking about.", + "original_text": "I get your point, but I was hoping maybe now I'll get that promotion I was talking about.", + "start_time": 38.59774604617227, + "end_time": 42.48708844980039, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--264/temp/line_9_B.wav", + "silence_duration": 0.5337812857267646, + "is_interrupted": false + } + ] + }, + "DialogSum--val--265": { + "original_text": "A: What do you like to do in your spare time? \nB: I am a girl of many interests. I like dance, chess, collecting stamps, travelling and [interrupt] exploring new cuisines whenever I get the chance, especially trying out authentic local dishes from different cultures and learning about their culinary traditions. \nA: Sorry to jump in, but I'm really curious—what kind of places do you like to travel to? \nB: I enjoy traveling to historical sites and natural landscapes. But I haven't mentioned my love for taking photos yet—it's actually a big part of why I enjoy traveling so much. \nA: That makes sense, capturing memories is always special. By the way, you mentioned you like chess. I'm not really into Chinese chess; it's too difficult for me. \nB: You can learn Chinese checkers or military chess. Both of them are much easier. \nA: OK, I will try. As for stamp collecting, don't you think it is an expensive hobby? \nB: Yes, it is. But it is full of fun and knowledge. What about you, what do you like to do as a hobby? \nA: I like gardening. I take care of the plants every day. I like those flowers and the swing in my garden. If the weather is nice, I would like to [interrupt] spend the entire afternoon outside, just soaking in the sun and listening to the birds chirping while surrounded by the beautiful colors and fragrances of my garden. \nB: Oh, gardening sounds so calming. Do you grow any vegetables, or is it mostly flowers? \nA: Mostly flowers, but I do have a small section for herbs. I was actually going to say that I like to lie on the lawn when the weather is nice. \nB: That sounds really peaceful.", + "cleaned_text": "A: What do you like to do in your spare time? \nB:I am a girl of many interests. I like dance, chess, collecting stamps, travelling and exploring new cuisines whenever I get the chance, especially trying out authentic local dishes from different cultures and learning about their culinary traditions.\nA: Sorry to jump in, but I'm really curious—what kind of places do you like to travel to? \nB: I enjoy traveling to historical sites and natural landscapes. But I haven't mentioned my love for taking photos yet—it's actually a big part of why I enjoy traveling so much. \nA: That makes sense, capturing memories is always special. By the way, you mentioned you like chess. I'm not really into Chinese chess; it's too difficult for me. \nB: You can learn Chinese checkers or military chess. Both of them are much easier. \nA: OK, I will try. As for stamp collecting, don't you think it is an expensive hobby? \nB: Yes, it is. But it is full of fun and knowledge. What about you, what do you like to do as a hobby? \nA:I like gardening. I take care of the plants every day. I like those flowers and the swing in my garden. If the weather is nice, I would like to spend the entire afternoon outside, just soaking in the sun and listening to the birds chirping while surrounded by the beautiful colors and fragrances of my garden.\nB: Oh, gardening sounds so calming. Do you grow any vegetables, or is it mostly flowers? \nA: Mostly flowers, but I do have a small section for herbs. I was actually going to say that I like to lie on the lawn when the weather is nice. \nB: That sounds really peaceful.", + "total_duration": 83.3061224489796, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What do you like to do in your spare time?", + "original_text": "What do you like to do in your spare time?", + "start_time": 0, + "end_time": 2.1942857142857144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I am a girl of many interests. I like dance, chess, collecting stamps, travelling and", + "original_text": "I am a girl of many interests. I like dance, chess, collecting stamps, travelling and [interrupt] exploring new cuisines whenever I get the chance, especially trying out authentic local dishes from different cultures and learning about their culinary traditions.", + "start_time": 2.5683196110540027, + "end_time": 15.246414849149241, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_1_B.wav", + "silence_duration": 0.3740338967682883, + "is_interrupted": true, + "text_after_interrupt": "exploring new cuisines whenever I get the chance, especially trying out authentic local dishes from different cultures and learning about their culinary traditions." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I'm really curious—what kind of places do you like to travel to?", + "original_text": "Sorry to jump in, but I'm really curious—what kind of places do you like to travel to?", + "start_time": 9.104736844614093, + "end_time": 14.723965869557404, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_2_A.wav", + "silence_duration": 0.4150742969236525, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I enjoy traveling to historical sites and natural landscapes. But I haven't mentioned my love for taking photos yet—it's actually a big part of why I enjoy traveling so much.", + "original_text": "I enjoy traveling to historical sites and natural landscapes. But I haven't mentioned my love for taking photos yet—it's actually a big part of why I enjoy traveling so much.", + "start_time": 15.54835916775961, + "end_time": 24.662191367306093, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_3_B.wav", + "silence_duration": 0.30194431861036825, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That makes sense, capturing memories is always special. By the way, you mentioned you like chess. I'm not really into Chinese chess; it's too difficult for me.", + "original_text": "That makes sense, capturing memories is always special. By the way, you mentioned you like chess. I'm not really into Chinese chess; it's too difficult for me.", + "start_time": 24.989787635739557, + "end_time": 35.10207788517266, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_4_A.wav", + "silence_duration": 0.3275962684334636, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You can learn Chinese checkers or military chess. Both of them are much easier.", + "original_text": "You can learn Chinese checkers or military chess. Both of them are much easier.", + "start_time": 35.69659114877187, + "end_time": 40.2128723279102, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_5_B.wav", + "silence_duration": 0.5945132635992145, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, I will try. As for stamp collecting, don't you think it is an expensive hobby?", + "original_text": "OK, I will try. As for stamp collecting, don't you think it is an expensive hobby?", + "start_time": 40.812373657340046, + "end_time": 46.768292024686986, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_6_A.wav", + "silence_duration": 0.5995013294298512, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it is. But it is full of fun and knowledge. What about you, what do you like to do as a hobby?", + "original_text": "Yes, it is. But it is full of fun and knowledge. What about you, what do you like to do as a hobby?", + "start_time": 47.3388541682741, + "end_time": 52.83037344265052, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_7_B.wav", + "silence_duration": 0.5705621435871211, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I like gardening. I take care of the plants every day. I like those flowers and the swing in my garden. If the weather is nice, I would like to", + "original_text": "I like gardening. I take care of the plants every day. I like those flowers and the swing in my garden. If the weather is nice, I would like to [interrupt] spend the entire afternoon outside, just soaking in the sun and listening to the birds chirping while surrounded by the beautiful colors and fragrances of my garden.", + "start_time": 53.418563203375946, + "end_time": 71.58817771584759, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_8_A.wav", + "silence_duration": 0.5881897607254294, + "is_interrupted": true, + "text_after_interrupt": "spend the entire afternoon outside, just soaking in the sun and listening to the birds chirping while surrounded by the beautiful colors and fragrances of my garden." + }, + { + "speaker": "B", + "text": "Oh, gardening sounds so calming. Do you grow any vegetables, or is it mostly flowers?", + "original_text": "Oh, gardening sounds so calming. Do you grow any vegetables, or is it mostly flowers?", + "start_time": 67.76587876333387, + "end_time": 72.1544501919053, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_9_B.wav", + "silence_duration": 0.49159452470767623, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Mostly flowers, but I do have a small section for herbs. I was actually going to say that I like to lie on the lawn when the weather is nice.", + "original_text": "Mostly flowers, but I do have a small section for herbs. I was actually going to say that I like to lie on the lawn when the weather is nice.", + "start_time": 72.45892403895895, + "end_time": 81.46826644258707, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_10_A.wav", + "silence_duration": 0.3044738470536628, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds really peaceful.", + "original_text": "That sounds really peaceful.", + "start_time": 81.9129414282009, + "end_time": 83.30613870711245, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--265/temp/line_11_B.wav", + "silence_duration": 0.44467498561382623, + "is_interrupted": false + } + ] + }, + "DialogSum--val--266": { + "original_text": "A: Have a nice weekend! \nB: Thanks. You too! Do you have any [interrupt] plans for the weekend? I was thinking maybe we could meet up for coffee if you're free on Saturday afternoon. \nA: Sorry to jump in, but I was just wondering if you've made any plans for the weekend? \nB: Well, my family's away and I can't afford to do much. What about [interrupt] you? Do you have anything exciting planned like visiting that new museum exhibition or trying out the Italian restaurant downtown? \nA: Actually, I was thinking of catching up on some reading, but I was curious—did you mention if you had any specific activities in mind since your family's away?", + "cleaned_text": "A: Have a nice weekend! \nB:Thanks. You too! Do you have any plans for the weekend? I was thinking maybe we could meet up for coffee if you're free on Saturday afternoon.\nA: Sorry to jump in, but I was just wondering if you've made any plans for the weekend? \nB:Well, my family's away and I can't afford to do much. What about you? Do you have anything exciting planned like visiting that new museum exhibition or trying out the Italian restaurant downtown?\nA: Actually, I was thinking of catching up on some reading, but I was curious—did you mention if you had any specific activities in mind since your family's away?", + "total_duration": 27.661269841269842, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have a nice weekend!", + "original_text": "Have a nice weekend!", + "start_time": 0, + "end_time": 1.3931972789115645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks. You too! Do you have any", + "original_text": "Thanks. You too! Do you have any [interrupt] plans for the weekend? I was thinking maybe we could meet up for coffee if you're free on Saturday afternoon.", + "start_time": 1.7630187898295517, + "end_time": 8.856714934954269, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/temp/line_1_B.wav", + "silence_duration": 0.3698215109179871, + "is_interrupted": true, + "text_after_interrupt": "plans for the weekend? I was thinking maybe we could meet up for coffee if you're free on Saturday afternoon." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I was just wondering if you've made any plans for the weekend?", + "original_text": "Sorry to jump in, but I was just wondering if you've made any plans for the weekend?", + "start_time": 3.6786650483329533, + "end_time": 8.531635569874904, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/temp/line_2_A.wav", + "silence_duration": 0.4117242663662918, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, my family's away and I can't afford to do much. What about", + "original_text": "Well, my family's away and I can't afford to do much. What about [interrupt] you? Do you have anything exciting planned like visiting that new museum exhibition or trying out the Italian restaurant downtown?", + "start_time": 9.419081098878626, + "end_time": 19.450101507041893, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/temp/line_3_B.wav", + "silence_duration": 0.5623661639243582, + "is_interrupted": true, + "text_after_interrupt": "you? Do you have anything exciting planned like visiting that new museum exhibition or trying out the Italian restaurant downtown?" + }, + { + "speaker": "A", + "text": "Actually, I was thinking of catching up on some reading, but I was curious—did you mention if you had any specific activities in mind since your family's away?", + "original_text": "Actually, I was thinking of catching up on some reading, but I was curious—did you mention if you had any specific activities in mind since your family's away?", + "start_time": 18.57070185075677, + "end_time": 27.66131409565473, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--266/temp/line_4_A.wav", + "silence_duration": 0.35124003287200695, + "is_interrupted": false + } + ] + }, + "DialogSum--val--267": { + "original_text": "A: Which of the two do you think is better? I mean, what's the difference between [interrupt] the sound quality and overall build of the two options? I've been trying to decide for days but can't quite figure out which would suit my needs better. \nB: Sorry to jump in, but are you planning to use it in a specific room? That might help me give you a better recommendation. \nA: I only want it for the kitchen. I like to listen to the news at breakfast time. \nB: Got it. Well, this one costs more, but it has a much better sound. This part of it is made of wood, not plastic. And there's a tone control, too. \nA: Hmm. . . well, the other one is good for the money. It's much cheaper. We sell a lot of them and all our customers are satisfied with them. \nB: Hmm. . . I'd like the cheaper one, please. Can I pay by [interrupt] cash, or do you only accept cards? I'd prefer to use cash if possible since I have exact change ready. \nA: Oh, before you pay, did you want to hear more about the tone control on the other one, or are you sure about your choice? \nB: No, I'm sure. I'll take the cheaper one. Can I pay by cheque? \nA: Certainly.", + "cleaned_text": "A:Which of the two do you think is better? I mean, what's the difference between the sound quality and overall build of the two options? I've been trying to decide for days but can't quite figure out which would suit my needs better.\nB: Sorry to jump in, but are you planning to use it in a specific room? That might help me give you a better recommendation. \nA: I only want it for the kitchen. I like to listen to the news at breakfast time. \nB: Got it. Well, this one costs more, but it has a much better sound. This part of it is made of wood, not plastic. And there's a tone control, too. \nA: Hmm. . . well, the other one is good for the money. It's much cheaper. We sell a lot of them and all our customers are satisfied with them. \nB:Hmm. . . I'd like the cheaper one, please. Can I pay by cash, or do you only accept cards? I'd prefer to use cash if possible since I have exact change ready.\nA: Oh, before you pay, did you want to hear more about the tone control on the other one, or are you sure about your choice? \nB: No, I'm sure. I'll take the cheaper one. Can I pay by cheque? \nA: Certainly.", + "total_duration": 58.559002267573696, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Which of the two do you think is better? I mean, what's the difference between", + "original_text": "Which of the two do you think is better? I mean, what's the difference between [interrupt] the sound quality and overall build of the two options? I've been trying to decide for days but can't quite figure out which would suit my needs better.", + "start_time": 0, + "end_time": 13.432743764172336, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "the sound quality and overall build of the two options? I've been trying to decide for days but can't quite figure out which would suit my needs better." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but are you planning to use it in a specific room? That might help me give you a better recommendation.", + "original_text": "Sorry to jump in, but are you planning to use it in a specific room? That might help me give you a better recommendation.", + "start_time": 4.574331065759637, + "end_time": 10.565079365079365, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_1_B.wav", + "silence_duration": 0.5932587070128208, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I only want it for the kitchen. I like to listen to the news at breakfast time.", + "original_text": "I only want it for the kitchen. I like to listen to the news at breakfast time.", + "start_time": 13.900382183763222, + "end_time": 18.451493294874332, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_2_A.wav", + "silence_duration": 0.46763841959088503, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. Well, this one costs more, but it has a much better sound. This part of it is made of wood, not plastic. And there's a tone control, too.", + "original_text": "Got it. Well, this one costs more, but it has a much better sound. This part of it is made of wood, not plastic. And there's a tone control, too.", + "start_time": 18.908289048944876, + "end_time": 27.13976297184737, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_3_B.wav", + "silence_duration": 0.4567957540705452, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hmm. . . well, the other one is good for the money. It's much cheaper. We sell a lot of them and all our customers are satisfied with them.", + "original_text": "Hmm. . . well, the other one is good for the money. It's much cheaper. We sell a lot of them and all our customers are satisfied with them.", + "start_time": 27.501299291946726, + "end_time": 35.75599316949774, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_4_A.wav", + "silence_duration": 0.3615363200993525, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hmm. . . I'd like the cheaper one, please. Can I pay by", + "original_text": "Hmm. . . I'd like the cheaper one, please. Can I pay by [interrupt] cash, or do you only accept cards? I'd prefer to use cash if possible since I have exact change ready.", + "start_time": 36.16990186462474, + "end_time": 45.20246422290138, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_5_B.wav", + "silence_duration": 0.41390869512699846, + "is_interrupted": true, + "text_after_interrupt": "cash, or do you only accept cards? I'd prefer to use cash if possible since I have exact change ready." + }, + { + "speaker": "A", + "text": "Oh, before you pay, did you want to hear more about the tone control on the other one, or are you sure about your choice?", + "original_text": "Oh, before you pay, did you want to hear more about the tone control on the other one, or are you sure about your choice?", + "start_time": 46.7510400623799, + "end_time": 53.48482691045246, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_6_A.wav", + "silence_duration": 0.36615047718178634, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, I'm sure. I'll take the cheaper one. Can I pay by cheque?", + "original_text": "No, I'm sure. I'll take the cheaper one. Can I pay by cheque?", + "start_time": 53.9810430950903, + "end_time": 57.278276655181, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_7_B.wav", + "silence_duration": 0.4962161846378406, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Certainly.", + "original_text": "Certainly.", + "start_time": 57.80437629897338, + "end_time": 58.55902482505048, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--267/temp/line_8_A.wav", + "silence_duration": 0.5260996437923757, + "is_interrupted": false + } + ] + }, + "DialogSum--val--268": { + "original_text": "A: Come here! I can see the tall camphor trees from [interrupt] here, and they look even more majestic in the sunlight with their sprawling branches casting intricate shadows on the ground below us.\nB: Sorry to interrupt, but I think I also spotted some yew trees over there. Do you see them?\nA: Yes, we can also see some yew trees. This is a great botanical garden in the city. Listen to the sound of nature! It's like music.\nB: Yeah, I agree. It makes you feel really good. By the way, what are those red flowers over there? Miss Liu?\nA: Oh, do you mean the red flowers? They are peony flowers. The red and yellow peony flowers are so beautiful.\nB: Yes, they are! You like them very much, right?\nA: Sure. I'm going to take more pictures today. Oh, and I was going to ask if you wanted me to help you with it? You might find it easier to capture the perfect angle with a little assistance while I hold the branches aside for better framing.\nB: That would be great. You are so kind. Thanks.", + "cleaned_text": "A:Come here! I can see the tall camphor trees from here, and they look even more majestic in the sunlight with their sprawling branches casting intricate shadows on the ground below us.\nB: Sorry to interrupt, but I think I also spotted some yew trees over there. Do you see them?\nA: Yes, we can also see some yew trees. This is a great botanical garden in the city. Listen to the sound of nature! It's like music.\nB: Yeah, I agree. It makes you feel really good. By the way, what are those red flowers over there? Miss Liu?\nA: Oh, do you mean the red flowers? They are peony flowers. The red and yellow peony flowers are so beautiful.\nB: Yes, they are! You like them very much, right?\nA: Sure. I'm going to take more pictures today. Oh, and I was going to ask if you wanted me to help you with it? You might find it easier to capture the perfect angle with a little assistance while I hold the branches aside for better framing.\nB: That would be great. You are so kind. Thanks.", + "total_duration": 52.79047619047619, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Come here! I can see the tall camphor trees from", + "original_text": "Come here! I can see the tall camphor trees from [interrupt] here, and they look even more majestic in the sunlight with their sprawling branches casting intricate shadows on the ground below us.", + "start_time": 0, + "end_time": 9.97297052154195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "here, and they look even more majestic in the sunlight with their sprawling branches casting intricate shadows on the ground below us." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I think I also spotted some yew trees over there. Do you see them?", + "original_text": "Sorry to interrupt, but I think I also spotted some yew trees over there. Do you see them?", + "start_time": 3.378503401360544, + "end_time": 7.534875283446712, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_1_B.wav", + "silence_duration": 0.48022240191175025, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, we can also see some yew trees. This is a great botanical garden in the city. Listen to the sound of nature! It's like music.", + "original_text": "Yes, we can also see some yew trees. This is a great botanical garden in the city. Listen to the sound of nature! It's like music.", + "start_time": 10.389258246622237, + "end_time": 19.108351217143777, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_2_A.wav", + "silence_duration": 0.41628772508028844, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I agree. It makes you feel really good. By the way, what are those red flowers over there? Miss Liu?", + "original_text": "Yeah, I agree. It makes you feel really good. By the way, what are those red flowers over there? Miss Liu?", + "start_time": 19.69941392097982, + "end_time": 25.24898308197755, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_3_B.wav", + "silence_duration": 0.5910627038360408, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, do you mean the red flowers? They are peony flowers. The red and yellow peony flowers are so beautiful.", + "original_text": "Oh, do you mean the red flowers? They are peony flowers. The red and yellow peony flowers are so beautiful.", + "start_time": 25.667399415354208, + "end_time": 32.795925492451715, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_4_A.wav", + "silence_duration": 0.4184163333766589, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, they are! You like them very much, right?", + "original_text": "Yes, they are! You like them very much, right?", + "start_time": 33.32363277348165, + "end_time": 36.29578696849298, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_5_B.wav", + "silence_duration": 0.5277072810299299, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure. I'm going to take more pictures today. Oh, and I was going to ask if you wanted me to help you with it? You might find it easier to capture the perfect angle with a little assistance while I hold the branches aside for better framing.", + "original_text": "Sure. I'm going to take more pictures today. Oh, and I was going to ask if you wanted me to help you with it? You might find it easier to capture the perfect angle with a little assistance while I hold the branches aside for better framing.", + "start_time": 36.72379240779198, + "end_time": 50.121706239991525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_6_A.wav", + "silence_duration": 0.4280054392990029, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That would be great. You are so kind. Thanks.", + "original_text": "That would be great. You are so kind. Thanks.", + "start_time": 50.43367288416766, + "end_time": 52.79049828099306, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--268/temp/line_7_B.wav", + "silence_duration": 0.31196664417613496, + "is_interrupted": false + } + ] + }, + "DialogSum--val--269": { + "original_text": "A: Well, that's all for the interview. Thank you for your interest in this job. \nB: You are welcome. Thank you for taking time out of your busy schedule to interview me. May I [interrupt] ask when I might expect to hear back from you regarding the final decision and whether there will be any additional steps in the hiring process after this initial interview? \nA: Sorry to cut in, but before I forget, could you confirm the best time of day to reach you? \nB: Oh, sure! My telephone number is 2974-5328, and you can call me at any time in the daytime. And you were asking if you could call me about the final decision, right? \nA: Yes, exactly. We will get in touch with you by the end of next week. \nB: Great. I will look forward to hearing from you. And do I need the contact details of someone in case I have further questions? \nA: Sorry, just to clarify, if a second interview is needed, we'll definitely notify you. \nB: Understood. Goodbye. \nA: Goodbye.", + "cleaned_text": "A: Well, that's all for the interview. Thank you for your interest in this job. \nB:You are welcome. Thank you for taking time out of your busy schedule to interview me. May I ask when I might expect to hear back from you regarding the final decision and whether there will be any additional steps in the hiring process after this initial interview?\nA: Sorry to cut in, but before I forget, could you confirm the best time of day to reach you? \nB: Oh, sure! My telephone number is 2974-5328, and you can call me at any time in the daytime. And you were asking if you could call me about the final decision, right? \nA: Yes, exactly. We will get in touch with you by the end of next week. \nB: Great. I will look forward to hearing from you. And do I need the contact details of someone in case I have further questions? \nA: Sorry, just to clarify, if a second interview is needed, we'll definitely notify you. \nB: Understood. Goodbye. \nA: Goodbye.", + "total_duration": 50.806666666666665, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, that's all for the interview. Thank you for your interest in this job.", + "original_text": "Well, that's all for the interview. Thank you for your interest in this job.", + "start_time": 0, + "end_time": 4.435011337868481, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You are welcome. Thank you for taking time out of your busy schedule to interview me. May I", + "original_text": "You are welcome. Thank you for taking time out of your busy schedule to interview me. May I [interrupt] ask when I might expect to hear back from you regarding the final decision and whether there will be any additional steps in the hiring process after this initial interview?", + "start_time": 4.84189781862917, + "end_time": 17.392283306157516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_1_B.wav", + "silence_duration": 0.40688648076068884, + "is_interrupted": true, + "text_after_interrupt": "ask when I might expect to hear back from you regarding the final decision and whether there will be any additional steps in the hiring process after this initial interview?" + }, + { + "speaker": "A", + "text": "Sorry to cut in, but before I forget, could you confirm the best time of day to reach you?", + "original_text": "Sorry to cut in, but before I forget, could you confirm the best time of day to reach you?", + "start_time": 9.358178997767492, + "end_time": 15.453417093005587, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_2_A.wav", + "silence_duration": 0.4255798273256468, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, sure! My telephone number is 2974-5328, and you can call me at any time in the daytime. And you were asking if you could call me about the final decision, right?", + "original_text": "Oh, sure! My telephone number is 2974-5328, and you can call me at any time in the daytime. And you were asking if you could call me about the final decision, right?", + "start_time": 17.860975208090874, + "end_time": 29.494172487002437, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_3_B.wav", + "silence_duration": 0.46869190193335686, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, exactly. We will get in touch with you by the end of next week.", + "original_text": "Yes, exactly. We will get in touch with you by the end of next week.", + "start_time": 30.00637954834609, + "end_time": 34.38334099959326, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_4_A.wav", + "silence_duration": 0.5122070613436507, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Great. I will look forward to hearing from you. And do I need the contact details of someone in case I have further questions?", + "original_text": "Great. I will look forward to hearing from you. And do I need the contact details of someone in case I have further questions?", + "start_time": 34.78207372929488, + "end_time": 41.77128007850123, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_5_B.wav", + "silence_duration": 0.39873272970162155, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, just to clarify, if a second interview is needed, we'll definitely notify you.", + "original_text": "Sorry, just to clarify, if a second interview is needed, we'll definitely notify you.", + "start_time": 42.11071372991772, + "end_time": 47.79960261880661, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_6_A.wav", + "silence_duration": 0.3394336514164906, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Understood. Goodbye.", + "original_text": "Understood. Goodbye.", + "start_time": 48.25118308999475, + "end_time": 49.388960867772525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_7_B.wav", + "silence_duration": 0.4515804711881366, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Goodbye.", + "original_text": "Goodbye.", + "start_time": 49.970771234341846, + "end_time": 50.80668960168879, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--269/temp/line_8_A.wav", + "silence_duration": 0.5818103665693187, + "is_interrupted": false + } + ] + }, + "DialogSum--val--270": { + "original_text": "A: Hello, John, please invite all our clients to the conference next week. I'd like you to [interrupt] personally reach out to each of them with a customized invitation that highlights the key benefits of attending this particular event.\nB: How should I get their contact info— Should I use the company's CRM system, or do you have another source in mind?\nA: Get the clients' contact info from my Rolodex. It has the most up-to-date information including their preferred method of communication.\nB: Got it. Where should I put them up?\nA: How about the Holiday Inn? They're offering us a corporate discount for block bookings during this period.\nB: The clients like the Shangri-La Hotel more. They've mentioned several times how much they appreciate the luxury amenities and central location.\nA: Well, the client is always right. What else would I— Do you need any help with the logistics? I can assist with transportation arrangements if that would be helpful.\nB: Oh, and should I confirm their attendance once I send out the invitations?\nA: Yes, definitely confirm their attendance. Also, I was going to say, please print out the meeting agenda for me to look over so we can make any necessary adjustments before finalizing it.\nB: Certainly. I'll have that ready for you by end of day.\nA: And make sure to return my Rolodex to my desk when you are done with it. It contains some sensitive information that needs to remain confidential.\nB: Of course. I'm on it. I'll handle everything with the utmost care and professionalism.", + "cleaned_text": "A:Hello, John, please invite all our clients to the conference next week. I'd like you to personally reach out to each of them with a customized invitation that highlights the key benefits of attending this particular event.\nB: How should I get their contact info— Should I use the company's CRM system, or do you have another source in mind?\nA: Get the clients' contact info from my Rolodex. It has the most up-to-date information including their preferred method of communication.\nB: Got it. Where should I put them up?\nA: How about the Holiday Inn? They're offering us a corporate discount for block bookings during this period.\nB: The clients like the Shangri-La Hotel more. They've mentioned several times how much they appreciate the luxury amenities and central location.\nA: Well, the client is always right. What else would I— Do you need any help with the logistics? I can assist with transportation arrangements if that would be helpful.\nB: Oh, and should I confirm their attendance once I send out the invitations?\nA: Yes, definitely confirm their attendance. Also, I was going to say, please print out the meeting agenda for me to look over so we can make any necessary adjustments before finalizing it.\nB: Certainly. I'll have that ready for you by end of day.\nA: And make sure to return my Rolodex to my desk when you are done with it. It contains some sensitive information that needs to remain confidential.\nB: Of course. I'm on it. I'll handle everything with the utmost care and professionalism.", + "total_duration": 83.33986394557823, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, John, please invite all our clients to the conference next week. I'd like you to", + "original_text": "Hello, John, please invite all our clients to the conference next week. I'd like you to [interrupt] personally reach out to each of them with a customized invitation that highlights the key benefits of attending this particular event.", + "start_time": 0, + "end_time": 13.40952380952381, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "personally reach out to each of them with a customized invitation that highlights the key benefits of attending this particular event." + }, + { + "speaker": "B", + "text": "How should I get their contact info— Should I use the company's CRM system, or do you have another source in mind?", + "original_text": "How should I get their contact info— Should I use the company's CRM system, or do you have another source in mind?", + "start_time": 5.12, + "end_time": 11.017868480725625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_1_B.wav", + "silence_duration": 0.4967762987746571, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Get the clients' contact info from my Rolodex. It has the most up-to-date information including their preferred method of communication.", + "original_text": "Get the clients' contact info from my Rolodex. It has the most up-to-date information including their preferred method of communication.", + "start_time": 13.840184148073869, + "end_time": 22.094878025624887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_2_A.wav", + "silence_duration": 0.4306603385500586, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. Where should I put them up?", + "original_text": "Got it. Where should I put them up?", + "start_time": 22.483348889141563, + "end_time": 23.92298607735018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_3_B.wav", + "silence_duration": 0.3884708635166755, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about the Holiday Inn? They're offering us a corporate discount for block bookings during this period.", + "original_text": "How about the Holiday Inn? They're offering us a corporate discount for block bookings during this period.", + "start_time": 24.423982329430615, + "end_time": 30.13609117296803, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_4_A.wav", + "silence_duration": 0.5009962520804333, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The clients like the Shangri-La Hotel more. They've mentioned several times how much they appreciate the luxury amenities and central location.", + "original_text": "The clients like the Shangri-La Hotel more. They've mentioned several times how much they appreciate the luxury amenities and central location.", + "start_time": 30.597715301740628, + "end_time": 38.73630940604902, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_5_B.wav", + "silence_duration": 0.4616241287725998, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, the client is always right. What else would I— Do you need any help with the logistics? I can assist with transportation arrangements if that would be helpful.", + "original_text": "Well, the client is always right. What else would I— Do you need any help with the logistics? I can assist with transportation arrangements if that would be helpful.", + "start_time": 39.276190122912034, + "end_time": 49.46975021361498, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_6_A.wav", + "silence_duration": 0.5398807168630186, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, and should I confirm their attendance once I send out the invitations?", + "original_text": "Oh, and should I confirm their attendance once I send out the invitations?", + "start_time": 49.869921353305024, + "end_time": 54.16561296328235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_7_B.wav", + "silence_duration": 0.4001711396900433, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, definitely confirm their attendance. Also, I was going to say, please print out the meeting agenda for me to look over so we can make any necessary adjustments before finalizing it.", + "original_text": "Yes, definitely confirm their attendance. Also, I was going to say, please print out the meeting agenda for me to look over so we can make any necessary adjustments before finalizing it.", + "start_time": 54.61935255424134, + "end_time": 67.21617795106674, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_8_A.wav", + "silence_duration": 0.4537395909589855, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Certainly. I'll have that ready for you by end of day.", + "original_text": "Certainly. I'll have that ready for you by end of day.", + "start_time": 67.58001992280226, + "end_time": 69.94845529695192, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_9_B.wav", + "silence_duration": 0.363841971735528, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And make sure to return my Rolodex to my desk when you are done with it. It contains some sensitive information that needs to remain confidential.", + "original_text": "And make sure to return my Rolodex to my desk when you are done with it. It contains some sensitive information that needs to remain confidential.", + "start_time": 70.39106080504443, + "end_time": 78.80829436513514, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_10_A.wav", + "silence_duration": 0.44260550809250804, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course. I'm on it. I'll handle everything with the utmost care and professionalism.", + "original_text": "Of course. I'm on it. I'll handle everything with the utmost care and professionalism.", + "start_time": 79.18353597531546, + "end_time": 83.33990785740163, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--270/temp/line_11_B.wav", + "silence_duration": 0.3752416101803298, + "is_interrupted": false + } + ] + }, + "DialogSum--val--271": { + "original_text": "A: About my driving test, did I do well? \nB: You did a fabulous job. \nA: Are you telling me that I passed the [interrupt] test with flying colors despite my nervousness? I was so anxious I could barely focus during the parallel parking portion. \nB: Sorry to cut in, but yes, you passed! I could tell you were anxious about it. \nA: That's a relief. But what did I mess up on? \nB: You did mess up a little on one thing. \nA: Tell me. \nB: You had a little trouble on your parallel parking. \nA: That's not easy for me. \nB: That's something that you really need to work on. \nA: Am I still going to get my license? \nB: Oh, absolutely. You're still going to get it.", + "cleaned_text": "A: About my driving test, did I do well? \nB: You did a fabulous job. \nA:Are you telling me that I passed the test with flying colors despite my nervousness? I was so anxious I could barely focus during the parallel parking portion.\nB: Sorry to cut in, but yes, you passed! I could tell you were anxious about it. \nA: That's a relief. But what did I mess up on? \nB: You did mess up a little on one thing. \nA: Tell me. \nB: You had a little trouble on your parallel parking. \nA: That's not easy for me. \nB: That's something that you really need to work on. \nA: Am I still going to get my license? \nB: Oh, absolutely. You're still going to get it.", + "total_duration": 33.93201814058957, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "About my driving test, did I do well?", + "original_text": "About my driving test, did I do well?", + "start_time": 0, + "end_time": 2.391655328798186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You did a fabulous job.", + "original_text": "You did a fabulous job.", + "start_time": 2.9338238092957245, + "end_time": 4.385070974828604, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_1_B.wav", + "silence_duration": 0.5421684804975384, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you telling me that I passed the", + "original_text": "Are you telling me that I passed the [interrupt] test with flying colors despite my nervousness? I was so anxious I could barely focus during the parallel parking portion.", + "start_time": 4.872716478586389, + "end_time": 14.532217612373238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_2_A.wav", + "silence_duration": 0.4876455037577845, + "is_interrupted": true, + "text_after_interrupt": "test with flying colors despite my nervousness? I was so anxious I could barely focus during the parallel parking portion." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but yes, you passed! I could tell you were anxious about it.", + "original_text": "Sorry to cut in, but yes, you passed! I could tell you were anxious about it.", + "start_time": 7.090222147520629, + "end_time": 11.40913371214648, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_3_B.wav", + "silence_duration": 0.3277465515093576, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a relief. But what did I mess up on?", + "original_text": "That's a relief. But what did I mess up on?", + "start_time": 14.938045572818563, + "end_time": 18.049519495721057, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_4_A.wav", + "silence_duration": 0.405827960445326, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You did mess up a little on one thing.", + "original_text": "You did mess up a little on one thing.", + "start_time": 18.382418989058923, + "end_time": 20.379335088832164, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_5_B.wav", + "silence_duration": 0.3328994933378669, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Tell me.", + "original_text": "Tell me.", + "start_time": 20.694195209596977, + "end_time": 21.30952400778292, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_6_A.wav", + "silence_duration": 0.3148601207648112, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You had a little trouble on your parallel parking.", + "original_text": "You had a little trouble on your parallel parking.", + "start_time": 21.642573612452807, + "end_time": 24.034228941250994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_7_B.wav", + "silence_duration": 0.3330496046698873, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's not easy for me.", + "original_text": "That's not easy for me.", + "start_time": 24.396169796733922, + "end_time": 26.009956644806483, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_8_A.wav", + "silence_duration": 0.3619408554829284, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's something that you really need to work on.", + "original_text": "That's something that you really need to work on.", + "start_time": 26.58701936058219, + "end_time": 28.53749555105838, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_9_B.wav", + "silence_duration": 0.5770627157757051, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Am I still going to get my license?", + "original_text": "Am I still going to get my license?", + "start_time": 29.00994976046969, + "end_time": 31.006865860242932, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_10_A.wav", + "silence_duration": 0.47245420941131117, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, absolutely. You're still going to get it.", + "original_text": "Oh, absolutely. You're still going to get it.", + "start_time": 31.412669539931485, + "end_time": 33.932034619296566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--271/temp/line_11_B.wav", + "silence_duration": 0.40580367968855197, + "is_interrupted": false + } + ] + }, + "DialogSum--val--272": { + "original_text": "A: How much is the admission fee for a student? \nB: We offer a reduction of 50% and it comes to $10. \nA: Here you are. Where is the museum [interrupt] located? I want to make sure we go in the right direction because we're new to this area and don't want to get lost. \nB: Sorry to interrupt, but I just wanted to clarify, do you need a receipt for the payment? \nA: No, that's okay. But I was asking about the museum guide earlier. Is it available in different languages? \nB: Oh, yes! The guide is free of charge and comes in five different languages including Spanish, French, Mandarin, German, and of course English. Would you like me to show you where to pick one up?", + "cleaned_text": "A: How much is the admission fee for a student? \nB: We offer a reduction of 50% and it comes to $10. \nA:Here you are. Where is the museum located? I want to make sure we go in the right direction because we're new to this area and don't want to get lost.\nB: Sorry to interrupt, but I just wanted to clarify, do you need a receipt for the payment? \nA: No, that's okay. But I was asking about the museum guide earlier. Is it available in different languages? \nB: Oh, yes! The guide is free of charge and comes in five different languages including Spanish, French, Mandarin, German, and of course English. Would you like me to show you where to pick one up?", + "total_duration": 32.73102040816327, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How much is the admission fee for a student?", + "original_text": "How much is the admission fee for a student?", + "start_time": 0, + "end_time": 2.391655328798186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We offer a reduction of 50% and it comes to $10.", + "original_text": "We offer a reduction of 50% and it comes to $10.", + "start_time": 2.740946006639205, + "end_time": 6.2123292265938534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/temp/line_1_B.wav", + "silence_duration": 0.3492906778410187, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Here you are. Where is the museum", + "original_text": "Here you are. Where is the museum [interrupt] located? I want to make sure we go in the right direction because we're new to this area and don't want to get lost.", + "start_time": 6.586686442578365, + "end_time": 15.642468755503536, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/temp/line_2_A.wav", + "silence_duration": 0.3743572159845115, + "is_interrupted": true, + "text_after_interrupt": "located? I want to make sure we go in the right direction because we're new to this area and don't want to get lost." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I just wanted to clarify, do you need a receipt for the payment?", + "original_text": "Sorry to interrupt, but I just wanted to clarify, do you need a receipt for the payment?", + "start_time": 8.699702315594239, + "end_time": 13.5178429051634, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/temp/line_3_B.wav", + "silence_duration": 0.5178083439287404, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, that's okay. But I was asking about the museum guide earlier. Is it available in different languages?", + "original_text": "No, that's okay. But I was asking about the museum guide earlier. Is it available in different languages?", + "start_time": 16.187803483845055, + "end_time": 22.944810286566145, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/temp/line_4_A.wav", + "silence_duration": 0.5453347283415179, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, yes! The guide is free of charge and comes in five different languages including Spanish, French, Mandarin, German, and of course English. Would you like me to show you where to pick one up?", + "original_text": "Oh, yes! The guide is free of charge and comes in five different languages including Spanish, French, Mandarin, German, and of course English. Would you like me to show you where to pick one up?", + "start_time": 23.45465622160149, + "end_time": 32.731028103687656, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--272/temp/line_5_B.wav", + "silence_duration": 0.509845935035345, + "is_interrupted": false + } + ] + }, + "DialogSum--val--273": { + "original_text": "A: Excuse me, could you tell me which bus I should take to go to the railway station?\nB: I think you'd better take the No. 16 bus. It can take you right [interrupt] to the station without needing to transfer and it's usually the fastest option during this time of day when traffic isn't too heavy.\nA: Sorry to cut in, but do you know how often that bus runs?\nB: Every fifteen minutes.\nA: I really can't wait that long. Are there any other buses that can take me there?\nB: The No. 2 bus also goes to the railway station. You may [interrupt] need to walk a bit after getting off, but it's still quite convenient since the stop is just across the street from the station's main entrance.\nA: Oh, great! And where exactly can I find that bus?\nB: The bus stop is not far from here. Go straight on and you can easily find it.\nA: Thanks a lot.\nB: You are welcome.", + "cleaned_text": "A: Excuse me, could you tell me which bus I should take to go to the railway station?\nB:I think you'd better take the No. 16 bus. It can take you right to the station without needing to transfer and it's usually the fastest option during this time of day when traffic isn't too heavy.\nA: Sorry to cut in, but do you know how often that bus runs?\nB: Every fifteen minutes.\nA: I really can't wait that long. Are there any other buses that can take me there?\nB:The No. 2 bus also goes to the railway station. You may need to walk a bit after getting off, but it's still quite convenient since the stop is just across the street from the station's main entrance.\nA: Oh, great! And where exactly can I find that bus?\nB: The bus stop is not far from here. Go straight on and you can easily find it.\nA: Thanks a lot.\nB: You are welcome.", + "total_duration": 40.091791383219956, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, could you tell me which bus I should take to go to the railway station?", + "original_text": "Excuse me, could you tell me which bus I should take to go to the railway station?", + "start_time": 0, + "end_time": 4.6788208616780045, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think you'd better take the No. 16 bus. It can take you right", + "original_text": "I think you'd better take the No. 16 bus. It can take you right [interrupt] to the station without needing to transfer and it's usually the fastest option during this time of day when traffic isn't too heavy.", + "start_time": 5.180752927396302, + "end_time": 14.991183766398569, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_1_B.wav", + "silence_duration": 0.5019320657182978, + "is_interrupted": true, + "text_after_interrupt": "to the station without needing to transfer and it's usually the fastest option during this time of day when traffic isn't too heavy." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but do you know how often that bus runs?", + "original_text": "Sorry to cut in, but do you know how often that bus runs?", + "start_time": 8.791455875242107, + "end_time": 12.680798278870226, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_2_A.wav", + "silence_duration": 0.5156295319719097, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Every fifteen minutes.", + "original_text": "Every fifteen minutes.", + "start_time": 15.434309926518502, + "end_time": 16.711407432187436, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_3_B.wav", + "silence_duration": 0.4431261601199335, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I really can't wait that long. Are there any other buses that can take me there?", + "original_text": "I really can't wait that long. Are there any other buses that can take me there?", + "start_time": 17.068723533524967, + "end_time": 21.201875460962608, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_4_A.wav", + "silence_duration": 0.35731610133753217, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The No. 2 bus also goes to the railway station. You may", + "original_text": "The No. 2 bus also goes to the railway station. You may [interrupt] need to walk a bit after getting off, but it's still quite convenient since the stop is just across the street from the station's main entrance.", + "start_time": 21.565812453738573, + "end_time": 31.75937254444152, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_5_B.wav", + "silence_duration": 0.3639369927759658, + "is_interrupted": true, + "text_after_interrupt": "need to walk a bit after getting off, but it's still quite convenient since the stop is just across the street from the station's main entrance." + }, + { + "speaker": "A", + "text": "Oh, great! And where exactly can I find that bus?", + "original_text": "Oh, great! And where exactly can I find that bus?", + "start_time": 29.372791779182275, + "end_time": 32.70485527124577, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_6_A.wav", + "silence_duration": 0.42251036406431736, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The bus stop is not far from here. Go straight on and you can easily find it.", + "original_text": "The bus stop is not far from here. Go straight on and you can easily find it.", + "start_time": 33.26048757053082, + "end_time": 37.19626988345599, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_7_B.wav", + "silence_duration": 0.5556322992850539, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks a lot.", + "original_text": "Thanks a lot.", + "start_time": 37.68402186910667, + "end_time": 38.69408989631756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_8_A.wav", + "silence_duration": 0.4877519856506789, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You are welcome.", + "original_text": "You are welcome.", + "start_time": 39.19785562866965, + "end_time": 40.091823882637904, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--273/temp/line_9_B.wav", + "silence_duration": 0.5037657323520913, + "is_interrupted": false + } + ] + }, + "DialogSum--val--274": { + "original_text": "A: Are we supposed to get off right here? \nB: I think so; hurry up and get [interrupt] on your things before the doors close because the bus driver doesn't usually wait very long and we don't want to miss our stop completely. \nA: Wait, are you sure this is the right stop? I don't want to end up lost. \nB: I don't know. You said this was the right stop. \nA: I think I was wrong. \nB: Did we get off the bus too early? \nA: I don't know; it kind of looks like we might have gotten off a stop too soon, but I'm not entirely sure. \nB: But why did you tell me to get off if you weren't sure? \nA: I'm sorry. I thought this was our stop. I was about to say it looks like we did get off too early. \nB: I really don't feel like walking. \nA: We could always wait for the next bus to come.", + "cleaned_text": "A: Are we supposed to get off right here? \nB:I think so; hurry up and get on your things before the doors close because the bus driver doesn't usually wait very long and we don't want to miss our stop completely.\nA: Wait, are you sure this is the right stop? I don't want to end up lost. \nB: I don't know. You said this was the right stop. \nA: I think I was wrong. \nB: Did we get off the bus too early? \nA: I don't know; it kind of looks like we might have gotten off a stop too soon, but I'm not entirely sure. \nB: But why did you tell me to get off if you weren't sure? \nA: I'm sorry. I thought this was our stop. I was about to say it looks like we did get off too early. \nB: I really don't feel like walking. \nA: We could always wait for the next bus to come.", + "total_duration": 38.41324263038549, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are we supposed to get off right here?", + "original_text": "Are we supposed to get off right here?", + "start_time": 0, + "end_time": 1.9156462585034013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think so; hurry up and get", + "original_text": "I think so; hurry up and get [interrupt] on your things before the doors close because the bus driver doesn't usually wait very long and we don't want to miss our stop completely.", + "start_time": 2.2793606857458055, + "end_time": 10.232195152865987, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_1_B.wav", + "silence_duration": 0.36371442724240427, + "is_interrupted": true, + "text_after_interrupt": "on your things before the doors close because the bus driver doesn't usually wait very long and we don't want to miss our stop completely." + }, + { + "speaker": "A", + "text": "Wait, are you sure this is the right stop? I don't want to end up lost.", + "original_text": "Wait, are you sure this is the right stop? I don't want to end up lost.", + "start_time": 4.090517148330839, + "end_time": 8.966707624521316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_2_A.wav", + "silence_duration": 0.49952134293345585, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't know. You said this was the right stop.", + "original_text": "I don't know. You said this was the right stop.", + "start_time": 10.804391268806596, + "end_time": 12.975457028443785, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_3_B.wav", + "silence_duration": 0.5721961159406075, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think I was wrong.", + "original_text": "I think I was wrong.", + "start_time": 13.45176543144951, + "end_time": 14.844962710361076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_4_A.wav", + "silence_duration": 0.47630840300572597, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Did we get off the bus too early?", + "original_text": "Did we get off the bus too early?", + "start_time": 15.174605317694033, + "end_time": 16.753562233793804, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_5_B.wav", + "silence_duration": 0.3296426073329564, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't know; it kind of looks like we might have gotten off a stop too soon, but I'm not entirely sure.", + "original_text": "I don't know; it kind of looks like we might have gotten off a stop too soon, but I'm not entirely sure.", + "start_time": 17.146178439970406, + "end_time": 23.938015174664283, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_6_A.wav", + "silence_duration": 0.39261620617660054, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But why did you tell me to get off if you weren't sure?", + "original_text": "But why did you tell me to get off if you weren't sure?", + "start_time": 24.361437836917467, + "end_time": 26.799533075012704, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_7_B.wav", + "silence_duration": 0.4234226622531855, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm sorry. I thought this was our stop. I was about to say it looks like we did get off too early.", + "original_text": "I'm sorry. I thought this was our stop. I was about to say it looks like we did get off too early.", + "start_time": 27.135331175158086, + "end_time": 33.12607947447781, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_8_A.wav", + "silence_duration": 0.3357981001453838, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I really don't feel like walking.", + "original_text": "I really don't feel like walking.", + "start_time": 33.69750952211019, + "end_time": 35.33451632483128, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_9_B.wav", + "silence_duration": 0.5714300476323739, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We could always wait for the next bus to come.", + "original_text": "We could always wait for the next bus to come.", + "start_time": 35.835865480803704, + "end_time": 38.4132804467901, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--274/temp/line_10_A.wav", + "silence_duration": 0.5013491559724287, + "is_interrupted": false + } + ] + }, + "DialogSum--val--275": { + "original_text": "A: I saw your ad in The New York Times. I am seriously considering one of the apartments listed in it. \nB: We are happy to help you. May I know which one it [interrupt] would be? That way, I can provide you with more specific information about the amenities, neighborhood features, and any current promotions we might be offering. \nA: Sorry to jump in, it's the two-bedroom apartment on 38th East Street. \nB: Oh, it is conveniently located, isn't it? \nA: That's why I think it may suit my needs. \nB: I believe it will. It comes furnished. You can move in immediately after the lease is [interrupt] signed, so you won't have to wait long and we can even arrange for a professional cleaning service to prepare the space for your arrival if needed. \nA: Hold on, you mentioned it comes furnished, but I wanted to confirm—does the rent of $840 per month include utilities? \nB: No, the $840 does not include utilities. But as I was saying, you can move in immediately after the lease is signed. \nA: Got it. Also, would it be possible for me to rent the apartment on a month-by-month basis? \nB: I believe that can be arranged. But there should be a refundable security deposit, you know, just to cover any potential damages.", + "cleaned_text": "A: I saw your ad in The New York Times. I am seriously considering one of the apartments listed in it. \nB:We are happy to help you. May I know which one it would be? That way, I can provide you with more specific information about the amenities, neighborhood features, and any current promotions we might be offering.\nA: Sorry to jump in, it's the two-bedroom apartment on 38th East Street. \nB: Oh, it is conveniently located, isn't it? \nA: That's why I think it may suit my needs. \nB:I believe it will. It comes furnished. You can move in immediately after the lease is signed, so you won't have to wait long and we can even arrange for a professional cleaning service to prepare the space for your arrival if needed.\nA: Hold on, you mentioned it comes furnished, but I wanted to confirm—does the rent of $840 per month include utilities? \nB: No, the $840 does not include utilities. But as I was saying, you can move in immediately after the lease is signed. \nA: Got it. Also, would it be possible for me to rent the apartment on a month-by-month basis? \nB: I believe that can be arranged. But there should be a refundable security deposit, you know, just to cover any potential damages.", + "total_duration": 65.6015873015873, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I saw your ad in The New York Times. I am seriously considering one of the apartments listed in it.", + "original_text": "I saw your ad in The New York Times. I am seriously considering one of the apartments listed in it.", + "start_time": 0, + "end_time": 6.095238095238095, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We are happy to help you. May I know which one it", + "original_text": "We are happy to help you. May I know which one it [interrupt] would be? That way, I can provide you with more specific information about the amenities, neighborhood features, and any current promotions we might be offering.", + "start_time": 6.4553514486642705, + "end_time": 17.891179113063366, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_1_B.wav", + "silence_duration": 0.3601133534261751, + "is_interrupted": true, + "text_after_interrupt": "would be? That way, I can provide you with more specific information about the amenities, neighborhood features, and any current promotions we might be offering." + }, + { + "speaker": "A", + "text": "Sorry to jump in, it's the two-bedroom apartment on 38th East Street.", + "original_text": "Sorry to jump in, it's the two-bedroom apartment on 38th East Street.", + "start_time": 9.346235802405767, + "end_time": 13.885736936192615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_2_A.wav", + "silence_duration": 0.5769425851582914, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, it is conveniently located, isn't it?", + "original_text": "Oh, it is conveniently located, isn't it?", + "start_time": 18.44957627913601, + "end_time": 20.66708194807025, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_3_B.wav", + "silence_duration": 0.5583971660726437, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's why I think it may suit my needs.", + "original_text": "That's why I think it may suit my needs.", + "start_time": 21.00298264864248, + "end_time": 23.394637977440667, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_4_A.wav", + "silence_duration": 0.33590070057222704, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I believe it will. It comes furnished. You can move in immediately after the lease is", + "original_text": "I believe it will. It comes furnished. You can move in immediately after the lease is [interrupt] signed, so you won't have to wait long and we can even arrange for a professional cleaning service to prepare the space for your arrival if needed.", + "start_time": 23.95948056710987, + "end_time": 35.01217897980828, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_5_B.wav", + "silence_duration": 0.5648425896692029, + "is_interrupted": true, + "text_after_interrupt": "signed, so you won't have to wait long and we can even arrange for a professional cleaning service to prepare the space for your arrival if needed." + }, + { + "speaker": "A", + "text": "Hold on, you mentioned it comes furnished, but I wanted to confirm—does the rent of $840 per month include utilities?", + "original_text": "Hold on, you mentioned it comes furnished, but I wanted to confirm—does the rent of $840 per month include utilities?", + "start_time": 33.9601820190044, + "end_time": 43.236553901090566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_6_A.wav", + "silence_duration": 0.4852903730228356, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, the $840 does not include utilities. But as I was saying, you can move in immediately after the lease is signed.", + "original_text": "No, the $840 does not include utilities. But as I was saying, you can move in immediately after the lease is signed.", + "start_time": 43.57470638800857, + "end_time": 52.00354992542354, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_7_B.wav", + "silence_duration": 0.3381524869180062, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. Also, would it be possible for me to rent the apartment on a month-by-month basis?", + "original_text": "Got it. Also, would it be possible for me to rent the apartment on a month-by-month basis?", + "start_time": 52.43413647840616, + "end_time": 58.1694652765921, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_8_A.wav", + "silence_duration": 0.4305865529826157, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I believe that can be arranged. But there should be a refundable security deposit, you know, just to cover any potential damages.", + "original_text": "I believe that can be arranged. But there should be a refundable security deposit, you know, just to cover any potential damages.", + "start_time": 58.647244170680665, + "end_time": 65.60162058791423, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--275/temp/line_9_B.wav", + "silence_duration": 0.4777788940885682, + "is_interrupted": false + } + ] + }, + "DialogSum--val--276": { + "original_text": "A: Excuse me, this is my first time on a plane. How do I check [interrupt] in and get my boarding pass? I'm a bit nervous about the whole process and want to make sure I don't miss any important steps before my flight.\nB: Sorry to interrupt, but do you have your ticket with you? I can guide you better if I see it. \nA: Yes. Here you are. \nB: You can get a boarding pass at that counter. Do you have anything to check in, like a suitcase or any large luggage? \nA: I just have a handbag, no checked luggage. \nB: Then you could wait in the departure area after going through security. \nA: Is that all I need to do for check-in? \nB: Yeah, I think so. It is very simple. Just make sure to arrive at your gate at least 30 minutes before boarding time to avoid any last-minute rush.", + "cleaned_text": "A:Excuse me, this is my first time on a plane. How do I check in and get my boarding pass? I'm a bit nervous about the whole process and want to make sure I don't miss any important steps before my flight.\nB: Sorry to interrupt, but do you have your ticket with you? I can guide you better if I see it. \nA: Yes. Here you are. \nB: You can get a boarding pass at that counter. Do you have anything to check in, like a suitcase or any large luggage? \nA: I just have a handbag, no checked luggage. \nB: Then you could wait in the departure area after going through security. \nA: Is that all I need to do for check-in? \nB: Yeah, I think so. It is very simple. Just make sure to arrive at your gate at least 30 minutes before boarding time to avoid any last-minute rush.", + "total_duration": 38.71514739229025, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, this is my first time on a plane. How do I check", + "original_text": "Excuse me, this is my first time on a plane. How do I check [interrupt] in and get my boarding pass? I'm a bit nervous about the whole process and want to make sure I don't miss any important steps before my flight.", + "start_time": 0, + "end_time": 12.956734693877552, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "in and get my boarding pass? I'm a bit nervous about the whole process and want to make sure I don't miss any important steps before my flight." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but do you have your ticket with you? I can guide you better if I see it.", + "original_text": "Sorry to interrupt, but do you have your ticket with you? I can guide you better if I see it.", + "start_time": 4.179591836734694, + "end_time": 8.870022675736962, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_1_B.wav", + "silence_duration": 0.5967192597980187, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes. Here you are.", + "original_text": "Yes. Here you are.", + "start_time": 13.336113957463173, + "end_time": 14.810581077644578, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_2_A.wav", + "silence_duration": 0.379379263585621, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You can get a boarding pass at that counter. Do you have anything to check in, like a suitcase or any large luggage?", + "original_text": "You can get a boarding pass at that counter. Do you have anything to check in, like a suitcase or any large luggage?", + "start_time": 15.274100566975426, + "end_time": 20.545030272190843, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_3_B.wav", + "silence_duration": 0.46351948933084786, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I just have a handbag, no checked luggage.", + "original_text": "I just have a handbag, no checked luggage.", + "start_time": 20.971865650248922, + "end_time": 23.74665023074779, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_4_A.wav", + "silence_duration": 0.42683537805807836, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Then you could wait in the departure area after going through security.", + "original_text": "Then you could wait in the departure area after going through security.", + "start_time": 24.337882644021075, + "end_time": 27.495796476220622, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_5_B.wav", + "silence_duration": 0.5912324132732846, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is that all I need to do for check-in?", + "original_text": "Is that all I need to do for check-in?", + "start_time": 27.9874852090263, + "end_time": 30.065671150069385, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_6_A.wav", + "silence_duration": 0.4916887328056757, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I think so. It is very simple. Just make sure to arrive at your gate at least 30 minutes before boarding time to avoid any last-minute rush.", + "original_text": "Yeah, I think so. It is very simple. Just make sure to arrive at your gate at least 30 minutes before boarding time to avoid any last-minute rush.", + "start_time": 30.483690012757496, + "end_time": 38.71516393565999, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--276/temp/line_7_B.wav", + "silence_duration": 0.418018862688112, + "is_interrupted": false + } + ] + }, + "DialogSum--val--278": { + "original_text": "A: I would like high-speed internet installed in my house. \nB: You have to make an appointment before we can come out and [interrupt] check the availability of our technicians in your area, assess the installation requirements, and provide you with an accurate estimate for the service. \nA: I'd like to make an appointment right now. \nB: Sure, what day are you available? \nA: I would like to have it done this Friday. \nB: Three o'clock is the only time we can [interrupt] fit you into our schedule that day due to high demand and prior commitments from our installation team. \nA: Is it possible for someone to come a little earlier? \nB: I'm sorry, but that's our only available time. \nA: Oh, I see. How about Saturday? \nB: We're completely open on Saturday. \nA: Great, can you come over at 11? \nB: That'll be fine.", + "cleaned_text": "A: I would like high-speed internet installed in my house. \nB:You have to make an appointment before we can come out and check the availability of our technicians in your area, assess the installation requirements, and provide you with an accurate estimate for the service.\nA: I'd like to make an appointment right now. \nB: Sure, what day are you available? \nA: I would like to have it done this Friday. \nB:Three o'clock is the only time we can fit you into our schedule that day due to high demand and prior commitments from our installation team.\nA: Is it possible for someone to come a little earlier? \nB: I'm sorry, but that's our only available time. \nA: Oh, I see. How about Saturday? \nB: We're completely open on Saturday. \nA: Great, can you come over at 11? \nB: That'll be fine.", + "total_duration": 38.380045351473925, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I would like high-speed internet installed in my house.", + "original_text": "I would like high-speed internet installed in my house.", + "start_time": 0, + "end_time": 3.308843537414966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You have to make an appointment before we can come out and", + "original_text": "You have to make an appointment before we can come out and [interrupt] check the availability of our technicians in your area, assess the installation requirements, and provide you with an accurate estimate for the service.", + "start_time": 3.715636075562071, + "end_time": 14.164615667398806, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_1_B.wav", + "silence_duration": 0.4067925381471054, + "is_interrupted": true, + "text_after_interrupt": "check the availability of our technicians in your area, assess the installation requirements, and provide you with an accurate estimate for the service." + }, + { + "speaker": "A", + "text": "I'd like to make an appointment right now.", + "original_text": "I'd like to make an appointment right now.", + "start_time": 6.211781200278624, + "end_time": 8.522166687806969, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_2_A.wav", + "silence_duration": 0.5245745873300025, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, what day are you available?", + "original_text": "Sure, what day are you available?", + "start_time": 14.530209087764145, + "end_time": 16.167215890485235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_3_B.wav", + "silence_duration": 0.36559342036534004, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I would like to have it done this Friday.", + "original_text": "I would like to have it done this Friday.", + "start_time": 16.527372071842212, + "end_time": 18.559118103588244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_4_A.wav", + "silence_duration": 0.3601561813569772, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Three o'clock is the only time we can", + "original_text": "Three o'clock is the only time we can [interrupt] fit you into our schedule that day due to high demand and prior commitments from our installation team.", + "start_time": 18.88650943503955, + "end_time": 26.142745262703947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_5_B.wav", + "silence_duration": 0.32739133145130767, + "is_interrupted": true, + "text_after_interrupt": "fit you into our schedule that day due to high demand and prior commitments from our installation team." + }, + { + "speaker": "A", + "text": "Is it possible for someone to come a little earlier?", + "original_text": "Is it possible for someone to come a little earlier?", + "start_time": 23.776305494982573, + "end_time": 26.574310030129965, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_6_A.wav", + "silence_duration": 0.5959100986872614, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm sorry, but that's our only available time.", + "original_text": "I'm sorry, but that's our only available time.", + "start_time": 26.957967820878014, + "end_time": 29.256743331082095, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_7_B.wav", + "silence_duration": 0.38365779074805106, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. How about Saturday?", + "original_text": "Oh, I see. How about Saturday?", + "start_time": 29.57384609022414, + "end_time": 32.06999121494069, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_8_A.wav", + "silence_duration": 0.3171027591420456, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We're completely open on Saturday.", + "original_text": "We're completely open on Saturday.", + "start_time": 32.59499903738723, + "end_time": 34.42937545462079, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_9_B.wav", + "silence_duration": 0.5250078224465403, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Great, can you come over at 11?", + "original_text": "Great, can you come over at 11?", + "start_time": 34.80961090407725, + "end_time": 37.08516645963281, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_10_A.wav", + "silence_duration": 0.38023544945646726, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That'll be fine.", + "original_text": "That'll be fine.", + "start_time": 37.42802896473981, + "end_time": 38.38004710532938, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--278/temp/line_11_B.wav", + "silence_duration": 0.34286250510699995, + "is_interrupted": false + } + ] + }, + "DialogSum--val--280": { + "original_text": "A: This is awful! It's like drinking saltwater! It's like drowning in the ocean! \nB: Don't be so dramatic. You're such a baby. Now sit down and finish your [interrupt] soup before it gets cold because I spent hours preparing it with fresh ingredients and special spices to help soothe your throat. \nA: Maybe I'll run away first. \nB: Well, the only free food on the streets is from a soup kitchen, and their soup isn't as tasty as mine! \nA: OK, OK. But when we get back from the doctor's, you'll gargle again, right? \nB: I was going to say that before you interrupted—yes, you'll gargle again.", + "cleaned_text": "A: This is awful! It's like drinking saltwater! It's like drowning in the ocean! \nB:Don't be so dramatic. You're such a baby. Now sit down and finish your soup before it gets cold because I spent hours preparing it with fresh ingredients and special spices to help soothe your throat.\nA: Maybe I'll run away first. \nB: Well, the only free food on the streets is from a soup kitchen, and their soup isn't as tasty as mine! \nA: OK, OK. But when we get back from the doctor's, you'll gargle again, right? \nB: I was going to say that before you interrupted—yes, you'll gargle again.", + "total_duration": 30.063492063492063, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "This is awful! It's like drinking saltwater! It's like drowning in the ocean!", + "original_text": "This is awful! It's like drinking saltwater! It's like drowning in the ocean!", + "start_time": 0, + "end_time": 5.2128798185941045, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't be so dramatic. You're such a baby. Now sit down and finish your", + "original_text": "Don't be so dramatic. You're such a baby. Now sit down and finish your [interrupt] soup before it gets cold because I spent hours preparing it with fresh ingredients and special spices to help soothe your throat.", + "start_time": 5.6944174268218575, + "end_time": 15.82992763090349, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/temp/line_1_B.wav", + "silence_duration": 0.4815376082277526, + "is_interrupted": true, + "text_after_interrupt": "soup before it gets cold because I spent hours preparing it with fresh ingredients and special spices to help soothe your throat." + }, + { + "speaker": "A", + "text": "Maybe I'll run away first.", + "original_text": "Maybe I'll run away first.", + "start_time": 9.90883919552934, + "end_time": 11.522626043601903, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/temp/line_2_A.wav", + "silence_duration": 0.4016032430232369, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, the only free food on the streets is from a soup kitchen, and their soup isn't as tasty as mine!", + "original_text": "Well, the only free food on the streets is from a soup kitchen, and their soup isn't as tasty as mine!", + "start_time": 16.148318684824115, + "end_time": 21.163828888905748, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/temp/line_3_B.wav", + "silence_duration": 0.3183910539206242, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, OK. But when we get back from the doctor's, you'll gargle again, right?", + "original_text": "OK, OK. But when we get back from the doctor's, you'll gargle again, right?", + "start_time": 21.49400458420786, + "end_time": 26.207655377858654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/temp/line_4_A.wav", + "silence_duration": 0.3301756953021138, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was going to say that before you interrupted—yes, you'll gargle again.", + "original_text": "I was going to say that before you interrupted—yes, you'll gargle again.", + "start_time": 26.673393268797845, + "end_time": 30.063506647482654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--280/temp/line_5_B.wav", + "silence_duration": 0.4657378909391917, + "is_interrupted": false + } + ] + }, + "DialogSum--val--281": { + "original_text": "A: Correct! Another contrast is the rules for the general and the king. It seems the general or marshal in xiangqi is much too incompetent. They are required to stay in the palace, waiting to be checked and fleeing for life under the cover of the guards. Look at the king in chess, he is much more [interrupt] versatile on the board, moving in any direction, even if only one square at a time, which gives him greater strategic flexibility and makes him a more active participant in the game's overall tactics.\nB: Sorry to jump in, but speaking of the king in chess, don't you think it's interesting how the queen, being the most powerful piece, reflects the social dynamics of the time?\nA: Absolutely, the queen's power does highlight the relatively higher social status of aristocratic women in medieval Europe compared to China. But I was going to mention how the king in chess is much more capable despite not having bodyguards, unlike the general in xiangqi. \nB: That's a good point. By the way, you mentioned something about the board sizes earlier. What were you going to say about that?\nA: Oh, right! There's another distinctive contrast. Both board games use a total of 32 pieces, but xiangqi is played on a 9-by-9 board, bigger than the 8-by-8 board used in chess.\nB: You mean, xiangqi pieces are allowed a larger space in which to move around?", + "cleaned_text": "A:Correct! Another contrast is the rules for the general and the king. It seems the general or marshal in xiangqi is much too incompetent. They are required to stay in the palace, waiting to be checked and fleeing for life under the cover of the guards. Look at the king in chess, he is much more versatile on the board, moving in any direction, even if only one square at a time, which gives him greater strategic flexibility and makes him a more active participant in the game's overall tactics.\nB: Sorry to jump in, but speaking of the king in chess, don't you think it's interesting how the queen, being the most powerful piece, reflects the social dynamics of the time?\nA: Absolutely, the queen's power does highlight the relatively higher social status of aristocratic women in medieval Europe compared to China. But I was going to mention how the king in chess is much more capable despite not having bodyguards, unlike the general in xiangqi. \nB: That's a good point. By the way, you mentioned something about the board sizes earlier. What were you going to say about that?\nA: Oh, right! There's another distinctive contrast. Both board games use a total of 32 pieces, but xiangqi is played on a 9-by-9 board, bigger than the 8-by-8 board used in chess.\nB: You mean, xiangqi pieces are allowed a larger space in which to move around?", + "total_duration": 69.20312925170067, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Correct! Another contrast is the rules for the general and the king. It seems the general or marshal in xiangqi is much too incompetent. They are required to stay in the palace, waiting to be checked and fleeing for life under the cover of the guards. Look at the king in chess, he is much more", + "original_text": "Correct! Another contrast is the rules for the general and the king. It seems the general or marshal in xiangqi is much too incompetent. They are required to stay in the palace, waiting to be checked and fleeing for life under the cover of the guards. Look at the king in chess, he is much more [interrupt] versatile on the board, moving in any direction, even if only one square at a time, which gives him greater strategic flexibility and makes him a more active participant in the game's overall tactics.", + "start_time": 0, + "end_time": 27.96843537414966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "versatile on the board, moving in any direction, even if only one square at a time, which gives him greater strategic flexibility and makes him a more active participant in the game's overall tactics." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but speaking of the king in chess, don't you think it's interesting how the queen, being the most powerful piece, reflects the social dynamics of the time?", + "original_text": "Sorry to jump in, but speaking of the king in chess, don't you think it's interesting how the queen, being the most powerful piece, reflects the social dynamics of the time?", + "start_time": 17.69360544217687, + "end_time": 26.610068027210886, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/temp/line_1_B.wav", + "silence_duration": 0.374773301110778, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely, the queen's power does highlight the relatively higher social status of aristocratic women in medieval Europe compared to China. But I was going to mention how the king in chess is much more capable despite not having bodyguards, unlike the general in xiangqi.", + "original_text": "Absolutely, the queen's power does highlight the relatively higher social status of aristocratic women in medieval Europe compared to China. But I was going to mention how the king in chess is much more capable despite not having bodyguards, unlike the general in xiangqi.", + "start_time": 28.287114493363667, + "end_time": 45.121581613545075, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/temp/line_2_A.wav", + "silence_duration": 0.31867911921400716, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a good point. By the way, you mentioned something about the board sizes earlier. What were you going to say about that?", + "original_text": "That's a good point. By the way, you mentioned something about the board sizes earlier. What were you going to say about that?", + "start_time": 45.43836800524339, + "end_time": 50.95310723426833, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/temp/line_3_B.wav", + "silence_duration": 0.3167863916983122, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right! There's another distinctive contrast. Both board games use a total of 32 pieces, but xiangqi is played on a 9-by-9 board, bigger than the 8-by-8 board used in chess.", + "original_text": "Oh, right! There's another distinctive contrast. Both board games use a total of 32 pieces, but xiangqi is played on a 9-by-9 board, bigger than the 8-by-8 board used in chess.", + "start_time": 51.32935431348254, + "end_time": 64.5647284631424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/temp/line_4_A.wav", + "silence_duration": 0.37624707921420675, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You mean, xiangqi pieces are allowed a larger space in which to move around?", + "original_text": "You mean, xiangqi pieces are allowed a larger space in which to move around?", + "start_time": 65.01196230085819, + "end_time": 69.20316411491714, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--281/temp/line_5_B.wav", + "silence_duration": 0.44723383771579, + "is_interrupted": false + } + ] + }, + "DialogSum--val--282": { + "original_text": "A: Well, this is a pleasant surprise. It seems to me we ran into each other here last week [interrupt] I was actually on my way to grab some coffee, just like last time, and I was thinking how funny it is that we keep meeting in this exact same spot by the produce section.\nB: Oh, that's right! I remember now. We must be on the same grocery schedule. I guess the only way to beat the crowds on a Saturday is to be here when they open at 9:00 o'clock sharp!\nA: Exactly! But I was about to say that last week, we talked about trying that new bakery down the street. Did you get a chance to check it out? Their croissants are supposed to be absolutely divine, made with authentic French butter and baked fresh every morning.", + "cleaned_text": "A:Well, this is a pleasant surprise. It seems to me we ran into each other here last week I was actually on my way to grab some coffee, just like last time, and I was thinking how funny it is that we keep meeting in this exact same spot by the produce section.\nB: Oh, that's right! I remember now. We must be on the same grocery schedule. I guess the only way to beat the crowds on a Saturday is to be here when they open at 9:00 o'clock sharp!\nA: Exactly! But I was about to say that last week, we talked about trying that new bakery down the street. Did you get a chance to check it out? Their croissants are supposed to be absolutely divine, made with authentic French butter and baked fresh every morning.", + "total_duration": 32.2908843537415, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--282/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--282/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--282/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, this is a pleasant surprise. It seems to me we ran into each other here last week", + "original_text": "Well, this is a pleasant surprise. It seems to me we ran into each other here last week [interrupt] I was actually on my way to grab some coffee, just like last time, and I was thinking how funny it is that we keep meeting in this exact same spot by the produce section.", + "start_time": 0, + "end_time": 16.439727891156462, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--282/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "I was actually on my way to grab some coffee, just like last time, and I was thinking how funny it is that we keep meeting in this exact same spot by the produce section." + }, + { + "speaker": "B", + "text": "Oh, that's right! I remember now. We must be on the same grocery schedule. I guess the only way to beat the crowds on a Saturday is to be here when they open at 9:00 o'clock sharp!", + "original_text": "Oh, that's right! I remember now. We must be on the same grocery schedule. I guess the only way to beat the crowds on a Saturday is to be here when they open at 9:00 o'clock sharp!", + "start_time": 5.456689342403628, + "end_time": 13.955192743764172, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--282/temp/line_1_B.wav", + "silence_duration": 0.5298057398023649, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Exactly! But I was about to say that last week, we talked about trying that new bakery down the street. Did you get a chance to check it out? Their croissants are supposed to be absolutely divine, made with authentic French butter and baked fresh every morning.", + "original_text": "Exactly! But I was about to say that last week, we talked about trying that new bakery down the street. Did you get a chance to check it out? Their croissants are supposed to be absolutely divine, made with authentic French butter and baked fresh every morning.", + "start_time": 16.954117751830033, + "end_time": 32.29089779718151, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--282/temp/line_2_A.wav", + "silence_duration": 0.5143898606735708, + "is_interrupted": false + } + ] + }, + "DialogSum--val--284": { + "original_text": "A: Excuse me. Is this seat taken? \nB: No. it's not taken. \nA: Oh. thank you. \nB: Oh. let me help you with this. \nA: Oh. thank you. \nB: Do you want to sit by the window? \nA: No. no. no. I like the aisle seat better. You can sit by the window. \nB: My name is Mike Gerard Hogan. Pleased to [interrupt] meet you. I've actually been traveling quite a bit lately for work and it's always nice to make new connections during these long flights. \nA: Sorry to interrupt, but did you say your name was Mike Gerard Hogan? That sounds really familiar. \nB: Yes, that's right. And you're Elsa Tobin, right? How do you do? \nA: How do you do? \nB: Do you live in New York? \nA: No. no. I'm from Florida. \nB: I am, too. But didn't you just get on? I thought you were coming from New York. \nA: Oh, no. I was just passing through New York for a business trip. I actually live in Florida. What about you?", + "cleaned_text": "A: Excuse me. Is this seat taken? \nB: No. it's not taken. \nA: Oh. thank you. \nB: Oh. let me help you with this. \nA: Oh. thank you. \nB: Do you want to sit by the window? \nA: No. no. no. I like the aisle seat better. You can sit by the window. \nB:My name is Mike Gerard Hogan. Pleased to meet you. I've actually been traveling quite a bit lately for work and it's always nice to make new connections during these long flights.\nA: Sorry to interrupt, but did you say your name was Mike Gerard Hogan? That sounds really familiar. \nB: Yes, that's right. And you're Elsa Tobin, right? How do you do? \nA: How do you do? \nB: Do you live in New York? \nA: No. no. I'm from Florida. \nB: I am, too. But didn't you just get on? I thought you were coming from New York. \nA: Oh, no. I was just passing through New York for a business trip. I actually live in Florida. What about you?", + "total_duration": 46.90312925170068, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. Is this seat taken?", + "original_text": "Excuse me. Is this seat taken?", + "start_time": 0, + "end_time": 2.5774149659863945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. it's not taken.", + "original_text": "No. it's not taken.", + "start_time": 3.13974992744283, + "end_time": 4.451677365084554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_1_B.wav", + "silence_duration": 0.5623349614564357, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh. thank you.", + "original_text": "Oh. thank you.", + "start_time": 4.908679293784701, + "end_time": 5.988407184941163, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_2_A.wav", + "silence_duration": 0.4570019287001468, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh. let me help you with this.", + "original_text": "Oh. let me help you with this.", + "start_time": 6.446090359556657, + "end_time": 8.280466776790217, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_3_B.wav", + "silence_duration": 0.4576831746154937, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh. thank you.", + "original_text": "Oh. thank you.", + "start_time": 8.701881203004994, + "end_time": 10.118298436565086, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_4_A.wav", + "silence_duration": 0.421414426214777, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you want to sit by the window?", + "original_text": "Do you want to sit by the window?", + "start_time": 10.622356711201252, + "end_time": 11.818184375600346, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_5_B.wav", + "silence_duration": 0.5040582746361674, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No. no. no. I like the aisle seat better. You can sit by the window.", + "original_text": "No. no. no. I like the aisle seat better. You can sit by the window.", + "start_time": 12.37808490235657, + "end_time": 16.47640689782142, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_6_A.wav", + "silence_duration": 0.5599005267562228, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My name is Mike Gerard Hogan. Pleased to", + "original_text": "My name is Mike Gerard Hogan. Pleased to [interrupt] meet you. I've actually been traveling quite a bit lately for work and it's always nice to make new connections during these long flights.", + "start_time": 17.028726009940694, + "end_time": 26.038068413568812, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_7_B.wav", + "silence_duration": 0.552319112119276, + "is_interrupted": true, + "text_after_interrupt": "meet you. I've actually been traveling quite a bit lately for work and it's always nice to make new connections during these long flights." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but did you say your name was Mike Gerard Hogan? That sounds really familiar.", + "original_text": "Sorry to interrupt, but did you say your name was Mike Gerard Hogan? That sounds really familiar.", + "start_time": 19.443601293387406, + "end_time": 26.177388141459968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_8_A.wav", + "silence_duration": 0.5620896259621571, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that's right. And you're Elsa Tobin, right? How do you do?", + "original_text": "Yes, that's right. And you're Elsa Tobin, right? How do you do?", + "start_time": 26.48612808013697, + "end_time": 30.236150755873933, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_9_B.wav", + "silence_duration": 0.3087399386770028, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How do you do?", + "original_text": "How do you do?", + "start_time": 30.768647154259263, + "end_time": 31.720665294848832, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_10_A.wav", + "silence_duration": 0.5324963983853289, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you live in New York?", + "original_text": "Do you live in New York?", + "start_time": 32.29614933791615, + "end_time": 33.30621736512703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_11_B.wav", + "silence_duration": 0.5754840430673152, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No. no. I'm from Florida.", + "original_text": "No. no. I'm from Florida.", + "start_time": 33.66666144009753, + "end_time": 35.64035758522225, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_12_A.wav", + "silence_duration": 0.36044407497049763, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I am, too. But didn't you just get on? I thought you were coming from New York.", + "original_text": "I am, too. But didn't you just get on? I thought you were coming from New York.", + "start_time": 35.97440843285077, + "end_time": 40.00307056437005, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_13_B.wav", + "silence_duration": 0.334050847628528, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, no. I was just passing through New York for a business trip. I actually live in Florida. What about you?", + "original_text": "Oh, no. I was just passing through New York for a business trip. I actually live in Florida. What about you?", + "start_time": 40.564115411721936, + "end_time": 46.903163030769555, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--284/temp/line_14_A.wav", + "silence_duration": 0.5610448473518869, + "is_interrupted": false + } + ] + }, + "DialogSum--val--286": { + "original_text": "A: Tina, are you coming to band practice this week? Our show is this Friday...only two days away! \nB: Yes, I'm coming tonight. I didn't come last week because my guitar was [interrupt] giving me some issues with the tuning pegs and the bridge alignment, which made it impossible to play properly until I got it professionally adjusted. \nA: Broken? Did you fix your guitar? My sister has a new guitar you can probably borrow if yours is still broken. \nB: Thanks, but I can only play music on my guitar because it's a left-handed guitar...it's for people who use their left hands for most things. I fixed my guitar on Monday night. \nA: Why didn't you fix it sooner? We only have two days until our show. \nB: I've been so busy this month! I have to work at the grocery store and [interrupt] help my mom with some things at home like deep cleaning the house and organizing all our family documents, which has taken up most of my free time. \nA: And watch your little sister, right? That sounds tough. But what about band practice? Have you had time to rehearse?", + "cleaned_text": "A: Tina, are you coming to band practice this week? Our show is this Friday...only two days away! \nB:Yes, I'm coming tonight. I didn't come last week because my guitar was giving me some issues with the tuning pegs and the bridge alignment, which made it impossible to play properly until I got it professionally adjusted.\nA: Broken? Did you fix your guitar? My sister has a new guitar you can probably borrow if yours is still broken. \nB: Thanks, but I can only play music on my guitar because it's a left-handed guitar...it's for people who use their left hands for most things. I fixed my guitar on Monday night. \nA: Why didn't you fix it sooner? We only have two days until our show. \nB:I've been so busy this month! I have to work at the grocery store and help my mom with some things at home like deep cleaning the house and organizing all our family documents, which has taken up most of my free time.\nA: And watch your little sister, right? That sounds tough. But what about band practice? Have you had time to rehearse?", + "total_duration": 50.95546485260771, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Tina, are you coming to band practice this week? Our show is this Friday...only two days away!", + "original_text": "Tina, are you coming to band practice this week? Our show is this Friday...only two days away!", + "start_time": 0, + "end_time": 6.431927437641724, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'm coming tonight. I didn't come last week because my guitar was", + "original_text": "Yes, I'm coming tonight. I didn't come last week because my guitar was [interrupt] giving me some issues with the tuning pegs and the bridge alignment, which made it impossible to play properly until I got it professionally adjusted.", + "start_time": 7.010065454071755, + "end_time": 17.563534841826858, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/temp/line_1_B.wav", + "silence_duration": 0.578138016430032, + "is_interrupted": true, + "text_after_interrupt": "giving me some issues with the tuning pegs and the bridge alignment, which made it impossible to play properly until I got it professionally adjusted." + }, + { + "speaker": "A", + "text": "Broken? Did you fix your guitar? My sister has a new guitar you can probably borrow if yours is still broken.", + "original_text": "Broken? Did you fix your guitar? My sister has a new guitar you can probably borrow if yours is still broken.", + "start_time": 11.108387449536608, + "end_time": 17.818954342960645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/temp/line_2_A.wav", + "silence_duration": 0.3910978620808771, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks, but I can only play music on my guitar because it's a left-handed guitar...it's for people who use their left hands for most things. I fixed my guitar on Monday night.", + "original_text": "Thanks, but I can only play music on my guitar because it's a left-handed guitar...it's for people who use their left hands for most things. I fixed my guitar on Monday night.", + "start_time": 18.415903425671754, + "end_time": 28.191504332701232, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/temp/line_3_B.wav", + "silence_duration": 0.5969490827111108, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why didn't you fix it sooner? We only have two days until our show.", + "original_text": "Why didn't you fix it sooner? We only have two days until our show.", + "start_time": 28.648369517173204, + "end_time": 32.74669151263806, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/temp/line_4_A.wav", + "silence_duration": 0.456865184471972, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've been so busy this month! I have to work at the grocery store and", + "original_text": "I've been so busy this month! I have to work at the grocery store and [interrupt] help my mom with some things at home like deep cleaning the house and organizing all our family documents, which has taken up most of my free time.", + "start_time": 33.255453589183205, + "end_time": 43.83214293158683, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/temp/line_5_B.wav", + "silence_duration": 0.5087620765451477, + "is_interrupted": true, + "text_after_interrupt": "help my mom with some things at home like deep cleaning the house and organizing all our family documents, which has taken up most of my free time." + }, + { + "speaker": "A", + "text": "And watch your little sister, right? That sounds tough. But what about band practice? Have you had time to rehearse?", + "original_text": "And watch your little sister, right? That sounds tough. But what about band practice? Have you had time to rehearse?", + "start_time": 43.97791128576594, + "end_time": 50.95550765764803, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--286/temp/line_6_A.wav", + "silence_duration": 0.4980902771446273, + "is_interrupted": false + } + ] + }, + "DialogSum--val--287": { + "original_text": "A: So, you finally got your doctorate in genetics. Well done!\nB: Thanks. Now, I have to find a job.\nA: What are you thinking of doing?\nB: I'd like to conduct some scientific research into genes. It would be wonderful to make a medical breakthrough.\nA: There must be several private companies that are interested in employing someone like you. You could do some research for a university. There's a lot of discussion about genetics nowadays. Someone with your expertise could really [interrupt] contribute to advancing our understanding of genetic diseases by developing innovative therapies and potentially discovering new genetic markers that could revolutionize personalized medicine.\nB: Sorry to jump in, but speaking of universities, do you think it's better to focus on academic research rather than going into the private sector?\nA: That's a good question. Academic research offers more freedom, but it can be slower due to funding issues. However, I was about to say that someone with your expertise could really contribute to groundbreaking studies. By the way, you mentioned wanting to make a medical breakthrough—are you considering working on any specific diseases?\nB: Yes, I'm particularly interested in genetic disorders. I think there's a lot of potential in that area for new treatments.", + "cleaned_text": "A: So, you finally got your doctorate in genetics. Well done!\nB: Thanks. Now, I have to find a job.\nA: What are you thinking of doing?\nB: I'd like to conduct some scientific research into genes. It would be wonderful to make a medical breakthrough.\nA:There must be several private companies that are interested in employing someone like you. You could do some research for a university. There's a lot of discussion about genetics nowadays. Someone with your expertise could really contribute to advancing our understanding of genetic diseases by developing innovative therapies and potentially discovering new genetic markers that could revolutionize personalized medicine.\nB: Sorry to jump in, but speaking of universities, do you think it's better to focus on academic research rather than going into the private sector?\nA: That's a good question. Academic research offers more freedom, but it can be slower due to funding issues. However, I was about to say that someone with your expertise could really contribute to groundbreaking studies. By the way, you mentioned wanting to make a medical breakthrough—are you considering working on any specific diseases?\nB: Yes, I'm particularly interested in genetic disorders. I think there's a lot of potential in that area for new treatments.", + "total_duration": 64.84462585034014, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So, you finally got your doctorate in genetics. Well done!", + "original_text": "So, you finally got your doctorate in genetics. Well done!", + "start_time": 0, + "end_time": 3.436553287981859, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks. Now, I have to find a job.", + "original_text": "Thanks. Now, I have to find a job.", + "start_time": 3.747600566157096, + "end_time": 5.721296711281813, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_1_B.wav", + "silence_duration": 0.31104727817523703, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What are you thinking of doing?", + "original_text": "What are you thinking of doing?", + "start_time": 6.2886009030921155, + "end_time": 7.7282380913007325, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_2_A.wav", + "silence_duration": 0.5673041918103026, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like to conduct some scientific research into genes. It would be wonderful to make a medical breakthrough.", + "original_text": "I'd like to conduct some scientific research into genes. It would be wonderful to make a medical breakthrough.", + "start_time": 8.05033650109145, + "end_time": 13.379316092928185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_3_B.wav", + "silence_duration": 0.322098409790718, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There must be several private companies that are interested in employing someone like you. You could do some research for a university. There's a lot of discussion about genetics nowadays. Someone with your expertise could really", + "original_text": "There must be several private companies that are interested in employing someone like you. You could do some research for a university. There's a lot of discussion about genetics nowadays. Someone with your expertise could really [interrupt] contribute to advancing our understanding of genetic diseases by developing innovative therapies and potentially discovering new genetic markers that could revolutionize personalized medicine.", + "start_time": 13.700482039834238, + "end_time": 37.55898544119478, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_4_A.wav", + "silence_duration": 0.32116594690605205, + "is_interrupted": true, + "text_after_interrupt": "contribute to advancing our understanding of genetic diseases by developing innovative therapies and potentially discovering new genetic markers that could revolutionize personalized medicine." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but speaking of universities, do you think it's better to focus on academic research rather than going into the private sector?", + "original_text": "Sorry to jump in, but speaking of universities, do you think it's better to focus on academic research rather than going into the private sector?", + "start_time": 27.934314239380726, + "end_time": 35.469189522827435, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_5_B.wav", + "silence_duration": 0.3857182938184326, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a good question. Academic research offers more freedom, but it can be slower due to funding issues. However, I was about to say that someone with your expertise could really contribute to groundbreaking studies. By the way, you mentioned wanting to make a medical breakthrough—are you considering working on any specific diseases?", + "original_text": "That's a good question. Academic research offers more freedom, but it can be slower due to funding issues. However, I was about to say that someone with your expertise could really contribute to groundbreaking studies. By the way, you mentioned wanting to make a medical breakthrough—are you considering working on any specific diseases?", + "start_time": 37.951465898850515, + "end_time": 57.630377463476364, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_6_A.wav", + "silence_duration": 0.39248045765573925, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'm particularly interested in genetic disorders. I think there's a lot of potential in that area for new treatments.", + "original_text": "Yes, I'm particularly interested in genetic disorders. I think there's a lot of potential in that area for new treatments.", + "start_time": 58.02960244063427, + "end_time": 64.84465912997668, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--287/temp/line_7_B.wav", + "silence_duration": 0.39922497715790917, + "is_interrupted": false + } + ] + }, + "DialogSum--val--288": { + "original_text": "A: While you are thinking about what you might like to order for dinner, would you like to order your drinks first? We have some excellent seasonal cocktails that pair [interrupt] perfectly with our menu items and I'd be happy to make recommendations based on your preferences.\nB: Can you tell me where your wine list is?\nA: The wine list is posted right there on the board.\nB: Can we order a mixed drink in this area, or do we need to go to the bar?\nA: Oh, absolutely! We have a wide selection of mixed drinks available from our bar.\nB: Great! Do you have any house specials that you could recommend?\nA: Our most popular drinks are our Cuervo Gold margaritas.\nB: That sounds like a good choice for me. May I have one, please?\nA: Can I bring that to you on the rocks, or would you like it blended with fresh lime juice and a touch of agave syrup for [interrupt] a perfectly balanced flavor profile that complements the tequila beautifully?\nB: Sorry, I meant to ask earlier—can we order mixed drinks to go along with the food later, or do we need to order them separately?\nA: You can definitely order drinks with your food later as well. Now, would you like your margarita on the rocks or blended?\nB: Please bring it to me on the rocks.\nA: Salt or no salt?\nB: I would like it with no salt, please.", + "cleaned_text": "A:While you are thinking about what you might like to order for dinner, would you like to order your drinks first? We have some excellent seasonal cocktails that pair perfectly with our menu items and I'd be happy to make recommendations based on your preferences.\nB: Can you tell me where your wine list is?\nA: The wine list is posted right there on the board.\nB: Can we order a mixed drink in this area, or do we need to go to the bar?\nA: Oh, absolutely! We have a wide selection of mixed drinks available from our bar.\nB: Great! Do you have any house specials that you could recommend?\nA: Our most popular drinks are our Cuervo Gold margaritas.\nB: That sounds like a good choice for me. May I have one, please?\nA:Can I bring that to you on the rocks, or would you like it blended with fresh lime juice and a touch of agave syrup for a perfectly balanced flavor profile that complements the tequila beautifully?\nB: Sorry, I meant to ask earlier—can we order mixed drinks to go along with the food later, or do we need to order them separately?\nA: You can definitely order drinks with your food later as well. Now, would you like your margarita on the rocks or blended?\nB: Please bring it to me on the rocks.\nA: Salt or no salt?\nB: I would like it with no salt, please.", + "total_duration": 68.21841269841269, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "While you are thinking about what you might like to order for dinner, would you like to order your drinks first? We have some excellent seasonal cocktails that pair", + "original_text": "While you are thinking about what you might like to order for dinner, would you like to order your drinks first? We have some excellent seasonal cocktails that pair [interrupt] perfectly with our menu items and I'd be happy to make recommendations based on your preferences.", + "start_time": 0, + "end_time": 14.199002267573697, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "perfectly with our menu items and I'd be happy to make recommendations based on your preferences." + }, + { + "speaker": "B", + "text": "Can you tell me where your wine list is?", + "original_text": "Can you tell me where your wine list is?", + "start_time": 8.359183673469389, + "end_time": 10.216780045351475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_1_B.wav", + "silence_duration": 0.34606820095210633, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The wine list is posted right there on the board.", + "original_text": "The wine list is posted right there on the board.", + "start_time": 14.648148184666818, + "end_time": 17.364882878544368, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_2_A.wav", + "silence_duration": 0.4491459170931208, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Can we order a mixed drink in this area, or do we need to go to the bar?", + "original_text": "Can we order a mixed drink in this area, or do we need to go to the bar?", + "start_time": 17.935065022465125, + "end_time": 21.267128514528615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_3_B.wav", + "silence_duration": 0.5701821439207553, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, absolutely! We have a wide selection of mixed drinks available from our bar.", + "original_text": "Oh, absolutely! We have a wide selection of mixed drinks available from our bar.", + "start_time": 21.567638484066016, + "end_time": 26.69924846139028, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_4_A.wav", + "silence_duration": 0.300509969537401, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Great! Do you have any house specials that you could recommend?", + "original_text": "Great! Do you have any house specials that you could recommend?", + "start_time": 27.20038038902201, + "end_time": 30.49761394911271, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_5_B.wav", + "silence_duration": 0.5011319276317272, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Our most popular drinks are our Cuervo Gold margaritas.", + "original_text": "Our most popular drinks are our Cuervo Gold margaritas.", + "start_time": 30.85731737771049, + "end_time": 34.31709062034088, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_6_A.wav", + "silence_duration": 0.35970342859777754, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds like a good choice for me. May I have one, please?", + "original_text": "That sounds like a good choice for me. May I have one, please?", + "start_time": 34.63681638772635, + "end_time": 37.748290310628846, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_7_B.wav", + "silence_duration": 0.31972576738546976, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can I bring that to you on the rocks, or would you like it blended with fresh lime juice and a touch of agave syrup for", + "original_text": "Can I bring that to you on the rocks, or would you like it blended with fresh lime juice and a touch of agave syrup for [interrupt] a perfectly balanced flavor profile that complements the tequila beautifully?", + "start_time": 38.11391357578991, + "end_time": 48.88797253270601, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_8_A.wav", + "silence_duration": 0.3656232651610648, + "is_interrupted": true, + "text_after_interrupt": "a perfectly balanced flavor profile that complements the tequila beautifully?" + }, + { + "speaker": "B", + "text": "Sorry, I meant to ask earlier—can we order mixed drinks to go along with the food later, or do we need to order them separately?", + "original_text": "Sorry, I meant to ask earlier—can we order mixed drinks to go along with the food later, or do we need to order them separately?", + "start_time": 47.89832101125896, + "end_time": 54.63210785933152, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_9_B.wav", + "silence_duration": 0.34428547179643204, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You can definitely order drinks with your food later as well. Now, would you like your margarita on the rocks or blended?", + "original_text": "You can definitely order drinks with your food later as well. Now, would you like your margarita on the rocks or blended?", + "start_time": 54.97654473026521, + "end_time": 61.988971034120084, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_10_A.wav", + "silence_duration": 0.34443687093368786, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Please bring it to me on the rocks.", + "original_text": "Please bring it to me on the rocks.", + "start_time": 62.335917737381784, + "end_time": 63.97292454010287, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_11_B.wav", + "silence_duration": 0.34694670326170296, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Salt or no salt?", + "original_text": "Salt or no salt?", + "start_time": 64.40329490307104, + "end_time": 65.93581190987376, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_12_A.wav", + "silence_duration": 0.4303703629681638, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I would like it with no salt, please.", + "original_text": "I would like it with no salt, please.", + "start_time": 66.41889033634234, + "end_time": 68.21843682160312, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--288/temp/line_13_B.wav", + "silence_duration": 0.48307842646858445, + "is_interrupted": false + } + ] + }, + "DialogSum--val--289": { + "original_text": "A: How do you feel about teaching my friend how to read? \nB: How old is your friend and why doesn't he know how to [interrupt] read? I'm curious about his background and what specific challenges he might be facing with literacy at his age. \nA: He's 78 and he's a new emigrant from South America and he's never been to school. \nB: Does he even know how to speak English? \nA: No. But I thought that you could start with reading and then go from [interrupt] there to gradually introduce him to basic conversational English through simple vocabulary exercises and daily practice sessions. \nB: Wait, before we move on—does he have any basic understanding of English at all? It might be challenging to teach reading without that foundation. \nA: Oh, good point. I'm not sure if he knows any English at all. But I thought you could start with reading and then maybe work on his speaking skills too. \nB: That was very thoughtful of you to volunteer me. \nA: Come on. You're great at teaching and I know you will love him. He's adorable! \nB: Oh, all right. Have him come over here for dinner. But you get to make dinner!", + "cleaned_text": "A: How do you feel about teaching my friend how to read? \nB:How old is your friend and why doesn't he know how to read? I'm curious about his background and what specific challenges he might be facing with literacy at his age.\nA: He's 78 and he's a new emigrant from South America and he's never been to school. \nB: Does he even know how to speak English? \nA:No. But I thought that you could start with reading and then go from there to gradually introduce him to basic conversational English through simple vocabulary exercises and daily practice sessions.\nB: Wait, before we move on—does he have any basic understanding of English at all? It might be challenging to teach reading without that foundation. \nA: Oh, good point. I'm not sure if he knows any English at all. But I thought you could start with reading and then maybe work on his speaking skills too. \nB: That was very thoughtful of you to volunteer me. \nA: Come on. You're great at teaching and I know you will love him. He's adorable! \nB: Oh, all right. Have him come over here for dinner. But you get to make dinner!", + "total_duration": 52.776326530612245, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How do you feel about teaching my friend how to read?", + "original_text": "How do you feel about teaching my friend how to read?", + "start_time": 0, + "end_time": 2.716734693877551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How old is your friend and why doesn't he know how to", + "original_text": "How old is your friend and why doesn't he know how to [interrupt] read? I'm curious about his background and what specific challenges he might be facing with literacy at his age.", + "start_time": 3.241799242295316, + "end_time": 11.74030264365586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_1_B.wav", + "silence_duration": 0.525064548417765, + "is_interrupted": true, + "text_after_interrupt": "read? I'm curious about his background and what specific challenges he might be facing with literacy at his age." + }, + { + "speaker": "A", + "text": "He's 78 and he's a new emigrant from South America and he's never been to school.", + "original_text": "He's 78 and he's a new emigrant from South America and he's never been to school.", + "start_time": 5.517354797850872, + "end_time": 10.78828450306629, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_2_A.wav", + "silence_duration": 0.5845019758171655, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Does he even know how to speak English?", + "original_text": "Does he even know how to speak English?", + "start_time": 12.125920338360428, + "end_time": 13.844196982351358, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_3_B.wav", + "silence_duration": 0.3856176947045683, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No. But I thought that you could start with reading and then go from", + "original_text": "No. But I thought that you could start with reading and then go from [interrupt] there to gradually introduce him to basic conversational English through simple vocabulary exercises and daily practice sessions.", + "start_time": 14.42925310419167, + "end_time": 25.865080768590765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_4_A.wav", + "silence_duration": 0.5850561218403117, + "is_interrupted": true, + "text_after_interrupt": "there to gradually introduce him to basic conversational English through simple vocabulary exercises and daily practice sessions." + }, + { + "speaker": "B", + "text": "Wait, before we move on—does he have any basic understanding of English at all? It might be challenging to teach reading without that foundation.", + "original_text": "Wait, before we move on—does he have any basic understanding of English at all? It might be challenging to teach reading without that foundation.", + "start_time": 24.55334853878593, + "end_time": 31.449675069398175, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_5_B.wav", + "silence_duration": 0.45789964211133805, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, good point. I'm not sure if he knows any English at all. But I thought you could start with reading and then maybe work on his speaking skills too.", + "original_text": "Oh, good point. I'm not sure if he knows any English at all. But I thought you could start with reading and then maybe work on his speaking skills too.", + "start_time": 31.98003574473605, + "end_time": 40.55980898736644, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_6_A.wav", + "silence_duration": 0.5303606753378727, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That was very thoughtful of you to volunteer me.", + "original_text": "That was very thoughtful of you to volunteer me.", + "start_time": 40.96052729875448, + "end_time": 43.32896267290414, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_7_B.wav", + "silence_duration": 0.4007183113880407, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Come on. You're great at teaching and I know you will love him. He's adorable!", + "original_text": "Come on. You're great at teaching and I know you will love him. He's adorable!", + "start_time": 43.642080644806214, + "end_time": 48.39056137042979, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_8_A.wav", + "silence_duration": 0.31311797190207313, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, all right. Have him come over here for dinner. But you get to make dinner!", + "original_text": "Oh, all right. Have him come over here for dinner. But you get to make dinner!", + "start_time": 48.70125428813866, + "end_time": 52.77635632895498, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--289/temp/line_9_B.wav", + "silence_duration": 0.31069291770886365, + "is_interrupted": false + } + ] + }, + "DialogSum--val--290": { + "original_text": "A: Veronica, wait—before you decide, I didn't get to finish earlier. My assignment, it's over, but I need you to know that it was never about deceiving you. I had no choice. But now, everything can be different. We can start fresh, without anything between us. [interrupt] I want us to build a life together, with complete honesty and trust, where we can share our dreams and face whatever challenges come our way as partners who truly understand each other.\nB: I understand, but Steven, it's not just about the mission or India. It's about trust, and that's something I'm struggling with right now. I need time to think about whether I can truly open my heart again after everything that's happened between us.", + "cleaned_text": "A:Veronica, wait—before you decide, I didn't get to finish earlier. My assignment, it's over, but I need you to know that it was never about deceiving you. I had no choice. But now, everything can be different. We can start fresh, without anything between us. I want us to build a life together, with complete honesty and trust, where we can share our dreams and face whatever challenges come our way as partners who truly understand each other.\nB: I understand, but Steven, it's not just about the mission or India. It's about trust, and that's something I'm struggling with right now. I need time to think about whether I can truly open my heart again after everything that's happened between us.", + "total_duration": 28.606984126984127, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--290/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--290/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--290/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Veronica, wait—before you decide, I didn't get to finish earlier. My assignment, it's over, but I need you to know that it was never about deceiving you. I had no choice. But now, everything can be different. We can start fresh, without anything between us.", + "original_text": "Veronica, wait—before you decide, I didn't get to finish earlier. My assignment, it's over, but I need you to know that it was never about deceiving you. I had no choice. But now, everything can be different. We can start fresh, without anything between us. [interrupt] I want us to build a life together, with complete honesty and trust, where we can share our dreams and face whatever challenges come our way as partners who truly understand each other.", + "start_time": 0, + "end_time": 27.678185941043083, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--290/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "I want us to build a life together, with complete honesty and trust, where we can share our dreams and face whatever challenges come our way as partners who truly understand each other." + }, + { + "speaker": "B", + "text": "I understand, but Steven, it's not just about the mission or India. It's about trust, and that's something I'm struggling with right now. I need time to think about whether I can truly open my heart again after everything that's happened between us.", + "original_text": "I understand, but Steven, it's not just about the mission or India. It's about trust, and that's something I'm struggling with right now. I need time to think about whether I can truly open my heart again after everything that's happened between us.", + "start_time": 15.917278911564626, + "end_time": 28.606984126984127, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--290/temp/line_1_B.wav", + "silence_duration": 0.36217913244397093, + "is_interrupted": false + } + ] + }, + "DialogSum--val--291": { + "original_text": "A: I was told to come to you to get a chest X-ray. \nB: No problem. Just take your clothes off from the waist up and put the gown on, with the opening in the [interrupt] front, so we can get a clear image of your lungs and heart without any obstructions from clothing or other materials. \nA: Sorry, should I take off any jewelry too? \nB: Yes, it's best to remove any jewelry. Now, after you put the gown on with the opening in the back, you will stand over here up against this plate. \nA: Should I just stand naturally? \nB: You will raise your arms up shoulder high. \nA: Is this all right? \nB: Yes, you are doing great. \nA: Where will you be going? \nB: I need to stand behind this shield. Now you will take a deep breath, hold it, and [interrupt] I will quickly take the X-ray while maintaining proper positioning to ensure we capture the clearest possible diagnostic images for the radiologist to review. \nA: Just to clarify, how long should I hold my breath? \nB: Only for a few seconds. Then you can let it out. After that, you can get dressed when the film is developed.", + "cleaned_text": "A: I was told to come to you to get a chest X-ray. \nB:No problem. Just take your clothes off from the waist up and put the gown on, with the opening in the front, so we can get a clear image of your lungs and heart without any obstructions from clothing or other materials.\nA: Sorry, should I take off any jewelry too? \nB: Yes, it's best to remove any jewelry. Now, after you put the gown on with the opening in the back, you will stand over here up against this plate. \nA: Should I just stand naturally? \nB: You will raise your arms up shoulder high. \nA: Is this all right? \nB: Yes, you are doing great. \nA: Where will you be going? \nB:I need to stand behind this shield. Now you will take a deep breath, hold it, and I will quickly take the X-ray while maintaining proper positioning to ensure we capture the clearest possible diagnostic images for the radiologist to review.\nA: Just to clarify, how long should I hold my breath? \nB: Only for a few seconds. Then you can let it out. After that, you can get dressed when the film is developed.", + "total_duration": 50.290022675736964, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I was told to come to you to get a chest X-ray.", + "original_text": "I was told to come to you to get a chest X-ray.", + "start_time": 0, + "end_time": 3.274013605442177, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem. Just take your clothes off from the waist up and put the gown on, with the opening in the", + "original_text": "No problem. Just take your clothes off from the waist up and put the gown on, with the opening in the [interrupt] front, so we can get a clear image of your lungs and heart without any obstructions from clothing or other materials.", + "start_time": 3.8074356191015557, + "end_time": 13.884895936561874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_1_B.wav", + "silence_duration": 0.5334220136593788, + "is_interrupted": true, + "text_after_interrupt": "front, so we can get a clear image of your lungs and heart without any obstructions from clothing or other materials." + }, + { + "speaker": "A", + "text": "Sorry, should I take off any jewelry too?", + "original_text": "Sorry, should I take off any jewelry too?", + "start_time": 8.184397070348721, + "end_time": 10.634102285768222, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_2_A.wav", + "silence_duration": 0.47149633677665403, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's best to remove any jewelry. Now, after you put the gown on with the opening in the back, you will stand over here up against this plate.", + "original_text": "Yes, it's best to remove any jewelry. Now, after you put the gown on with the opening in the back, you will stand over here up against this plate.", + "start_time": 14.385984974754308, + "end_time": 21.4564611652305, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_3_B.wav", + "silence_duration": 0.5010890381924342, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Should I just stand naturally?", + "original_text": "Should I just stand naturally?", + "start_time": 21.910151449030216, + "end_time": 23.558768229075568, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_4_A.wav", + "silence_duration": 0.45369028379971477, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You will raise your arms up shoulder high.", + "original_text": "You will raise your arms up shoulder high.", + "start_time": 23.901913335837108, + "end_time": 25.8523895263133, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_5_B.wav", + "silence_duration": 0.3431451067615391, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is this all right?", + "original_text": "Is this all right?", + "start_time": 26.373223623666846, + "end_time": 27.4877814467961, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_6_A.wav", + "silence_duration": 0.520834097353547, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, you are doing great.", + "original_text": "Yes, you are doing great.", + "start_time": 27.90804351619775, + "end_time": 29.196750999190947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_7_B.wav", + "silence_duration": 0.42026206940164995, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Where will you be going?", + "original_text": "Where will you be going?", + "start_time": 29.602081714658226, + "end_time": 30.960449061597, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_8_A.wav", + "silence_duration": 0.4053307154672793, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I need to stand behind this shield. Now you will take a deep breath, hold it, and", + "original_text": "I need to stand behind this shield. Now you will take a deep breath, hold it, and [interrupt] I will quickly take the X-ray while maintaining proper positioning to ensure we capture the clearest possible diagnostic images for the radiologist to review.", + "start_time": 31.303036202381772, + "end_time": 44.31782078288064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_9_B.wav", + "silence_duration": 0.34258714078477254, + "is_interrupted": true, + "text_after_interrupt": "I will quickly take the X-ray while maintaining proper positioning to ensure we capture the clearest possible diagnostic images for the radiologist to review." + }, + { + "speaker": "A", + "text": "Just to clarify, how long should I hold my breath?", + "original_text": "Just to clarify, how long should I hold my breath?", + "start_time": 38.2861888303708, + "end_time": 41.502152549191656, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_10_A.wav", + "silence_duration": 0.5538737051171211, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Only for a few seconds. Then you can let it out. After that, you can get dressed when the film is developed.", + "original_text": "Only for a few seconds. Then you can let it out. After that, you can get dressed when the film is developed.", + "start_time": 44.856573788185216, + "end_time": 50.29004317594032, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--291/temp/line_11_B.wav", + "silence_duration": 0.5387530053045807, + "is_interrupted": false + } + ] + }, + "DialogSum--val--292": { + "original_text": "A: Oh, man. Nobody can stand this kind of burning heat.\nB: Tell me about it. You can't even stay in the sun for 5 minutes. You'll be dried up like a [interrupt] raisin in no time if you don't find some shade or proper hydration to protect yourself from this extreme weather.\nA: Sorry to jump in, but I was just thinking—do you have any plans for this afternoon? Maybe we could stay indoors and catch up on some movies.\nB: I like your humor, Mark. Anyway, I guess this afternoon, there is nothing we can do but stay home. I don't want to be taken to the hospital [interrupt] with a heatstroke or something worse, especially since the nearest medical facility is about 30 minutes away in this terrible traffic.\nA: Yeah, speaking of staying home, do you have any beer? It could help us cool down a bit.\nB: Yes, do you want Coors Light or Corona? I also have some snacks if you're feeling peckish while we watch those movies you mentioned earlier.", + "cleaned_text": "A: Oh, man. Nobody can stand this kind of burning heat.\nB:Tell me about it. You can't even stay in the sun for 5 minutes. You'll be dried up like a raisin in no time if you don't find some shade or proper hydration to protect yourself from this extreme weather.\nA: Sorry to jump in, but I was just thinking—do you have any plans for this afternoon? Maybe we could stay indoors and catch up on some movies.\nB:I like your humor, Mark. Anyway, I guess this afternoon, there is nothing we can do but stay home. I don't want to be taken to the hospital with a heatstroke or something worse, especially since the nearest medical facility is about 30 minutes away in this terrible traffic.\nA: Yeah, speaking of staying home, do you have any beer? It could help us cool down a bit.\nB: Yes, do you want Coors Light or Corona? I also have some snacks if you're feeling peckish while we watch those movies you mentioned earlier.", + "total_duration": 43.83369614512472, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Oh, man. Nobody can stand this kind of burning heat.", + "original_text": "Oh, man. Nobody can stand this kind of burning heat.", + "start_time": 0, + "end_time": 3.030204081632653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Tell me about it. You can't even stay in the sun for 5 minutes. You'll be dried up like a", + "original_text": "Tell me about it. You can't even stay in the sun for 5 minutes. You'll be dried up like a [interrupt] raisin in no time if you don't find some shade or proper hydration to protect yourself from this extreme weather.", + "start_time": 3.457308658412221, + "end_time": 13.407059225305645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/temp/line_1_B.wav", + "silence_duration": 0.42710457677956815, + "is_interrupted": true, + "text_after_interrupt": "raisin in no time if you don't find some shade or proper hydration to protect yourself from this extreme weather." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I was just thinking—do you have any plans for this afternoon? Maybe we could stay indoors and catch up on some movies.", + "original_text": "Sorry to jump in, but I was just thinking—do you have any plans for this afternoon? Maybe we could stay indoors and catch up on some movies.", + "start_time": 7.927149928253491, + "end_time": 16.623022944126507, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/temp/line_2_A.wav", + "silence_duration": 0.37438737452265, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like your humor, Mark. Anyway, I guess this afternoon, there is nothing we can do but stay home. I don't want to be taken to the hospital", + "original_text": "I like your humor, Mark. Anyway, I guess this afternoon, there is nothing we can do but stay home. I don't want to be taken to the hospital [interrupt] with a heatstroke or something worse, especially since the nearest medical facility is about 30 minutes away in this terrible traffic.", + "start_time": 16.97940492588555, + "end_time": 30.609518304570358, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/temp/line_3_B.wav", + "silence_duration": 0.3563819817590435, + "is_interrupted": true, + "text_after_interrupt": "with a heatstroke or something worse, especially since the nearest medical facility is about 30 minutes away in this terrible traffic." + }, + { + "speaker": "A", + "text": "Yeah, speaking of staying home, do you have any beer? It could help us cool down a bit.", + "original_text": "Yeah, speaking of staying home, do you have any beer? It could help us cool down a bit.", + "start_time": 30.273414999624347, + "end_time": 35.96230388851323, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/temp/line_4_A.wav", + "silence_duration": 0.43372257064373393, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, do you want Coors Light or Corona? I also have some snacks if you're feeling peckish while we watch those movies you mentioned earlier.", + "original_text": "Yes, do you want Coors Light or Corona? I also have some snacks if you're feeling peckish while we watch those movies you mentioned earlier.", + "start_time": 36.43814462932604, + "end_time": 43.83370018488159, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--292/temp/line_5_B.wav", + "silence_duration": 0.47584074081280914, + "is_interrupted": false + } + ] + }, + "DialogSum--val--293": { + "original_text": "A: Oh, heavens, I look terrible.\nB: Come on. I'm sure it's not that bad. Can I come in and take a look, hon[interrupt]? I promise I'll be completely honest with you and give you my best fashion advice if you'll just let me see.\nA: Absolutely not. This shirt looked pretty nice on the shelf. But on my fat body, it looks terrib[interrupt]ly unflattering, and I don't want you to see me like this because I know you'll just try to make me feel better instead of telling me the truth.\nB: Wait, why do you say that? You've always looked great in anything you wear. Maybe it's just the lighting in there or—did you consider trying a different size?\nA: It's not just the size, it's the style too. I thought you like the styles from the eighties.\nB: I do, but I didn't realize there were \"bad\" eighties styles. What do you mean by that?\nA: I like good eighties styles. Not bad eighties styles.\nB: I never knew that you could divide it up like that. I just thought all eighties styles were good.\nA: Very funny. Look, can we just get out of here, please? Let's just try to find a more modern store where they might actually have something that doesn't make me look like some huge cartoon animal from the zoo.\nB: It's all up to you.", + "cleaned_text": "A: Oh, heavens, I look terrible.\nB:Come on. I'm sure it's not that bad. Can I come in and take a look, hon ? I promise I'll be completely honest with you and give you my best fashion advice if you'll just let me see.\nA:Absolutely not. This shirt looked pretty nice on the shelf. But on my fat body, it looks terrib ly unflattering, and I don't want you to see me like this because I know you'll just try to make me feel better instead of telling me the truth.\nB: Wait, why do you say that? You've always looked great in anything you wear. Maybe it's just the lighting in there or—did you consider trying a different size?\nA: It's not just the size, it's the style too. I thought you like the styles from the eighties.\nB: I do, but I didn't realize there were \"bad\" eighties styles. What do you mean by that?\nA: I like good eighties styles. Not bad eighties styles.\nB: I never knew that you could divide it up like that. I just thought all eighties styles were good.\nA: Very funny. Look, can we just get out of here, please? Let's just try to find a more modern store where they might actually have something that doesn't make me look like some huge cartoon animal from the zoo.\nB: It's all up to you.", + "total_duration": 61.269342403628116, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Oh, heavens, I look terrible.", + "original_text": "Oh, heavens, I look terrible.", + "start_time": 0, + "end_time": 1.811156462585034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Come on. I'm sure it's not that bad. Can I come in and take a look, hon", + "original_text": "Come on. I'm sure it's not that bad. Can I come in and take a look, hon[interrupt]? I promise I'll be completely honest with you and give you my best fashion advice if you'll just let me see.", + "start_time": 2.400319679264306, + "end_time": 12.059820813051154, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_1_B.wav", + "silence_duration": 0.5891632166792717, + "is_interrupted": true, + "text_after_interrupt": "? I promise I'll be completely honest with you and give you my best fashion advice if you'll just let me see." + }, + { + "speaker": "A", + "text": "Absolutely not. This shirt looked pretty nice on the shelf. But on my fat body, it looks terrib", + "original_text": "Absolutely not. This shirt looked pretty nice on the shelf. But on my fat body, it looks terrib[interrupt]ly unflattering, and I don't want you to see me like this because I know you'll just try to make me feel better instead of telling me the truth.", + "start_time": 5.92975278584027, + "end_time": 20.244854826656596, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_2_A.wav", + "silence_duration": 0.35580449300286604, + "is_interrupted": true, + "text_after_interrupt": "ly unflattering, and I don't want you to see me like this because I know you'll just try to make me feel better instead of telling me the truth." + }, + { + "speaker": "B", + "text": "Wait, why do you say that? You've always looked great in anything you wear. Maybe it's just the lighting in there or—did you consider trying a different size?", + "original_text": "Wait, why do you say that? You've always looked great in anything you wear. Maybe it's just the lighting in there or—did you consider trying a different size?", + "start_time": 18.731452970453113, + "end_time": 27.009366802652657, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_3_B.wav", + "silence_duration": 0.5451766572723011, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's not just the size, it's the style too. I thought you like the styles from the eighties.", + "original_text": "It's not just the size, it's the style too. I thought you like the styles from the eighties.", + "start_time": 27.447020450686004, + "end_time": 32.93853972506242, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_4_A.wav", + "silence_duration": 0.43765364803334683, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I do, but I didn't realize there were \"bad\" eighties styles. What do you mean by that?", + "original_text": "I do, but I didn't realize there were \"bad\" eighties styles. What do you mean by that?", + "start_time": 33.39619973282347, + "end_time": 37.7847711613949, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_5_B.wav", + "silence_duration": 0.4576600077610474, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I like good eighties styles. Not bad eighties styles.", + "original_text": "I like good eighties styles. Not bad eighties styles.", + "start_time": 38.17410175129059, + "end_time": 41.64548497124524, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_6_A.wav", + "silence_duration": 0.38933058989569413, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I never knew that you could divide it up like that. I just thought all eighties styles were good.", + "original_text": "I never knew that you could divide it up like that. I just thought all eighties styles were good.", + "start_time": 42.163441014385896, + "end_time": 47.07446142254916, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_7_B.wav", + "silence_duration": 0.5179560431406537, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Very funny. Look, can we just get out of here, please? Let's just try to find a more modern store where they might actually have something that doesn't make me look like some huge cartoon animal from the zoo.", + "original_text": "Very funny. Look, can we just get out of here, please? Let's just try to find a more modern store where they might actually have something that doesn't make me look like some huge cartoon animal from the zoo.", + "start_time": 47.44496872791708, + "end_time": 59.69349480501458, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_8_A.wav", + "silence_duration": 0.37050730536791393, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's all up to you.", + "original_text": "It's all up to you.", + "start_time": 60.17802157608321, + "end_time": 61.26935944456394, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--293/temp/line_9_B.wav", + "silence_duration": 0.48452677106863085, + "is_interrupted": false + } + ] + }, + "DialogSum--val--294": { + "original_text": "A: I heard something terrible happen to your son last weekend. \nB: Yes, my family went swimming with Mr. Henry and his son last Saturday. When we got there, my wife and I started looking for a nice spot near the pool. My son ran off by himself and went over to the pool. The next thing we knew, he was in the [interrupt] deep end struggling to stay afloat and we could see the panic in his eyes as he flailed his arms desperately trying to keep his head above water. \nA: Wait, did he know how to swim? \nB: No, he can't. We told him to stay in the shallow part of the pool, but he slipped into the deep part of the pool by accident. \nA: That's horrible. Did anyone notice what was happening? \nB: Yes, luckily Henry was nearby and immediately realized that he was drowning. Henry has taken some swimming lessons. So he knew right away that my son was in danger. \nA: You must have been in shock when you found out what was happening. \nB: Yes, we were so frightened. We'd originally planned to swim there for an hour, but after that, we decided to leave immediately and take him home to rest. \nA: Hold on, what did Henry do when he saw your son in danger? \nB: Oh right, I didn't mention that. Henry quickly jumped into the pool and pulled my son out. After that, we left in a hurry.", + "cleaned_text": "A: I heard something terrible happen to your son last weekend. \nB:Yes, my family went swimming with Mr. Henry and his son last Saturday. When we got there, my wife and I started looking for a nice spot near the pool. My son ran off by himself and went over to the pool. The next thing we knew, he was in the deep end struggling to stay afloat and we could see the panic in his eyes as he flailed his arms desperately trying to keep his head above water.\nA: Wait, did he know how to swim? \nB: No, he can't. We told him to stay in the shallow part of the pool, but he slipped into the deep part of the pool by accident. \nA: That's horrible. Did anyone notice what was happening? \nB: Yes, luckily Henry was nearby and immediately realized that he was drowning. Henry has taken some swimming lessons. So he knew right away that my son was in danger. \nA: You must have been in shock when you found out what was happening. \nB: Yes, we were so frightened. We'd originally planned to swim there for an hour, but after that, we decided to leave immediately and take him home to rest. \nA: Hold on, what did Henry do when he saw your son in danger? \nB: Oh right, I didn't mention that. Henry quickly jumped into the pool and pulled my son out. After that, we left in a hurry.", + "total_duration": 64.23931972789116, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I heard something terrible happen to your son last weekend.", + "original_text": "I heard something terrible happen to your son last weekend.", + "start_time": 0, + "end_time": 3.111473922902494, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, my family went swimming with Mr. Henry and his son last Saturday. When we got there, my wife and I started looking for a nice spot near the pool. My son ran off by himself and went over to the pool. The next thing we knew, he was in the", + "original_text": "Yes, my family went swimming with Mr. Henry and his son last Saturday. When we got there, my wife and I started looking for a nice spot near the pool. My son ran off by himself and went over to the pool. The next thing we knew, he was in the [interrupt] deep end struggling to stay afloat and we could see the panic in his eyes as he flailed his arms desperately trying to keep his head above water.", + "start_time": 3.549438246586923, + "end_time": 22.345991534568782, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_1_B.wav", + "silence_duration": 0.43796432368442906, + "is_interrupted": true, + "text_after_interrupt": "deep end struggling to stay afloat and we could see the panic in his eyes as he flailed his arms desperately trying to keep his head above water." + }, + { + "speaker": "A", + "text": "Wait, did he know how to swim?", + "original_text": "Wait, did he know how to swim?", + "start_time": 15.879234164954271, + "end_time": 17.9109801967003, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_2_A.wav", + "silence_duration": 0.3911012384898643, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, he can't. We told him to stay in the shallow part of the pool, but he slipped into the deep part of the pool by accident.", + "original_text": "No, he can't. We told him to stay in the shallow part of the pool, but he slipped into the deep part of the pool by accident.", + "start_time": 22.81570031193483, + "end_time": 28.945768339145715, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_3_B.wav", + "silence_duration": 0.46970877736604616, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's horrible. Did anyone notice what was happening?", + "original_text": "That's horrible. Did anyone notice what was happening?", + "start_time": 29.295809570062346, + "end_time": 32.848462631286836, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_4_A.wav", + "silence_duration": 0.350041230916631, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, luckily Henry was nearby and immediately realized that he was drowning. Henry has taken some swimming lessons. So he knew right away that my son was in danger.", + "original_text": "Yes, luckily Henry was nearby and immediately realized that he was drowning. Henry has taken some swimming lessons. So he knew right away that my son was in danger.", + "start_time": 33.16578613751817, + "end_time": 41.838439198742655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_5_B.wav", + "silence_duration": 0.31732350623133126, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You must have been in shock when you found out what was happening.", + "original_text": "You must have been in shock when you found out what was happening.", + "start_time": 42.40877322571521, + "end_time": 45.43897730734786, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_6_A.wav", + "silence_duration": 0.5703340269725545, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, we were so frightened. We'd originally planned to swim there for an hour, but after that, we decided to leave immediately and take him home to rest.", + "original_text": "Yes, we were so frightened. We'd originally planned to swim there for an hour, but after that, we decided to leave immediately and take him home to rest.", + "start_time": 45.89474374482554, + "end_time": 53.37156914165094, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_7_B.wav", + "silence_duration": 0.45576643747767565, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hold on, what did Henry do when he saw your son in danger?", + "original_text": "Hold on, what did Henry do when he saw your son in danger?", + "start_time": 53.97134180421597, + "end_time": 57.72136447995293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_8_A.wav", + "silence_duration": 0.5997726625650301, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh right, I didn't mention that. Henry quickly jumped into the pool and pulled my son out. After that, we left in a hurry.", + "original_text": "Oh right, I didn't mention that. Henry quickly jumped into the pool and pulled my son out. After that, we left in a hurry.", + "start_time": 58.260185408621524, + "end_time": 64.23932373061699, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--294/temp/line_9_B.wav", + "silence_duration": 0.5388209286685908, + "is_interrupted": false + } + ] + }, + "DialogSum--val--295": { + "original_text": "A: How is your mother feeling these days? \nB: Much better, thanks. She'll be back home in a few [interrupt] days, and we're all really relieved because the doctors said her recovery has been remarkable considering her initial condition. \nA: Sorry to interrupt, but do you need any help with her care once she's back? I mean, it might be overwhelming to manage everything on your own. \nB: I appreciate the offer, but I think I'll need a week to take care of her and do some cleaning. \nA: Why don't you hire someone to do it? You'll be able to work and also have more free time. \nB: I prefer to do it myself. \nA: You're a kind and thoughtful man. I admire you very much. \nB: I'm just a regular son. Oh, and I was about to say earlier, she'll be back home in a few days, and we're all really looking forward to it.", + "cleaned_text": "A: How is your mother feeling these days? \nB:Much better, thanks. She'll be back home in a few days, and we're all really relieved because the doctors said her recovery has been remarkable considering her initial condition.\nA: Sorry to interrupt, but do you need any help with her care once she's back? I mean, it might be overwhelming to manage everything on your own. \nB: I appreciate the offer, but I think I'll need a week to take care of her and do some cleaning. \nA: Why don't you hire someone to do it? You'll be able to work and also have more free time. \nB: I prefer to do it myself. \nA: You're a kind and thoughtful man. I admire you very much. \nB: I'm just a regular son. Oh, and I was about to say earlier, she'll be back home in a few days, and we're all really looking forward to it.", + "total_duration": 37.31832199546485, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How is your mother feeling these days?", + "original_text": "How is your mother feeling these days?", + "start_time": 0, + "end_time": 2.136235827664399, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Much better, thanks. She'll be back home in a few", + "original_text": "Much better, thanks. She'll be back home in a few [interrupt] days, and we're all really relieved because the doctors said her recovery has been remarkable considering her initial condition.", + "start_time": 2.5578600739010637, + "end_time": 11.509152590907867, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_1_B.wav", + "silence_duration": 0.42162424623666483, + "is_interrupted": true, + "text_after_interrupt": "days, and we're all really relieved because the doctors said her recovery has been remarkable considering her initial condition." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but do you need any help with her care once she's back? I mean, it might be overwhelming to manage everything on your own.", + "original_text": "Sorry to interrupt, but do you need any help with her care once she's back? I mean, it might be overwhelming to manage everything on your own.", + "start_time": 5.112055085238932, + "end_time": 13.448018804059794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_2_A.wav", + "silence_duration": 0.5698175293143477, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I appreciate the offer, but I think I'll need a week to take care of her and do some cleaning.", + "original_text": "I appreciate the offer, but I think I'll need a week to take care of her and do some cleaning.", + "start_time": 13.948767624829438, + "end_time": 18.221239280158237, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_3_B.wav", + "silence_duration": 0.500748820769644, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why don't you hire someone to do it? You'll be able to work and also have more free time.", + "original_text": "Why don't you hire someone to do it? You'll be able to work and also have more free time.", + "start_time": 18.618123893122736, + "end_time": 23.656854051852896, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_4_A.wav", + "silence_duration": 0.3968846129644981, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I prefer to do it myself.", + "original_text": "I prefer to do it myself.", + "start_time": 24.14901384368837, + "end_time": 25.658310895842565, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_5_B.wav", + "silence_duration": 0.4921597918354713, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're a kind and thoughtful man. I admire you very much.", + "original_text": "You're a kind and thoughtful man. I admire you very much.", + "start_time": 26.019924501003654, + "end_time": 29.839607040686193, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_6_A.wav", + "silence_duration": 0.36161360516108787, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm just a regular son. Oh, and I was about to say earlier, she'll be back home in a few days, and we're all really looking forward to it.", + "original_text": "I'm just a regular son. Oh, and I was about to say earlier, she'll be back home in a few days, and we're all really looking forward to it.", + "start_time": 30.387182649933365, + "end_time": 37.3183391125184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--295/temp/line_7_B.wav", + "silence_duration": 0.5475756092471702, + "is_interrupted": false + } + ] + }, + "DialogSum--val--296": { + "original_text": "A: My car doesn't always start in the morning and it often makes me late for work. I think I'd better buy a new car.\nB: Gina, you should go to Jimmy's garage. I take my car there all the time. They have 20 years of experience and they are especially good at repairing older cars.\nA: Thank you, the last time I took my car to a garage. They didn't really [interrupt] fix the issue completely, which made me lose confidence in their service and I ended up spending more money on temporary solutions that didn't last very long at all.\nB: Oh, that's frustrating! But trust me, Jimmy's is different. You should call and make an appointment now. They do a good job.\nA: I'll consider that. But I was going to say, they didn't really settle the problem last time, so I'm a bit hesitant. Are you sure Jimmy's can handle it better?\nB: Absolutely. They are usually not busy after 6:00 o'clock, so you can even drop by after work.", + "cleaned_text": "A: My car doesn't always start in the morning and it often makes me late for work. I think I'd better buy a new car.\nB: Gina, you should go to Jimmy's garage. I take my car there all the time. They have 20 years of experience and they are especially good at repairing older cars.\nA:Thank you, the last time I took my car to a garage. They didn't really fix the issue completely, which made me lose confidence in their service and I ended up spending more money on temporary solutions that didn't last very long at all.\nB: Oh, that's frustrating! But trust me, Jimmy's is different. You should call and make an appointment now. They do a good job.\nA: I'll consider that. But I was going to say, they didn't really settle the problem last time, so I'm a bit hesitant. Are you sure Jimmy's can handle it better?\nB: Absolutely. They are usually not busy after 6:00 o'clock, so you can even drop by after work.", + "total_duration": 45.33637188208617, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "My car doesn't always start in the morning and it often makes me late for work. I think I'd better buy a new car.", + "original_text": "My car doesn't always start in the morning and it often makes me late for work. I think I'd better buy a new car.", + "start_time": 0, + "end_time": 6.489977324263038, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Gina, you should go to Jimmy's garage. I take my car there all the time. They have 20 years of experience and they are especially good at repairing older cars.", + "original_text": "Gina, you should go to Jimmy's garage. I take my car there all the time. They have 20 years of experience and they are especially good at repairing older cars.", + "start_time": 6.893648556719448, + "end_time": 15.067072593000628, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/temp/line_1_B.wav", + "silence_duration": 0.4036712324564098, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you, the last time I took my car to a garage. They didn't really", + "original_text": "Thank you, the last time I took my car to a garage. They didn't really [interrupt] fix the issue completely, which made me lose confidence in their service and I ended up spending more money on temporary solutions that didn't last very long at all.", + "start_time": 15.566176987905637, + "end_time": 29.335610094481602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/temp/line_2_A.wav", + "silence_duration": 0.4991043949050095, + "is_interrupted": true, + "text_after_interrupt": "fix the issue completely, which made me lose confidence in their service and I ended up spending more money on temporary solutions that didn't last very long at all." + }, + { + "speaker": "B", + "text": "Oh, that's frustrating! But trust me, Jimmy's is different. You should call and make an appointment now. They do a good job.", + "original_text": "Oh, that's frustrating! But trust me, Jimmy's is different. You should call and make an appointment now. They do a good job.", + "start_time": 19.74576882464033, + "end_time": 26.340235944821735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/temp/line_3_B.wav", + "silence_duration": 0.35325298758932117, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'll consider that. But I was going to say, they didn't really settle the problem last time, so I'm a bit hesitant. Are you sure Jimmy's can handle it better?", + "original_text": "I'll consider that. But I was going to say, they didn't really settle the problem last time, so I'm a bit hesitant. Are you sure Jimmy's can handle it better?", + "start_time": 29.709544928519115, + "end_time": 39.54319572216991, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/temp/line_4_A.wav", + "silence_duration": 0.37393483403751265, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Absolutely. They are usually not busy after 6:00 o'clock, so you can even drop by after work.", + "original_text": "Absolutely. They are usually not busy after 6:00 o'clock, so you can even drop by after work.", + "start_time": 40.123512043686006, + "end_time": 45.33639186228011, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--296/temp/line_5_B.wav", + "silence_duration": 0.5803163215160945, + "is_interrupted": false + } + ] + }, + "DialogSum--val--297": { + "original_text": "A: What about taking a tour around Cambridge today? \nB: I did that with a friend yesterday. \nA: But didn't you say you would go to the London Eye [interrupt] yesterday? I thought you were really excited about it because you mentioned how much you wanted to see the panoramic views of the city from that iconic Ferris wheel. \nB: Oh, actually, my friend had already been there, so we decided to change our plan. Today I want to see some modern art work. \nA: If so, you can go to Tate Modern. It's a museum with a collection of international artwork from the nineteen hundreds. \nB: That sounds interesting. Do many people visit it? By the way, what were you saying about the London Eye earlier?", + "cleaned_text": "A: What about taking a tour around Cambridge today? \nB: I did that with a friend yesterday. \nA:But didn't you say you would go to the London Eye yesterday? I thought you were really excited about it because you mentioned how much you wanted to see the panoramic views of the city from that iconic Ferris wheel.\nB: Oh, actually, my friend had already been there, so we decided to change our plan. Today I want to see some modern art work. \nA: If so, you can go to Tate Modern. It's a museum with a collection of international artwork from the nineteen hundreds. \nB: That sounds interesting. Do many people visit it? By the way, what were you saying about the London Eye earlier?", + "total_duration": 31.04231292517007, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What about taking a tour around Cambridge today?", + "original_text": "What about taking a tour around Cambridge today?", + "start_time": 0, + "end_time": 2.670294784580499, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I did that with a friend yesterday.", + "original_text": "I did that with a friend yesterday.", + "start_time": 3.168290168745144, + "end_time": 4.700807175547865, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/temp/line_1_B.wav", + "silence_duration": 0.49799538416464495, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But didn't you say you would go to the London Eye", + "original_text": "But didn't you say you would go to the London Eye [interrupt] yesterday? I thought you were really excited about it because you mentioned how much you wanted to see the panoramic views of the city from that iconic Ferris wheel.", + "start_time": 5.233731054195558, + "end_time": 17.70284670045406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/temp/line_2_A.wav", + "silence_duration": 0.5329238786476929, + "is_interrupted": true, + "text_after_interrupt": "yesterday? I thought you were really excited about it because you mentioned how much you wanted to see the panoramic views of the city from that iconic Ferris wheel." + }, + { + "speaker": "B", + "text": "Oh, actually, my friend had already been there, so we decided to change our plan. Today I want to see some modern art work.", + "original_text": "Oh, actually, my friend had already been there, so we decided to change our plan. Today I want to see some modern art work.", + "start_time": 7.822755997506215, + "end_time": 14.811962346712566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/temp/line_3_B.wav", + "silence_duration": 0.47544114152953376, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "If so, you can go to Tate Modern. It's a museum with a collection of international artwork from the nineteen hundreds.", + "original_text": "If so, you can go to Tate Modern. It's a museum with a collection of international artwork from the nineteen hundreds.", + "start_time": 18.20189466975495, + "end_time": 25.400080610798035, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/temp/line_4_A.wav", + "silence_duration": 0.4990479693008897, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds interesting. Do many people visit it? By the way, what were you saying about the London Eye earlier?", + "original_text": "That sounds interesting. Do many people visit it? By the way, what were you saying about the London Eye earlier?", + "start_time": 25.72498093025301, + "end_time": 31.042350544765483, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--297/temp/line_5_B.wav", + "silence_duration": 0.32490031945497666, + "is_interrupted": false + } + ] + }, + "DialogSum--val--298": { + "original_text": "A: How are you Mrs. Brandon? \nB: Pretty good. How are you [interrupt] I was going to ask how your new job was going since we last spoke about your exciting career transition into the tech industry. \nA: Not so good. I just lost my job today. \nB: Oh no, I'm really sorry to hear that. How are you holding up? \nA: It's been tough, but I'm trying to stay positive. How are your students doing? \nB: They're very nervous about the final. I remember you gave our class a hard final exam in my first year of college, and many of us [interrupt] struggled to pass at first, but through dedicated study sessions and your excellent guidance, we ended up learning a lot more than we expected. \nA: Oh, speaking of finals, do you think your students are prepared enough this time? \nB: They are, but they're still worried. By the way, you mentioned that many of you failed my exam back then, but what I wanted to say was that I'm really glad to hear you learned a lot from it. \nA: Yes, it was challenging, but it must have worked because I can speak very good English now. \nB: I'm so glad to hear that.", + "cleaned_text": "A: How are you Mrs. Brandon? \nB:Pretty good. How are you I was going to ask how your new job was going since we last spoke about your exciting career transition into the tech industry.\nA: Not so good. I just lost my job today. \nB: Oh no, I'm really sorry to hear that. How are you holding up? \nA: It's been tough, but I'm trying to stay positive. How are your students doing? \nB:They're very nervous about the final. I remember you gave our class a hard final exam in my first year of college, and many of us struggled to pass at first, but through dedicated study sessions and your excellent guidance, we ended up learning a lot more than we expected.\nA: Oh, speaking of finals, do you think your students are prepared enough this time? \nB: They are, but they're still worried. By the way, you mentioned that many of you failed my exam back then, but what I wanted to say was that I'm really glad to hear you learned a lot from it. \nA: Yes, it was challenging, but it must have worked because I can speak very good English now. \nB: I'm so glad to hear that.", + "total_duration": 50.42848072562358, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How are you Mrs. Brandon?", + "original_text": "How are you Mrs. Brandon?", + "start_time": 0, + "end_time": 1.474467120181406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Pretty good. How are you", + "original_text": "Pretty good. How are you [interrupt] I was going to ask how your new job was going since we last spoke about your exciting career transition into the tech industry.", + "start_time": 1.8345038834760103, + "end_time": 9.613188690732247, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_1_B.wav", + "silence_duration": 0.3600367632946043, + "is_interrupted": true, + "text_after_interrupt": "I was going to ask how your new job was going since we last spoke about your exciting career transition into the tech industry." + }, + { + "speaker": "A", + "text": "Not so good. I just lost my job today.", + "original_text": "Not so good. I just lost my job today.", + "start_time": 2.9722816612537883, + "end_time": 6.106975538804809, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_2_A.wav", + "silence_duration": 0.5898433537206039, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh no, I'm really sorry to hear that. How are you holding up?", + "original_text": "Oh no, I'm really sorry to hear that. How are you holding up?", + "start_time": 9.933183127953194, + "end_time": 12.986607164234373, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_3_B.wav", + "silence_duration": 0.31999443722094634, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's been tough, but I'm trying to stay positive. How are your students doing?", + "original_text": "It's been tough, but I'm trying to stay positive. How are your students doing?", + "start_time": 13.539421813063532, + "end_time": 18.287902538687113, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_4_A.wav", + "silence_duration": 0.5528146488291583, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "They're very nervous about the final. I remember you gave our class a hard final exam in my first year of college, and many of us", + "original_text": "They're very nervous about the final. I remember you gave our class a hard final exam in my first year of college, and many of us [interrupt] struggled to pass at first, but through dedicated study sessions and your excellent guidance, we ended up learning a lot more than we expected.", + "start_time": 18.646975301196512, + "end_time": 32.70665784087905, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_5_B.wav", + "silence_duration": 0.3590727625093996, + "is_interrupted": true, + "text_after_interrupt": "struggled to pass at first, but through dedicated study sessions and your excellent guidance, we ended up learning a lot more than we expected." + }, + { + "speaker": "A", + "text": "Oh, speaking of finals, do you think your students are prepared enough this time?", + "original_text": "Oh, speaking of finals, do you think your students are prepared enough this time?", + "start_time": 29.285018990404247, + "end_time": 33.754860260245515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_6_A.wav", + "silence_duration": 0.4285242839800171, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "They are, but they're still worried. By the way, you mentioned that many of you failed my exam back then, but what I wanted to say was that I'm really glad to hear you learned a lot from it.", + "original_text": "They are, but they're still worried. By the way, you mentioned that many of you failed my exam back then, but what I wanted to say was that I'm really glad to hear you learned a lot from it.", + "start_time": 34.15039961322589, + "end_time": 42.86949258374744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_7_B.wav", + "silence_duration": 0.39553935298038195, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it was challenging, but it must have worked because I can speak very good English now.", + "original_text": "Yes, it was challenging, but it must have worked because I can speak very good English now.", + "start_time": 43.26244281393628, + "end_time": 48.52176254182744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_8_A.wav", + "silence_duration": 0.39295023018884767, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm so glad to hear that.", + "original_text": "I'm so glad to hear that.", + "start_time": 48.930823750240506, + "end_time": 50.42851082507044, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--298/temp/line_9_B.wav", + "silence_duration": 0.4090612084130659, + "is_interrupted": false + } + ] + }, + "DialogSum--val--299": { + "original_text": "A: You look tired. What time did you get up? \nB: Hmm...I got up at 11:30 AM. I'm having brunch [interrupt] because I didn't have time for breakfast earlier and I was absolutely starving after sleeping through my usual morning routine. \nA: Wait, 11:30 AM? That's really late! Did you stay up all night? \nB: Yeah, I went to bed at 2:00 AM. I was playing computer games and got so absorbed that I lost track of time. \nA: Oh, so you were gaming late into the night. Have you thought about cutting down on that? Maybe finding something else to focus on could help. \nB: You're right. It's just that I'm always crazy about playing the game. It's a pain in the neck to cut down, but I really should try. \nA: Absolutely. If you were busy with other things, you might not even have time to play. But wait, you mentioned brunch earlier—what did you have? \nB: Just something quick, like eggs and toast. And yeah, I'll try to find something more productive to do starting tomorrow. Thanks for the suggestion. \nA: No problem at all. Really nice speaking to you. \nB: You, too. See you later. \nA: See you.", + "cleaned_text": "A: You look tired. What time did you get up? \nB:Hmm...I got up at 11:30 AM. I'm having brunch because I didn't have time for breakfast earlier and I was absolutely starving after sleeping through my usual morning routine.\nA: Wait, 11:30 AM? That's really late! Did you stay up all night? \nB: Yeah, I went to bed at 2:00 AM. I was playing computer games and got so absorbed that I lost track of time. \nA: Oh, so you were gaming late into the night. Have you thought about cutting down on that? Maybe finding something else to focus on could help. \nB: You're right. It's just that I'm always crazy about playing the game. It's a pain in the neck to cut down, but I really should try. \nA: Absolutely. If you were busy with other things, you might not even have time to play. But wait, you mentioned brunch earlier—what did you have? \nB: Just something quick, like eggs and toast. And yeah, I'll try to find something more productive to do starting tomorrow. Thanks for the suggestion. \nA: No problem at all. Really nice speaking to you. \nB: You, too. See you later. \nA: See you.", + "total_duration": 59.9734693877551, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You look tired. What time did you get up?", + "original_text": "You look tired. What time did you get up?", + "start_time": 0, + "end_time": 2.7747845804988662, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hmm...I got up at 11:30 AM. I'm having brunch", + "original_text": "Hmm...I got up at 11:30 AM. I'm having brunch [interrupt] because I didn't have time for breakfast earlier and I was absolutely starving after sleeping through my usual morning routine.", + "start_time": 3.1785263437962414, + "end_time": 12.814807522934563, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_1_B.wav", + "silence_duration": 0.4037417632973754, + "is_interrupted": true, + "text_after_interrupt": "because I didn't have time for breakfast earlier and I was absolutely starving after sleeping through my usual morning routine." + }, + { + "speaker": "A", + "text": "Wait, 11:30 AM? That's really late! Did you stay up all night?", + "original_text": "Wait, 11:30 AM? That's really late! Did you stay up all night?", + "start_time": 6.290000266698735, + "end_time": 11.50288008529284, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_2_A.wav", + "silence_duration": 0.4306184983798105, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I went to bed at 2:00 AM. I was playing computer games and got so absorbed that I lost track of time.", + "original_text": "Yeah, I went to bed at 2:00 AM. I was playing computer games and got so absorbed that I lost track of time.", + "start_time": 13.210390208949851, + "end_time": 19.108258689675473, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_3_B.wav", + "silence_duration": 0.3955826860152887, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, so you were gaming late into the night. Have you thought about cutting down on that? Maybe finding something else to focus on could help.", + "original_text": "Oh, so you were gaming late into the night. Have you thought about cutting down on that? Maybe finding something else to focus on could help.", + "start_time": 19.70497131696817, + "end_time": 27.79712551197951, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_4_A.wav", + "silence_duration": 0.5967126272926953, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You're right. It's just that I'm always crazy about playing the game. It's a pain in the neck to cut down, but I really should try.", + "original_text": "You're right. It's just that I'm always crazy about playing the game. It's a pain in the neck to cut down, but I really should try.", + "start_time": 28.125357173739033, + "end_time": 35.10295354562112, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_5_B.wav", + "silence_duration": 0.328231661759524, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely. If you were busy with other things, you might not even have time to play. But wait, you mentioned brunch earlier—what did you have?", + "original_text": "Absolutely. If you were busy with other things, you might not even have time to play. But wait, you mentioned brunch earlier—what did you have?", + "start_time": 35.529644603602435, + "end_time": 44.42288723398792, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_6_A.wav", + "silence_duration": 0.4266910579813148, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just something quick, like eggs and toast. And yeah, I'll try to find something more productive to do starting tomorrow. Thanks for the suggestion.", + "original_text": "Just something quick, like eggs and toast. And yeah, I'll try to find something more productive to do starting tomorrow. Thanks for the suggestion.", + "start_time": 44.82736817638884, + "end_time": 52.88469243942738, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_7_B.wav", + "silence_duration": 0.40448094240091614, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No problem at all. Really nice speaking to you.", + "original_text": "No problem at all. Really nice speaking to you.", + "start_time": 53.43806183385775, + "end_time": 56.82817521254256, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_8_A.wav", + "silence_duration": 0.5533693944303688, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You, too. See you later.", + "original_text": "You, too. See you later.", + "start_time": 57.270335863857, + "end_time": 58.74480298403841, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_9_B.wav", + "silence_duration": 0.4421606513144378, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "See you.", + "original_text": "See you.", + "start_time": 59.11435783055456, + "end_time": 59.97349615255003, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--299/temp/line_10_A.wav", + "silence_duration": 0.3695548465161549, + "is_interrupted": false + } + ] + }, + "DialogSum--val--301": { + "original_text": "A: Let's go over this plan again. \nB: From Vancouver, we bike along the border all the way to Winnipeg. \nA: And that is mostly flat, right? \nB: Relatively, once we're out of Alberta, anyway. Then it's hills again in Manitoba but nothing we can't handle with the right preparation and [interrupt] proper gear. We should definitely pack some extra climbing gear and maybe even consider lighter bikes for those sections to make the ascent more manageable. \nA: Wait, did you mean Manitoba? I just want to make sure we're talking about the same place. \nB: Oh, yes, Manitoba. Sorry about that. And from Winnipeg, we go around the lakes through Toronto, right? \nA: That's right. And up into Quebec. And that's where we stop. \nB: It doesn't sound like that much when we go over the plan but that's a long, long ride. \nA: Are you ready for the cross country of a lifetime? \nB: Definitely! By the way, you mentioned hills again earlier—how steep are they compared to the ones in Alberta?", + "cleaned_text": "A: Let's go over this plan again. \nB: From Vancouver, we bike along the border all the way to Winnipeg. \nA: And that is mostly flat, right? \nB:Relatively, once we're out of Alberta, anyway. Then it's hills again in Manitoba but nothing we can't handle with the right preparation and proper gear. We should definitely pack some extra climbing gear and maybe even consider lighter bikes for those sections to make the ascent more manageable.\nA: Wait, did you mean Manitoba? I just want to make sure we're talking about the same place. \nB: Oh, yes, Manitoba. Sorry about that. And from Winnipeg, we go around the lakes through Toronto, right? \nA: That's right. And up into Quebec. And that's where we stop. \nB: It doesn't sound like that much when we go over the plan but that's a long, long ride. \nA: Are you ready for the cross country of a lifetime? \nB: Definitely! By the way, you mentioned hills again earlier—how steep are they compared to the ones in Alberta?", + "total_duration": 46.445034013605444, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Let's go over this plan again.", + "original_text": "Let's go over this plan again.", + "start_time": 0, + "end_time": 1.7763265306122449, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "From Vancouver, we bike along the border all the way to Winnipeg.", + "original_text": "From Vancouver, we bike along the border all the way to Winnipeg.", + "start_time": 2.11378672183395, + "end_time": 5.387800327276127, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_1_B.wav", + "silence_duration": 0.3374601912217052, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And that is mostly flat, right?", + "original_text": "And that is mostly flat, right?", + "start_time": 5.966487701620929, + "end_time": 7.766034186881701, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_2_A.wav", + "silence_duration": 0.5786873743448024, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Relatively, once we're out of Alberta, anyway. Then it's hills again in Manitoba but nothing we can't handle with the right preparation and", + "original_text": "Relatively, once we're out of Alberta, anyway. Then it's hills again in Manitoba but nothing we can't handle with the right preparation and [interrupt] proper gear. We should definitely pack some extra climbing gear and maybe even consider lighter bikes for those sections to make the ascent more manageable.", + "start_time": 8.107370817642938, + "end_time": 22.538572631701896, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_3_B.wav", + "silence_duration": 0.34133663076123644, + "is_interrupted": true, + "text_after_interrupt": "proper gear. We should definitely pack some extra climbing gear and maybe even consider lighter bikes for those sections to make the ascent more manageable." + }, + { + "speaker": "A", + "text": "Wait, did you mean Manitoba? I just want to make sure we're talking about the same place.", + "original_text": "Wait, did you mean Manitoba? I just want to make sure we're talking about the same place.", + "start_time": 16.02537535279033, + "end_time": 22.039343606758585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_4_A.wav", + "silence_duration": 0.5674573208943371, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, yes, Manitoba. Sorry about that. And from Winnipeg, we go around the lakes through Toronto, right?", + "original_text": "Oh, yes, Manitoba. Sorry about that. And from Winnipeg, we go around the lakes through Toronto, right?", + "start_time": 23.085910646726862, + "end_time": 28.34523037461802, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_5_B.wav", + "silence_duration": 0.5473380150249663, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's right. And up into Quebec. And that's where we stop.", + "original_text": "That's right. And up into Quebec. And that's where we stop.", + "start_time": 28.71737413164084, + "end_time": 32.71120633118733, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_6_A.wav", + "silence_duration": 0.3721437570228232, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It doesn't sound like that much when we go over the plan but that's a long, long ride.", + "original_text": "It doesn't sound like that much when we go over the plan but that's a long, long ride.", + "start_time": 33.03737886974193, + "end_time": 37.333070479719254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_7_B.wav", + "silence_duration": 0.3261725385546042, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you ready for the cross country of a lifetime?", + "original_text": "Are you ready for the cross country of a lifetime?", + "start_time": 37.92336658253784, + "end_time": 40.75620104965802, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_8_A.wav", + "silence_duration": 0.5902961028185838, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Definitely! By the way, you mentioned hills again earlier—how steep are they compared to the ones in Alberta?", + "original_text": "Definitely! By the way, you mentioned hills again earlier—how steep are they compared to the ones in Alberta?", + "start_time": 41.313426618961415, + "end_time": 46.445036596285675, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--301/temp/line_9_B.wav", + "silence_duration": 0.5572255693033978, + "is_interrupted": false + } + ] + }, + "DialogSum--val--303": { + "original_text": "A: Do you think we should travel by bus or by train? \nB: It's a difficult choice. The train is a little faster, but much more [interrupt] expensive and sometimes the schedules aren't as flexible as bus routes, especially for last-minute trips. \nA: Sorry to cut in, but do you think the extra cost is really worth it for the time saved? \nB: It depends. We could face delays if we travel by bus, thanks to traffic jams. But buses are more cramped and you can't walk around. \nA: That's true. But I feel that I see more when I travel by bus. \nB: Really? I think you see more traveling by train. \nA: So which form of transport do you prefer to use? \nB: I prefer going by train, even though it costs more. \nA: Ok, then we'll go by train. I'm sure we'll have a good journey. Shall we go to the station and buy the tickets? \nB: The trains aren't usually full. We can get them on the day we travel. We should buy return tickets, because they are much [interrupt] cheaper and often come with additional benefits like seat reservations and access to station lounges during longer layovers. \nA: Oh, speaking of tickets, do you know if there's a discount for booking online? \nB: That's a good point. But as I was saying, return tickets are much cheaper than getting two singles, so we should definitely consider that.", + "cleaned_text": "A: Do you think we should travel by bus or by train? \nB:It's a difficult choice. The train is a little faster, but much more expensive and sometimes the schedules aren't as flexible as bus routes, especially for last-minute trips.\nA: Sorry to cut in, but do you think the extra cost is really worth it for the time saved? \nB: It depends. We could face delays if we travel by bus, thanks to traffic jams. But buses are more cramped and you can't walk around. \nA: That's true. But I feel that I see more when I travel by bus. \nB: Really? I think you see more traveling by train. \nA: So which form of transport do you prefer to use? \nB: I prefer going by train, even though it costs more. \nA: Ok, then we'll go by train. I'm sure we'll have a good journey. Shall we go to the station and buy the tickets? \nB:The trains aren't usually full. We can get them on the day we travel. We should buy return tickets, because they are much cheaper and often come with additional benefits like seat reservations and access to station lounges during longer layovers.\nA: Oh, speaking of tickets, do you know if there's a discount for booking online? \nB: That's a good point. But as I was saying, return tickets are much cheaper than getting two singles, so we should definitely consider that.", + "total_duration": 67.53396825396825, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you think we should travel by bus or by train?", + "original_text": "Do you think we should travel by bus or by train?", + "start_time": 0, + "end_time": 2.7747845804988662, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's a difficult choice. The train is a little faster, but much more", + "original_text": "It's a difficult choice. The train is a little faster, but much more [interrupt] expensive and sometimes the schedules aren't as flexible as bus routes, especially for last-minute trips.", + "start_time": 3.1967216485406005, + "end_time": 12.28733389343856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_1_B.wav", + "silence_duration": 0.4219370680417344, + "is_interrupted": true, + "text_after_interrupt": "expensive and sometimes the schedules aren't as flexible as bus routes, especially for last-minute trips." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but do you think the extra cost is really worth it for the time saved?", + "original_text": "Sorry to cut in, but do you think the extra cost is really worth it for the time saved?", + "start_time": 7.295043644005453, + "end_time": 12.914272668948763, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_2_A.wav", + "silence_duration": 0.3828305339874739, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It depends. We could face delays if we travel by bus, thanks to traffic jams. But buses are more cramped and you can't walk around.", + "original_text": "It depends. We could face delays if we travel by bus, thanks to traffic jams. But buses are more cramped and you can't walk around.", + "start_time": 13.248101118158097, + "end_time": 20.98034601611728, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_3_B.wav", + "silence_duration": 0.3338284492093328, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's true. But I feel that I see more when I travel by bus.", + "original_text": "That's true. But I feel that I see more when I travel by bus.", + "start_time": 21.30567936567098, + "end_time": 25.462051247757145, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_4_A.wav", + "silence_duration": 0.32533334955369986, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Really? I think you see more traveling by train.", + "original_text": "Really? I think you see more traveling by train.", + "start_time": 25.892707809504422, + "end_time": 28.771982185921654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_5_B.wav", + "silence_duration": 0.4306565617472762, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So which form of transport do you prefer to use?", + "original_text": "So which form of transport do you prefer to use?", + "start_time": 29.161311442094767, + "end_time": 32.237955433024474, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_6_A.wav", + "silence_duration": 0.3893292561731117, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I prefer going by train, even though it costs more.", + "original_text": "I prefer going by train, even though it costs more.", + "start_time": 32.56453602601996, + "end_time": 35.176780923979145, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_7_B.wav", + "silence_duration": 0.3265805929954815, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ok, then we'll go by train. I'm sure we'll have a good journey. Shall we go to the station and buy the tickets?", + "original_text": "Ok, then we'll go by train. I'm sure we'll have a good journey. Shall we go to the station and buy the tickets?", + "start_time": 35.55800864815421, + "end_time": 42.39628529214514, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_8_A.wav", + "silence_duration": 0.3812277241750629, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The trains aren't usually full. We can get them on the day we travel. We should buy return tickets, because they are much", + "original_text": "The trains aren't usually full. We can get them on the day we travel. We should buy return tickets, because they are much [interrupt] cheaper and often come with additional benefits like seat reservations and access to station lounges during longer layovers.", + "start_time": 42.71033948488301, + "end_time": 55.50453449622088, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_9_B.wav", + "silence_duration": 0.31405419273787055, + "is_interrupted": true, + "text_after_interrupt": "cheaper and often come with additional benefits like seat reservations and access to station lounges during longer layovers." + }, + { + "speaker": "A", + "text": "Oh, speaking of tickets, do you know if there's a discount for booking online?", + "original_text": "Oh, speaking of tickets, do you know if there's a discount for booking online?", + "start_time": 54.98926071175682, + "end_time": 60.14409064372961, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_10_A.wav", + "silence_duration": 0.33209706203054373, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a good point. But as I was saying, return tickets are much cheaper than getting two singles, so we should definitely consider that.", + "original_text": "That's a good point. But as I was saying, return tickets are much cheaper than getting two singles, so we should definitely consider that.", + "start_time": 60.6376527122913, + "end_time": 67.53397924290354, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--303/temp/line_11_B.wav", + "silence_duration": 0.4935620685616904, + "is_interrupted": false + } + ] + }, + "DialogSum--val--304": { + "original_text": "A: Ahhchooo! \nB: You've been sneezing a lot lately. Are you sick or something? \nA: No. Every spring time around April, I'm stricken with [interrupt] seasonal allergies that make my life miserable for weeks on end with constant sneezing, itchy eyes, and a runny nose that just won't quit. It happens every year like clockwork. \nB: Oh, that reminds me, do you take any medication for it? I know some people rely on antihistamines. \nA: I do take antihistamines, but they only help so much. I was going to say that I'm stricken with allergies every April. \nB: I never have seasonal allergies. \nA: Consider yourself lucky. \nB: What are all the symptoms? \nA: Well, as you just saw, I sneeze a lot. Also, my nose becomes very runny, my throat sometimes itches, and my eyes start to water uncontrollably, which makes it hard to focus on anything. \nB: Does it affect your daily activities? Like, can you still work or go outside? \nA: It can be pretty disruptive, especially when my eyes start to water. But I manage. So, you don't have any type of allergies? \nB: Well, I have a severe allergic reaction to alcohol. It runs in the family. \nA: Everyone to some extent is allergic to alcohol. \nB: I get it pretty bad. My whole face turns red, including my ears. My eyes become bloodshot, and I start to itch all over my body.", + "cleaned_text": "A: Ahhchooo! \nB: You've been sneezing a lot lately. Are you sick or something? \nA:No. Every spring time around April, I'm stricken with seasonal allergies that make my life miserable for weeks on end with constant sneezing, itchy eyes, and a runny nose that just won't quit. It happens every year like clockwork.\nB: Oh, that reminds me, do you take any medication for it? I know some people rely on antihistamines. \nA: I do take antihistamines, but they only help so much. I was going to say that I'm stricken with allergies every April. \nB: I never have seasonal allergies. \nA: Consider yourself lucky. \nB: What are all the symptoms? \nA: Well, as you just saw, I sneeze a lot. Also, my nose becomes very runny, my throat sometimes itches, and my eyes start to water uncontrollably, which makes it hard to focus on anything. \nB: Does it affect your daily activities? Like, can you still work or go outside? \nA: It can be pretty disruptive, especially when my eyes start to water. But I manage. So, you don't have any type of allergies? \nB: Well, I have a severe allergic reaction to alcohol. It runs in the family. \nA: Everyone to some extent is allergic to alcohol. \nB: I get it pretty bad. My whole face turns red, including my ears. My eyes become bloodshot, and I start to itch all over my body.", + "total_duration": 75.34498866213151, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Ahhchooo!", + "original_text": "Ahhchooo!", + "start_time": 0, + "end_time": 0.8707482993197279, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You've been sneezing a lot lately. Are you sick or something?", + "original_text": "You've been sneezing a lot lately. Are you sick or something?", + "start_time": 1.2241298518660333, + "end_time": 4.056964318986214, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_1_B.wav", + "silence_duration": 0.35338155254630543, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No. Every spring time around April, I'm stricken with", + "original_text": "No. Every spring time around April, I'm stricken with [interrupt] seasonal allergies that make my life miserable for weeks on end with constant sneezing, itchy eyes, and a runny nose that just won't quit. It happens every year like clockwork.", + "start_time": 4.6266146902370355, + "end_time": 19.278406073456992, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_2_A.wav", + "silence_duration": 0.5696503712508212, + "is_interrupted": true, + "text_after_interrupt": "seasonal allergies that make my life miserable for weeks on end with constant sneezing, itchy eyes, and a runny nose that just won't quit. It happens every year like clockwork." + }, + { + "speaker": "B", + "text": "Oh, that reminds me, do you take any medication for it? I know some people rely on antihistamines.", + "original_text": "Oh, that reminds me, do you take any medication for it? I know some people rely on antihistamines.", + "start_time": 8.376637365973997, + "end_time": 14.193236005429778, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_3_B.wav", + "silence_duration": 0.48304080671126404, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I do take antihistamines, but they only help so much. I was going to say that I'm stricken with allergies every April.", + "original_text": "I do take antihistamines, but they only help so much. I was going to say that I'm stricken with allergies every April.", + "start_time": 19.771443278567283, + "end_time": 27.52690813117499, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_4_A.wav", + "silence_duration": 0.4930372051102892, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I never have seasonal allergies.", + "original_text": "I never have seasonal allergies.", + "start_time": 28.1141185556492, + "end_time": 29.76273533569455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_5_B.wav", + "silence_duration": 0.587210424474209, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Consider yourself lucky.", + "original_text": "Consider yourself lucky.", + "start_time": 30.123898655906935, + "end_time": 31.59836577608834, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_6_A.wav", + "silence_duration": 0.3611633202123842, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What are all the symptoms?", + "original_text": "What are all the symptoms?", + "start_time": 32.11971608943296, + "end_time": 33.3968135951019, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_7_B.wav", + "silence_duration": 0.5213503133446264, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, as you just saw, I sneeze a lot. Also, my nose becomes very runny, my throat sometimes itches, and my eyes start to water uncontrollably, which makes it hard to focus on anything.", + "original_text": "Well, as you just saw, I sneeze a lot. Also, my nose becomes very runny, my throat sometimes itches, and my eyes start to water uncontrollably, which makes it hard to focus on anything.", + "start_time": 33.7520886760344, + "end_time": 46.52306373272374, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_8_A.wav", + "silence_duration": 0.3552750809324981, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Does it affect your daily activities? Like, can you still work or go outside?", + "original_text": "Does it affect your daily activities? Like, can you still work or go outside?", + "start_time": 47.11224370175938, + "end_time": 51.26861558384555, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_9_B.wav", + "silence_duration": 0.5891799690356441, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It can be pretty disruptive, especially when my eyes start to water. But I manage. So, you don't have any type of allergies?", + "original_text": "It can be pretty disruptive, especially when my eyes start to water. But I manage. So, you don't have any type of allergies?", + "start_time": 51.75536387402979, + "end_time": 59.870738023689654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_10_A.wav", + "silence_duration": 0.4867482901842354, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I have a severe allergic reaction to alcohol. It runs in the family.", + "original_text": "Well, I have a severe allergic reaction to alcohol. It runs in the family.", + "start_time": 60.36316783624217, + "end_time": 64.46148983170703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_11_B.wav", + "silence_duration": 0.4924298125525134, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Everyone to some extent is allergic to alcohol.", + "original_text": "Everyone to some extent is allergic to alcohol.", + "start_time": 64.89258065923693, + "end_time": 67.77185503565416, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_12_A.wav", + "silence_duration": 0.4310908275298981, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I get it pretty bad. My whole face turns red, including my ears. My eyes become bloodshot, and I start to itch all over my body.", + "original_text": "I get it pretty bad. My whole face turns red, including my ears. My eyes become bloodshot, and I start to itch all over my body.", + "start_time": 68.13522936975174, + "end_time": 75.34502528811909, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--304/temp/line_13_B.wav", + "silence_duration": 0.36337433409758724, + "is_interrupted": false + } + ] + }, + "DialogSum--val--305": { + "original_text": "A: Let's have a look at the map first. \nB: All right. Wukesong stop is quite a few stops from [interrupt] here on the western line, so we should plan our route accordingly and maybe consider transferring at the next major station to save some time. \nA: Wait, did you say Wukesong? I just realized I might have confused it with another stop. Are we sure that's where we need to go? \nB: Yes, Wukesong is correct. But I was going to say it's quite a few stops from here. Let's buy some tickets. \nA: The train is coming. There are a lot of people waiting here. Let's stand in a better position to make sure we get on quickly and find a spot to sit. \nB: Oh, I see an opening near the doors! Should we move there quickly before it gets too crowded? \nA: Good idea. Well, it's not as crowded as we expected, is it? \nB: No, but it will be soon. Look, there're two empty seats over there. Let's get them before someone else does.", + "cleaned_text": "A: Let's have a look at the map first. \nB:All right. Wukesong stop is quite a few stops from here on the western line, so we should plan our route accordingly and maybe consider transferring at the next major station to save some time.\nA: Wait, did you say Wukesong? I just realized I might have confused it with another stop. Are we sure that's where we need to go? \nB: Yes, Wukesong is correct. But I was going to say it's quite a few stops from here. Let's buy some tickets. \nA: The train is coming. There are a lot of people waiting here. Let's stand in a better position to make sure we get on quickly and find a spot to sit. \nB: Oh, I see an opening near the doors! Should we move there quickly before it gets too crowded? \nA: Good idea. Well, it's not as crowded as we expected, is it? \nB: No, but it will be soon. Look, there're two empty seats over there. Let's get them before someone else does.", + "total_duration": 44.46698412698413, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Let's have a look at the map first.", + "original_text": "Let's have a look at the map first.", + "start_time": 0, + "end_time": 1.9388662131519274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right. Wukesong stop is quite a few stops from", + "original_text": "All right. Wukesong stop is quite a few stops from [interrupt] here on the western line, so we should plan our route accordingly and maybe consider transferring at the next major station to save some time.", + "start_time": 2.269875852529096, + "end_time": 12.358946147313677, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_1_B.wav", + "silence_duration": 0.3310096393771688, + "is_interrupted": true, + "text_after_interrupt": "here on the western line, so we should plan our route accordingly and maybe consider transferring at the next major station to save some time." + }, + { + "speaker": "A", + "text": "Wait, did you say Wukesong? I just realized I might have confused it with another stop. Are we sure that's where we need to go?", + "original_text": "Wait, did you say Wukesong? I just realized I might have confused it with another stop. Are we sure that's where we need to go?", + "start_time": 5.9618486416447425, + "end_time": 13.577993766361296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_2_A.wav", + "silence_duration": 0.5399901584081276, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, Wukesong is correct. But I was going to say it's quite a few stops from here. Let's buy some tickets.", + "original_text": "Yes, Wukesong is correct. But I was going to say it's quite a few stops from here. Let's buy some tickets.", + "start_time": 14.068294618052219, + "end_time": 20.059042917371947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_3_B.wav", + "silence_duration": 0.490300851690923, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The train is coming. There are a lot of people waiting here. Let's stand in a better position to make sure we get on quickly and find a spot to sit.", + "original_text": "The train is coming. There are a lot of people waiting here. Let's stand in a better position to make sure we get on quickly and find a spot to sit.", + "start_time": 20.649465523351967, + "end_time": 28.741619718363303, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_4_A.wav", + "silence_duration": 0.59042260598002, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I see an opening near the doors! Should we move there quickly before it gets too crowded?", + "original_text": "Oh, I see an opening near the doors! Should we move there quickly before it gets too crowded?", + "start_time": 29.174409472048886, + "end_time": 34.050599948239366, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_5_B.wav", + "silence_duration": 0.43278975368558315, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good idea. Well, it's not as crowded as we expected, is it?", + "original_text": "Good idea. Well, it's not as crowded as we expected, is it?", + "start_time": 34.48016123966447, + "end_time": 38.47399343921096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_6_A.wav", + "silence_duration": 0.429561291425099, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, but it will be soon. Look, there're two empty seats over there. Let's get them before someone else does.", + "original_text": "No, but it will be soon. Look, there're two empty seats over there. Let's get them before someone else does.", + "start_time": 38.83617744417701, + "end_time": 44.46701644644458, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--305/temp/line_7_B.wav", + "silence_duration": 0.3621840049660504, + "is_interrupted": false + } + ] + }, + "DialogSum--val--307": { + "original_text": "A: Is there anything worth watching on another channel?\nB: I think there's a Western on.\nA: Do you mind if we watch it? I'd really like to [interrupt] relax with something different tonight, maybe something with a good storyline and interesting characters that we haven't seen before.\nB: Actually, I was hoping to catch the football game. Do you mind if we switch to that instead?\nA: Football game? Ok, and you know what comes on [interrupt] after the game? I was thinking of watching something else later, perhaps a movie or documentary that we could both enjoy together.\nB: Oh, before I forget, do you know what's on Channel 2 at 10 pm? I wanted to check if there's something interesting later.\nA: I think it's a quiz show. But I was about to ask what comes on after the football game?\nB: I believe there's a sitcom. Are you interested in watching it?\nA: Let me look in the TV Guide first.\nB: Let's watch it together.", + "cleaned_text": "A: Is there anything worth watching on another channel?\nB: I think there's a Western on.\nA:Do you mind if we watch it? I'd really like to relax with something different tonight, maybe something with a good storyline and interesting characters that we haven't seen before.\nB: Actually, I was hoping to catch the football game. Do you mind if we switch to that instead?\nA:Football game? Ok, and you know what comes on after the game? I was thinking of watching something else later, perhaps a movie or documentary that we could both enjoy together.\nB: Oh, before I forget, do you know what's on Channel 2 at 10 pm? I wanted to check if there's something interesting later.\nA: I think it's a quiz show. But I was about to ask what comes on after the football game?\nB: I believe there's a sitcom. Are you interested in watching it?\nA: Let me look in the TV Guide first.\nB: Let's watch it together.", + "total_duration": 44.364761904761906, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is there anything worth watching on another channel?", + "original_text": "Is there anything worth watching on another channel?", + "start_time": 0, + "end_time": 2.5774149659863945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think there's a Western on.", + "original_text": "I think there's a Western on.", + "start_time": 3.054593291299938, + "end_time": 4.749649980642342, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_1_B.wav", + "silence_duration": 0.4771783253135435, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you mind if we watch it? I'd really like to", + "original_text": "Do you mind if we watch it? I'd really like to [interrupt] relax with something different tonight, maybe something with a good storyline and interesting characters that we haven't seen before.", + "start_time": 5.2330465717142784, + "end_time": 14.892547705501126, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_2_A.wav", + "silence_duration": 0.4833965910719362, + "is_interrupted": true, + "text_after_interrupt": "relax with something different tonight, maybe something with a good storyline and interesting characters that we haven't seen before." + }, + { + "speaker": "B", + "text": "Actually, I was hoping to catch the football game. Do you mind if we switch to that instead?", + "original_text": "Actually, I was hoping to catch the football game. Do you mind if we switch to that instead?", + "start_time": 8.367740449265298, + "end_time": 12.837581719106568, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_3_B.wav", + "silence_duration": 0.4358969073228833, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Football game? Ok, and you know what comes on", + "original_text": "Football game? Ok, and you know what comes on [interrupt] after the game? I was thinking of watching something else later, perhaps a movie or documentary that we could both enjoy together.", + "start_time": 15.434265988411621, + "end_time": 26.243154877300512, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_4_A.wav", + "silence_duration": 0.5417182829104946, + "is_interrupted": true, + "text_after_interrupt": "after the game? I was thinking of watching something else later, perhaps a movie or documentary that we could both enjoy together." + }, + { + "speaker": "B", + "text": "Oh, before I forget, do you know what's on Channel 2 at 10 pm? I wanted to check if there's something interesting later.", + "original_text": "Oh, before I forget, do you know what's on Channel 2 at 10 pm? I wanted to check if there's something interesting later.", + "start_time": 23.118714327858154, + "end_time": 30.270460359604186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_5_B.wav", + "silence_duration": 0.40970414007532574, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think it's a quiz show. But I was about to ask what comes on after the football game?", + "original_text": "I think it's a quiz show. But I was about to ask what comes on after the football game?", + "start_time": 30.78660174233862, + "end_time": 35.802111946420254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_6_A.wav", + "silence_duration": 0.516141382734431, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I believe there's a sitcom. Are you interested in watching it?", + "original_text": "I believe there's a sitcom. Are you interested in watching it?", + "start_time": 36.11022170807779, + "end_time": 40.080833952975745, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_7_B.wav", + "silence_duration": 0.3081097616575366, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let me look in the TV Guide first.", + "original_text": "Let me look in the TV Guide first.", + "start_time": 40.51104337872174, + "end_time": 42.60083929708908, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_8_A.wav", + "silence_duration": 0.43020942574599286, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let's watch it together.", + "original_text": "Let's watch it together.", + "start_time": 43.1457442235612, + "end_time": 44.364791842608824, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--307/temp/line_9_B.wav", + "silence_duration": 0.5449049264721204, + "is_interrupted": false + } + ] + }, + "DialogSum--val--308": { + "original_text": "A: How long will you stay in New York? \nB: Just for three days. I won't need these luggages. Could I put them [interrupt] in storage here at the airport while I'm in New York? I've heard some airports offer convenient short-term storage solutions for travelers in similar situations. \nA: Sorry to interrupt. Just to clarify, are you asking if you can store your luggage here at the airport? \nB: Yes, exactly. I was wondering if I could put them here since I won't need them in New York. \nA: I understand, but if you have more than 24 hours between connecting flights, we can't check your luggage through London. \nB: Oh, I see. In that case, maybe I can put them in the airport storage there. \nA: That could work. By the way, you mentioned not needing the luggage in New York, but did you have any other specific plans for your stay?", + "cleaned_text": "A: How long will you stay in New York? \nB:Just for three days. I won't need these luggages. Could I put them in storage here at the airport while I'm in New York? I've heard some airports offer convenient short-term storage solutions for travelers in similar situations.\nA: Sorry to interrupt. Just to clarify, are you asking if you can store your luggage here at the airport? \nB: Yes, exactly. I was wondering if I could put them here since I won't need them in New York. \nA: I understand, but if you have more than 24 hours between connecting flights, we can't check your luggage through London. \nB: Oh, I see. In that case, maybe I can put them in the airport storage there. \nA: That could work. By the way, you mentioned not needing the luggage in New York, but did you have any other specific plans for your stay?", + "total_duration": 39.09510204081633, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How long will you stay in New York?", + "original_text": "How long will you stay in New York?", + "start_time": 0, + "end_time": 1.7763265306122449, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just for three days. I won't need these luggages. Could I put them", + "original_text": "Just for three days. I won't need these luggages. Could I put them [interrupt] in storage here at the airport while I'm in New York? I've heard some airports offer convenient short-term storage solutions for travelers in similar situations.", + "start_time": 2.3433076934296038, + "end_time": 13.802355312477221, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/temp/line_1_B.wav", + "silence_duration": 0.5669811628173591, + "is_interrupted": true, + "text_after_interrupt": "in storage here at the airport while I'm in New York? I've heard some airports offer convenient short-term storage solutions for travelers in similar situations." + }, + { + "speaker": "A", + "text": "Sorry to interrupt. Just to clarify, are you asking if you can store your luggage here at the airport?", + "original_text": "Sorry to interrupt. Just to clarify, are you asking if you can store your luggage here at the airport?", + "start_time": 5.582491366898992, + "end_time": 12.281448282998765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/temp/line_2_A.wav", + "silence_duration": 0.40847689381023033, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, exactly. I was wondering if I could put them here since I won't need them in New York.", + "original_text": "Yes, exactly. I was wondering if I could put them here since I won't need them in New York.", + "start_time": 14.341492702270227, + "end_time": 18.660404266896077, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/temp/line_3_B.wav", + "silence_duration": 0.5391373897930051, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I understand, but if you have more than 24 hours between connecting flights, we can't check your luggage through London.", + "original_text": "I understand, but if you have more than 24 hours between connecting flights, we can't check your luggage through London.", + "start_time": 19.221985562434874, + "end_time": 26.617541117990427, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/temp/line_4_A.wav", + "silence_duration": 0.5615812955387964, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I see. In that case, maybe I can put them in the airport storage there.", + "original_text": "Oh, I see. In that case, maybe I can put them in the airport storage there.", + "start_time": 27.13310996099454, + "end_time": 31.068892273919708, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/temp/line_5_B.wav", + "silence_duration": 0.5155688430041112, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That could work. By the way, you mentioned not needing the luggage in New York, but did you have any other specific plans for your stay?", + "original_text": "That could work. By the way, you mentioned not needing the luggage in New York, but did you have any other specific plans for your stay?", + "start_time": 31.664726381303982, + "end_time": 39.095111868832326, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--308/temp/line_6_A.wav", + "silence_duration": 0.5958341073842739, + "is_interrupted": false + } + ] + }, + "DialogSum--val--309": { + "original_text": "A: Do you have spare time tonight? \nB: What's the matter? \nA: There will be a live show of football tonight featuring two of the most legendary teams in European football history [interrupt] and I thought it would be more fun to watch it together rather than alone. \nB: What teams are playing? Is it a big match or just a regular one? \nA: Sorry, I just remembered, do you prefer watching it at your place or mine? \nB: Hmm, good question. Let's watch at your place. But you were saying, which teams are playing? \nA: Oh right, it's AC Milan versus Real Madrid in what promises to be an electrifying Champions League quarterfinal match. \nB: That will be a tough match, right? Both teams have been in great form lately and their head-to-head record is always fascinating to analyze. \nA: Absolutely. \nB: What are we waiting for? It's already 7 pm now. Let's buy some drinks and desserts now before the match starts at 8.", + "cleaned_text": "A: Do you have spare time tonight? \nB: What's the matter? \nA:There will be a live show of football tonight featuring two of the most legendary teams in European football history and I thought it would be more fun to watch it together rather than alone.\nB: What teams are playing? Is it a big match or just a regular one? \nA: Sorry, I just remembered, do you prefer watching it at your place or mine? \nB: Hmm, good question. Let's watch at your place. But you were saying, which teams are playing? \nA: Oh right, it's AC Milan versus Real Madrid in what promises to be an electrifying Champions League quarterfinal match. \nB: That will be a tough match, right? Both teams have been in great form lately and their head-to-head record is always fascinating to analyze. \nA: Absolutely. \nB: What are we waiting for? It's already 7 pm now. Let's buy some drinks and desserts now before the match starts at 8.", + "total_duration": 47.5707029478458, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you have spare time tonight?", + "original_text": "Do you have spare time tonight?", + "start_time": 0, + "end_time": 1.811156462585034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What's the matter?", + "original_text": "What's the matter?", + "start_time": 2.244581937902626, + "end_time": 2.9992304639797234, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_1_B.wav", + "silence_duration": 0.43342547531759174, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There will be a live show of football tonight featuring two of the most legendary teams in European football history", + "original_text": "There will be a live show of football tonight featuring two of the most legendary teams in European football history [interrupt] and I thought it would be more fun to watch it together rather than alone.", + "start_time": 3.4540930092433237, + "end_time": 13.229693916272801, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_2_A.wav", + "silence_duration": 0.45486254526360015, + "is_interrupted": true, + "text_after_interrupt": "and I thought it would be more fun to watch it together rather than alone." + }, + { + "speaker": "B", + "text": "What teams are playing? Is it a big match or just a regular one?", + "original_text": "What teams are playing? Is it a big match or just a regular one?", + "start_time": 9.769920673642417, + "end_time": 13.36901364416396, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_3_B.wav", + "silence_duration": 0.5247083971203307, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, I just remembered, do you prefer watching it at your place or mine?", + "original_text": "Sorry, I just remembered, do you prefer watching it at your place or mine?", + "start_time": 13.686958296323459, + "end_time": 18.342559203352938, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_4_A.wav", + "silence_duration": 0.31794465215949863, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hmm, good question. Let's watch at your place. But you were saying, which teams are playing?", + "original_text": "Hmm, good question. Let's watch at your place. But you were saying, which teams are playing?", + "start_time": 18.813170642630805, + "end_time": 24.14215023446754, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_5_B.wav", + "silence_duration": 0.4706114392778675, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh right, it's AC Milan versus Real Madrid in what promises to be an electrifying Champions League quarterfinal match.", + "original_text": "Oh right, it's AC Milan versus Real Madrid in what promises to be an electrifying Champions League quarterfinal match.", + "start_time": 24.718465006395903, + "end_time": 31.47547180911699, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_6_A.wav", + "silence_duration": 0.5763147719283631, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That will be a tough match, right? Both teams have been in great form lately and their head-to-head record is always fascinating to analyze.", + "original_text": "That will be a tough match, right? Both teams have been in great form lately and their head-to-head record is always fascinating to analyze.", + "start_time": 32.044777283452405, + "end_time": 38.999153700685966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_7_B.wav", + "silence_duration": 0.5693054743354186, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely.", + "original_text": "Absolutely.", + "start_time": 39.57612370633142, + "end_time": 40.60941168819083, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_8_A.wav", + "silence_duration": 0.5769700056454543, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What are we waiting for? It's already 7 pm now. Let's buy some drinks and desserts now before the match starts at 8.", + "original_text": "What are we waiting for? It's already 7 pm now. Let's buy some drinks and desserts now before the match starts at 8.", + "start_time": 41.08074699881303, + "end_time": 47.570724323076064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--309/temp/line_9_B.wav", + "silence_duration": 0.4713353106221932, + "is_interrupted": false + } + ] + }, + "DialogSum--val--310": { + "original_text": "A: I would love to rent this apartment. \nB: I'm happy to hear you say that. \nA: How much are you asking for every month? \nB: I'm renting this apartment out for $1050 a month. \nA: That is quite a lot of money for just one [interrupt] bedroom, especially considering my current budget constraints and the fact that similar apartments in the neighborhood are going for significantly less. \nB: Sorry to jump in, but considering the amenities and the location, I think $1050 is quite reasonable. \nA: I understand that, but what do you say to $850 a month? \nB: That's no good. \nA: It's either $850 or nothing at this point, as I have other options to consider. \nB: I see where you're coming from, but I really can't go any lower than $1050. \nA: Could you please go lower? \nB: That's the best I can do.", + "cleaned_text": "A: I would love to rent this apartment. \nB: I'm happy to hear you say that. \nA: How much are you asking for every month? \nB: I'm renting this apartment out for $1050 a month. \nA:That is quite a lot of money for just one bedroom, especially considering my current budget constraints and the fact that similar apartments in the neighborhood are going for significantly less.\nB: Sorry to jump in, but considering the amenities and the location, I think $1050 is quite reasonable. \nA: I understand that, but what do you say to $850 a month? \nB: That's no good. \nA: It's either $850 or nothing at this point, as I have other options to consider. \nB: I see where you're coming from, but I really can't go any lower than $1050. \nA: Could you please go lower? \nB: That's the best I can do.", + "total_duration": 43.11800453514739, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I would love to rent this apartment.", + "original_text": "I would love to rent this apartment.", + "start_time": 0, + "end_time": 1.9736961451247166, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm happy to hear you say that.", + "original_text": "I'm happy to hear you say that.", + "start_time": 2.477803278301052, + "end_time": 4.126420058346404, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_1_B.wav", + "silence_duration": 0.5041071331763357, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How much are you asking for every month?", + "original_text": "How much are you asking for every month?", + "start_time": 4.588498207677512, + "end_time": 6.562194352802228, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_2_A.wav", + "silence_duration": 0.46207814933110813, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm renting this apartment out for $1050 a month.", + "original_text": "I'm renting this apartment out for $1050 a month.", + "start_time": 6.958754442925389, + "end_time": 10.697167141338088, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_3_B.wav", + "silence_duration": 0.3965600901231607, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That is quite a lot of money for just one", + "original_text": "That is quite a lot of money for just one [interrupt] bedroom, especially considering my current budget constraints and the fact that similar apartments in the neighborhood are going for significantly less.", + "start_time": 11.071181119822116, + "end_time": 21.961339849980845, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_4_A.wav", + "silence_duration": 0.374013978484028, + "is_interrupted": true, + "text_after_interrupt": "bedroom, especially considering my current budget constraints and the fact that similar apartments in the neighborhood are going for significantly less." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but considering the amenities and the location, I think $1050 is quite reasonable.", + "original_text": "Sorry to jump in, but considering the amenities and the location, I think $1050 is quite reasonable.", + "start_time": 13.439616493971776, + "end_time": 19.999253682180395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_5_B.wav", + "silence_duration": 0.5437263577358513, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I understand that, but what do you say to $850 a month?", + "original_text": "I understand that, but what do you say to $850 a month?", + "start_time": 22.47379135950603, + "end_time": 26.79270292413188, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_6_A.wav", + "silence_duration": 0.5124515095251849, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's no good.", + "original_text": "That's no good.", + "start_time": 27.27661861040242, + "end_time": 28.170586864370673, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_7_B.wav", + "silence_duration": 0.4839156862705402, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's either $850 or nothing at this point, as I have other options to consider.", + "original_text": "It's either $850 or nothing at this point, as I have other options to consider.", + "start_time": 28.522000243404694, + "end_time": 34.47791861075163, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_8_A.wav", + "silence_duration": 0.3514133790340219, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see where you're coming from, but I really can't go any lower than $1050.", + "original_text": "I see where you're coming from, but I really can't go any lower than $1050.", + "start_time": 35.06465571054117, + "end_time": 39.638986776300804, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_9_B.wav", + "silence_duration": 0.5867370997895354, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Could you please go lower?", + "original_text": "Could you please go lower?", + "start_time": 40.08121925982679, + "end_time": 41.439586606765566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_10_A.wav", + "silence_duration": 0.44223248352598504, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's the best I can do.", + "original_text": "That's the best I can do.", + "start_time": 41.78288154872557, + "end_time": 43.11802894101582, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--310/temp/line_11_B.wav", + "silence_duration": 0.3432949419600041, + "is_interrupted": false + } + ] + }, + "DialogSum--val--313": { + "original_text": "A: Hi! Wang Mei. Come and have a look at my new dress. \nB: Oh! What a beautiful dress! It fits you so well. You look so charming in the [interrupt] color, it really complements your complexion and brings out the warmth in your features, especially under natural lighting. \nA: Thanks! I really appreciate it. But I was curious, where did you get your dress from last week? I loved the design. \nB: Oh, that one? I got it online. But speaking of where I bought mine, where did you get this one? \nA: I bought it in a store near my school. \nB: How much is it? \nA: It's only thirty yuan. \nB: It's so cheap. I'll buy one, too. By the way, you didn't finish telling me what you were saying about how the dress fits me earlier. \nA: Oh, right! I was saying it fits you so well and makes you look really charming.", + "cleaned_text": "A: Hi! Wang Mei. Come and have a look at my new dress. \nB:Oh! What a beautiful dress! It fits you so well. You look so charming in the color, it really complements your complexion and brings out the warmth in your features, especially under natural lighting.\nA: Thanks! I really appreciate it. But I was curious, where did you get your dress from last week? I loved the design. \nB: Oh, that one? I got it online. But speaking of where I bought mine, where did you get this one? \nA: I bought it in a store near my school. \nB: How much is it? \nA: It's only thirty yuan. \nB: It's so cheap. I'll buy one, too. By the way, you didn't finish telling me what you were saying about how the dress fits me earlier. \nA: Oh, right! I was saying it fits you so well and makes you look really charming.", + "total_duration": 39.599002267573695, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi! Wang Mei. Come and have a look at my new dress.", + "original_text": "Hi! Wang Mei. Come and have a look at my new dress.", + "start_time": 0, + "end_time": 3.889342403628118, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh! What a beautiful dress! It fits you so well. You look so charming in the", + "original_text": "Oh! What a beautiful dress! It fits you so well. You look so charming in the [interrupt] color, it really complements your complexion and brings out the warmth in your features, especially under natural lighting.", + "start_time": 4.407936530240185, + "end_time": 14.601496620943132, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_1_B.wav", + "silence_duration": 0.5185941266120677, + "is_interrupted": true, + "text_after_interrupt": "color, it really complements your complexion and brings out the warmth in your features, especially under natural lighting." + }, + { + "speaker": "A", + "text": "Thanks! I really appreciate it. But I was curious, where did you get your dress from last week? I loved the design.", + "original_text": "Thanks! I really appreciate it. But I was curious, where did you get your dress from last week? I loved the design.", + "start_time": 8.506258525705038, + "end_time": 16.517142879446535, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_2_A.wav", + "silence_duration": 0.4328317310167902, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, that one? I got it online. But speaking of where I bought mine, where did you get this one?", + "original_text": "Oh, that one? I got it online. But speaking of where I bought mine, where did you get this one?", + "start_time": 16.924820333042383, + "end_time": 21.475931444153495, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_3_B.wav", + "silence_duration": 0.40767745359584967, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I bought it in a store near my school.", + "original_text": "I bought it in a store near my school.", + "start_time": 21.80077074028988, + "end_time": 23.960226522602806, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_4_A.wav", + "silence_duration": 0.32483929613638685, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How much is it?", + "original_text": "How much is it?", + "start_time": 24.521397191028115, + "end_time": 25.38053551302358, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_5_B.wav", + "silence_duration": 0.561170668425309, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's only thirty yuan.", + "original_text": "It's only thirty yuan.", + "start_time": 25.836659773622856, + "end_time": 27.206637097885896, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_6_A.wav", + "silence_duration": 0.45612426059927563, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's so cheap. I'll buy one, too. By the way, you didn't finish telling me what you were saying about how the dress fits me earlier.", + "original_text": "It's so cheap. I'll buy one, too. By the way, you didn't finish telling me what you were saying about how the dress fits me earlier.", + "start_time": 27.531493708528153, + "end_time": 34.24206060195219, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_7_B.wav", + "silence_duration": 0.3248566106422558, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right! I was saying it fits you so well and makes you look really charming.", + "original_text": "Oh, right! I was saying it fits you so well and makes you look really charming.", + "start_time": 34.72284723667025, + "end_time": 39.59903771286072, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--313/temp/line_8_A.wav", + "silence_duration": 0.4807866347180559, + "is_interrupted": false + } + ] + }, + "DialogSum--val--314": { + "original_text": "A: Will you be done doing my hair soon? \nB: Give me a little while [interrupt] I'm almost finished with the last section and just need to add some final touches to make sure everything looks perfectly blended and polished. \nA: Sorry, I just want to make sure I'm not running late. How much longer do you think it'll take? \nB: It should be just a few more minutes. There you go. How do you like it? \nA: I think it looks gorgeous. \nB: You think it looks as good as you imagined? \nA: Oh, absolutely. I honestly think it looks great. By the way, how much is it for my hair? \nB: Just give me $55. \nA: Thanks for doing such a good job. \nB: No problem, girlfriend. I'll see you next time.", + "cleaned_text": "A: Will you be done doing my hair soon? \nB:Give me a little while I'm almost finished with the last section and just need to add some final touches to make sure everything looks perfectly blended and polished.\nA: Sorry, I just want to make sure I'm not running late. How much longer do you think it'll take? \nB: It should be just a few more minutes. There you go. How do you like it? \nA: I think it looks gorgeous. \nB: You think it looks as good as you imagined? \nA: Oh, absolutely. I honestly think it looks great. By the way, how much is it for my hair? \nB: Just give me $55. \nA: Thanks for doing such a good job. \nB: No problem, girlfriend. I'll see you next time.", + "total_duration": 31.344489795918367, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Will you be done doing my hair soon?", + "original_text": "Will you be done doing my hair soon?", + "start_time": 0, + "end_time": 1.8692063492063493, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Give me a little while", + "original_text": "Give me a little while [interrupt] I'm almost finished with the last section and just need to add some final touches to make sure everything looks perfectly blended and polished.", + "start_time": 2.3777682786499836, + "end_time": 9.808153766178329, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_1_B.wav", + "silence_duration": 0.5085619294436345, + "is_interrupted": true, + "text_after_interrupt": "I'm almost finished with the last section and just need to add some final touches to make sure everything looks perfectly blended and polished." + }, + { + "speaker": "A", + "text": "Sorry, I just want to make sure I'm not running late. How much longer do you think it'll take?", + "original_text": "Sorry, I just want to make sure I'm not running late. How much longer do you think it'll take?", + "start_time": 3.492326101779235, + "end_time": 9.401804559829122, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_2_A.wav", + "silence_duration": 0.3494970874049326, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It should be just a few more minutes. There you go. How do you like it?", + "original_text": "It should be just a few more minutes. There you go. How do you like it?", + "start_time": 10.405699356842838, + "end_time": 13.679712962285015, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_3_B.wav", + "silence_duration": 0.5975455906645086, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think it looks gorgeous.", + "original_text": "I think it looks gorgeous.", + "start_time": 14.235875883814364, + "end_time": 15.8264427772384, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_4_A.wav", + "silence_duration": 0.5561629215293489, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You think it looks as good as you imagined?", + "original_text": "You think it looks as good as you imagined?", + "start_time": 16.228215981871124, + "end_time": 18.097422331077475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_5_B.wav", + "silence_duration": 0.4017732046327253, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, absolutely. I honestly think it looks great. By the way, how much is it for my hair?", + "original_text": "Oh, absolutely. I honestly think it looks great. By the way, how much is it for my hair?", + "start_time": 18.507049331987606, + "end_time": 24.079838447633865, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_6_A.wav", + "silence_duration": 0.40962700091012977, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just give me $55.", + "original_text": "Just give me $55.", + "start_time": 24.565775456666234, + "end_time": 26.202782259387323, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_7_B.wav", + "silence_duration": 0.4859370090323706, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks for doing such a good job.", + "original_text": "Thanks for doing such a good job.", + "start_time": 26.53031433065129, + "end_time": 28.399520679857638, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_8_A.wav", + "silence_duration": 0.3275320712639685, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem, girlfriend. I'll see you next time.", + "original_text": "No problem, girlfriend. I'll see you next time.", + "start_time": 28.952874567843455, + "end_time": 31.344529896641642, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--314/temp/line_9_B.wav", + "silence_duration": 0.5533538879858168, + "is_interrupted": false + } + ] + }, + "DialogSum--val--315": { + "original_text": "A: Ahh... What a fine day! I do feel like an outdoor exercise. How about taking a walk in the park?\nB: OK. It's delightful to have a walk in the park with the air so fresh.\nA: Oh, it's so quiet here. We have the park to ourselves, only you and [interrupt] the sound of the birds chirping in the trees creating such a peaceful atmosphere that makes me forget all my worries and stresses from work.\nB: Sorry to cut in, but did you notice that group of people on our left?\nA: Oh, I see them. Some are doing Taijiquan, some are performing swordplay, some are practising the Chinese Wushu. But I was saying, it's nice to have the park almost to ourselves.", + "cleaned_text": "A: Ahh... What a fine day! I do feel like an outdoor exercise. How about taking a walk in the park?\nB: OK. It's delightful to have a walk in the park with the air so fresh.\nA:Oh, it's so quiet here. We have the park to ourselves, only you and the sound of the birds chirping in the trees creating such a peaceful atmosphere that makes me forget all my worries and stresses from work.\nB: Sorry to cut in, but did you notice that group of people on our left?\nA: Oh, I see them. Some are doing Taijiquan, some are performing swordplay, some are practising the Chinese Wushu. But I was saying, it's nice to have the park almost to ourselves.", + "total_duration": 35.749977324263035, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Ahh... What a fine day! I do feel like an outdoor exercise. How about taking a walk in the park?", + "original_text": "Ahh... What a fine day! I do feel like an outdoor exercise. How about taking a walk in the park?", + "start_time": 0, + "end_time": 6.594467120181406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. It's delightful to have a walk in the park with the air so fresh.", + "original_text": "OK. It's delightful to have a walk in the park with the air so fresh.", + "start_time": 6.916009577050043, + "end_time": 10.944671708569317, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/temp/line_1_B.wav", + "silence_duration": 0.32154245686863725, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, it's so quiet here. We have the park to ourselves, only you and", + "original_text": "Oh, it's so quiet here. We have the park to ourselves, only you and [interrupt] the sound of the birds chirping in the trees creating such a peaceful atmosphere that makes me forget all my worries and stresses from work.", + "start_time": 11.50020740688555, + "end_time": 23.934493121171265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/temp/line_2_A.wav", + "silence_duration": 0.5555356983162341, + "is_interrupted": true, + "text_after_interrupt": "the sound of the birds chirping in the trees creating such a peaceful atmosphere that makes me forget all my worries and stresses from work." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but did you notice that group of people on our left?", + "original_text": "Sorry to cut in, but did you notice that group of people on our left?", + "start_time": 16.596987452237023, + "end_time": 19.847781103030673, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/temp/line_3_B.wav", + "silence_duration": 0.5343801511008008, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see them. Some are doing Taijiquan, some are performing swordplay, some are practising the Chinese Wushu. But I was saying, it's nice to have the park almost to ourselves.", + "original_text": "Oh, I see them. Some are doing Taijiquan, some are performing swordplay, some are practising the Chinese Wushu. But I was saying, it's nice to have the park almost to ourselves.", + "start_time": 24.279356690569223, + "end_time": 35.75001428694111, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--315/temp/line_4_A.wav", + "silence_duration": 0.34486356939795987, + "is_interrupted": false + } + ] + }, + "DialogSum--val--316": { + "original_text": "A: Are you studying here? \nB: Yes, I am studying in Eastern Asian language department. \nA: What are you majoring in? \nB: I major in Japanese. \nA: What do you think of the literature course? \nB: It's very helpful. The course has let me into a new world of literature. I read so many great [interrupt] works from authors I had never heard of before, and it really broadened my perspective on cultural differences and historical contexts that shaped these literary masterpieces. \nA: Speaking of great literature, have you had the chance to explore any classic Japanese novels yet? \nB: Yes, I have. But I was actually going to mention that I read so many great literatures from different periods and genres. \nA: That sounds fascinating! Which genre did you find most intriguing?", + "cleaned_text": "A: Are you studying here? \nB: Yes, I am studying in Eastern Asian language department. \nA: What are you majoring in? \nB: I major in Japanese. \nA: What do you think of the literature course? \nB:It's very helpful. The course has let me into a new world of literature. I read so many great works from authors I had never heard of before, and it really broadened my perspective on cultural differences and historical contexts that shaped these literary masterpieces.\nA: Speaking of great literature, have you had the chance to explore any classic Japanese novels yet? \nB: Yes, I have. But I was actually going to mention that I read so many great literatures from different periods and genres. \nA: That sounds fascinating! Which genre did you find most intriguing?", + "total_duration": 36.64621315192744, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you studying here?", + "original_text": "Are you studying here?", + "start_time": 0, + "end_time": 1.3119274376417234, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I am studying in Eastern Asian language department.", + "original_text": "Yes, I am studying in Eastern Asian language department.", + "start_time": 1.7102156457826811, + "end_time": 5.204818820385856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_1_B.wav", + "silence_duration": 0.3982882081409578, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What are you majoring in?", + "original_text": "What are you majoring in?", + "start_time": 5.7693317049059685, + "end_time": 7.243798825087374, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_2_A.wav", + "silence_duration": 0.5645128845201128, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I major in Japanese.", + "original_text": "I major in Japanese.", + "start_time": 7.631393676892201, + "end_time": 9.024590955803765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_3_B.wav", + "silence_duration": 0.38759485180482695, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What do you think of the literature course?", + "original_text": "What do you think of the literature course?", + "start_time": 9.47310327173908, + "end_time": 11.806708713915949, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_4_A.wav", + "silence_duration": 0.44851231593531404, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's very helpful. The course has let me into a new world of literature. I read so many great", + "original_text": "It's very helpful. The course has let me into a new world of literature. I read so many great [interrupt] works from authors I had never heard of before, and it really broadened my perspective on cultural differences and historical contexts that shaped these literary masterpieces.", + "start_time": 12.28747802659871, + "end_time": 25.627341972176943, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_5_B.wav", + "silence_duration": 0.4807693126827606, + "is_interrupted": true, + "text_after_interrupt": "works from authors I had never heard of before, and it really broadened my perspective on cultural differences and historical contexts that shaped these literary masterpieces." + }, + { + "speaker": "A", + "text": "Speaking of great literature, have you had the chance to explore any classic Japanese novels yet?", + "original_text": "Speaking of great literature, have you had the chance to explore any classic Japanese novels yet?", + "start_time": 17.662897527732497, + "end_time": 23.433056257891227, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_6_A.wav", + "silence_duration": 0.4011548163531782, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I have. But I was actually going to mention that I read so many great literatures from different periods and genres.", + "original_text": "Yes, I have. But I was actually going to mention that I read so many great literatures from different periods and genres.", + "start_time": 26.166543800456147, + "end_time": 32.064412281181774, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_7_B.wav", + "silence_duration": 0.5392018282792038, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds fascinating! Which genre did you find most intriguing?", + "original_text": "That sounds fascinating! Which genre did you find most intriguing?", + "start_time": 32.61756347211604, + "end_time": 36.646225603635315, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--316/temp/line_8_A.wav", + "silence_duration": 0.5531511909342637, + "is_interrupted": false + } + ] + }, + "DialogSum--val--317": { + "original_text": "A: I'm so excited! We have two weeks off! What are you going to [interrupt] do with all that free time? I was thinking we could plan something fun together if you're interested in hanging out during the break.\nB: Sorry to jump in, but I just realized—do you know if we'll have any assignments due right after the break? I don't want to be caught off guard. \nA: Oh, good point! I think we might have a report due, but I'll double-check that. Anyway, I was saying I might just stay at home and catch up on my reading. What about you? Any plans? \nB: Well, my parents have rented a condominium in Florida. I'm going to take long walks along the beach every day and do lots of [interrupt] relaxing and maybe even some snorkeling, especially since the water is supposed to be crystal clear this time of year with perfect visibility for marine life.\nA: Wait, did you say Florida? That sounds amazing! Are you going to visit any specific places there, like Disney World? \nB: I hadn't thought about that yet, but mostly I'm just looking forward to the beach and swimming. By the way, I was going to say, why don't you come with us? We have plenty of room. \nA: Do you mean it? I'd love to!", + "cleaned_text": "A:I'm so excited! We have two weeks off! What are you going to do with all that free time? I was thinking we could plan something fun together if you're interested in hanging out during the break.\nB: Sorry to jump in, but I just realized—do you know if we'll have any assignments due right after the break? I don't want to be caught off guard. \nA: Oh, good point! I think we might have a report due, but I'll double-check that. Anyway, I was saying I might just stay at home and catch up on my reading. What about you? Any plans? \nB:Well, my parents have rented a condominium in Florida. I'm going to take long walks along the beach every day and do lots of relaxing and maybe even some snorkeling, especially since the water is supposed to be crystal clear this time of year with perfect visibility for marine life.\nA: Wait, did you say Florida? That sounds amazing! Are you going to visit any specific places there, like Disney World? \nB: I hadn't thought about that yet, but mostly I'm just looking forward to the beach and swimming. By the way, I was going to say, why don't you come with us? We have plenty of room. \nA: Do you mean it? I'd love to!", + "total_duration": 55.4043537414966, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm so excited! We have two weeks off! What are you going to", + "original_text": "I'm so excited! We have two weeks off! What are you going to [interrupt] do with all that free time? I was thinking we could plan something fun together if you're interested in hanging out during the break.", + "start_time": 0, + "end_time": 10.599909297052154, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "do with all that free time? I was thinking we could plan something fun together if you're interested in hanging out during the break." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but I just realized—do you know if we'll have any assignments due right after the break? I don't want to be caught off guard.", + "original_text": "Sorry to jump in, but I just realized—do you know if we'll have any assignments due right after the break? I don't want to be caught off guard.", + "start_time": 4.435011337868481, + "end_time": 10.890158730158731, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/temp/line_1_B.wav", + "silence_duration": 0.47902415336668613, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, good point! I think we might have a report due, but I'll double-check that. Anyway, I was saying I might just stay at home and catch up on my reading. What about you? Any plans?", + "original_text": "Oh, good point! I think we might have a report due, but I'll double-check that. Anyway, I was saying I might just stay at home and catch up on my reading. What about you? Any plans?", + "start_time": 11.478225745431978, + "end_time": 22.287114634320865, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/temp/line_2_A.wav", + "silence_duration": 0.5880670152732461, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, my parents have rented a condominium in Florida. I'm going to take long walks along the beach every day and do lots of", + "original_text": "Well, my parents have rented a condominium in Florida. I'm going to take long walks along the beach every day and do lots of [interrupt] relaxing and maybe even some snorkeling, especially since the water is supposed to be crystal clear this time of year with perfect visibility for marine life.", + "start_time": 22.855957663790477, + "end_time": 37.3916492737678, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/temp/line_3_B.wav", + "silence_duration": 0.5688430294696107, + "is_interrupted": true, + "text_after_interrupt": "relaxing and maybe even some snorkeling, especially since the water is supposed to be crystal clear this time of year with perfect visibility for marine life." + }, + { + "speaker": "A", + "text": "Wait, did you say Florida? That sounds amazing! Are you going to visit any specific places there, like Disney World?", + "original_text": "Wait, did you say Florida? That sounds amazing! Are you going to visit any specific places there, like Disney World?", + "start_time": 35.97059299190654, + "end_time": 43.94664741367525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/temp/line_4_A.wav", + "silence_duration": 0.5423028981898519, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I hadn't thought about that yet, but mostly I'm just looking forward to the beach and swimming. By the way, I was going to say, why don't you come with us? We have plenty of room.", + "original_text": "I hadn't thought about that yet, but mostly I'm just looking forward to the beach and swimming. By the way, I was going to say, why don't you come with us? We have plenty of room.", + "start_time": 44.50377025656876, + "end_time": 52.83973397538962, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/temp/line_5_B.wav", + "silence_duration": 0.5571228428935063, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you mean it? I'd love to!", + "original_text": "Do you mean it? I'd love to!", + "start_time": 53.23329184888288, + "end_time": 55.404357608520066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--317/temp/line_6_A.wav", + "silence_duration": 0.3935578734932601, + "is_interrupted": false + } + ] + }, + "DialogSum--val--318": { + "original_text": "A: Hi, come on in. Can I take your coat? \nB: Sure, thanks. I brought you a bottle of wine as well. \nA: You're the first guest to arrive. I'll just put your coat away and then I'll get you something to [interrupt] drink. Maybe a glass of wine to start? I've got a nice selection of beverages prepared for the evening, including some craft cocktails if you're feeling adventurous. \nB: Oh, should I take my shoes off? \nA: Whatever you prefer. Would you like a drink? \nB: This is a very nice place. How long have you been living here now? \nA: Just over three weeks. I was just about to ask—what do you want to drink? \nB: Sure, what do you have? \nA: I've got white wine, red wine, gin and tonics, ginger ale, lemonade, orange juice, and sprite. \nB: I'll have a glass of red wine please. \nA: One glass of red wine coming up! \nB: So how many people are coming for the dinner tonight?", + "cleaned_text": "A: Hi, come on in. Can I take your coat? \nB: Sure, thanks. I brought you a bottle of wine as well. \nA:You're the first guest to arrive. I'll just put your coat away and then I'll get you something to drink. Maybe a glass of wine to start? I've got a nice selection of beverages prepared for the evening, including some craft cocktails if you're feeling adventurous.\nB: Oh, should I take my shoes off? \nA: Whatever you prefer. Would you like a drink? \nB: This is a very nice place. How long have you been living here now? \nA: Just over three weeks. I was just about to ask—what do you want to drink? \nB: Sure, what do you have? \nA: I've got white wine, red wine, gin and tonics, ginger ale, lemonade, orange juice, and sprite. \nB: I'll have a glass of red wine please. \nA: One glass of red wine coming up! \nB: So how many people are coming for the dinner tonight?", + "total_duration": 50.56458049886621, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, come on in. Can I take your coat?", + "original_text": "Hi, come on in. Can I take your coat?", + "start_time": 0, + "end_time": 2.716734693877551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, thanks. I brought you a bottle of wine as well.", + "original_text": "Sure, thanks. I brought you a bottle of wine as well.", + "start_time": 3.2474732140333717, + "end_time": 5.882938066641081, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_1_B.wav", + "silence_duration": 0.5307385201558206, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're the first guest to arrive. I'll just put your coat away and then I'll get you something to", + "original_text": "You're the first guest to arrive. I'll just put your coat away and then I'll get you something to [interrupt] drink. Maybe a glass of wine to start? I've got a nice selection of beverages prepared for the evening, including some craft cocktails if you're feeling adventurous.", + "start_time": 6.434061822051338, + "end_time": 21.585082230214603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_2_A.wav", + "silence_duration": 0.5511237554102568, + "is_interrupted": true, + "text_after_interrupt": "drink. Maybe a glass of wine to start? I've got a nice selection of beverages prepared for the evening, including some craft cocktails if you're feeling adventurous." + }, + { + "speaker": "B", + "text": "Oh, should I take my shoes off?", + "original_text": "Oh, should I take my shoes off?", + "start_time": 12.366760234749751, + "end_time": 14.2359665839561, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_3_B.wav", + "silence_duration": 0.3167684906455701, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Whatever you prefer. Would you like a drink?", + "original_text": "Whatever you prefer. Would you like a drink?", + "start_time": 21.911945498144448, + "end_time": 24.651900146670524, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_4_A.wav", + "silence_duration": 0.3268632679298462, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "This is a very nice place. How long have you been living here now?", + "original_text": "This is a very nice place. How long have you been living here now?", + "start_time": 25.18310242056495, + "end_time": 28.53838586727697, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_5_B.wav", + "silence_duration": 0.531202273894424, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Just over three weeks. I was just about to ask—what do you want to drink?", + "original_text": "Just over three weeks. I was just about to ask—what do you want to drink?", + "start_time": 29.0513669343328, + "end_time": 34.229416820954114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_6_A.wav", + "silence_duration": 0.5129810670558315, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, what do you have?", + "original_text": "Sure, what do you have?", + "start_time": 34.68623252370048, + "end_time": 35.91689012007237, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_7_B.wav", + "silence_duration": 0.4568157027463694, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I've got white wine, red wine, gin and tonics, ginger ale, lemonade, orange juice, and sprite.", + "original_text": "I've got white wine, red wine, gin and tonics, ginger ale, lemonade, orange juice, and sprite.", + "start_time": 36.51636665901034, + "end_time": 43.0295639379219, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_8_A.wav", + "silence_duration": 0.5994765389379701, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll have a glass of red wine please.", + "original_text": "I'll have a glass of red wine please.", + "start_time": 43.3935572514571, + "end_time": 45.33242346460903, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_9_B.wav", + "silence_duration": 0.36399331353520537, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "One glass of red wine coming up!", + "original_text": "One glass of red wine coming up!", + "start_time": 45.74366469001362, + "end_time": 47.74058078978686, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_10_A.wav", + "silence_duration": 0.4112412254045896, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "So how many people are coming for the dinner tonight?", + "original_text": "So how many people are coming for the dinner tonight?", + "start_time": 48.289026540760574, + "end_time": 50.56458209631613, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--318/temp/line_11_B.wav", + "silence_duration": 0.5484457509737151, + "is_interrupted": false + } + ] + }, + "DialogSum--val--319": { + "original_text": "A: I don't know about you, but I'm famished. Are you interested in getting a bite to eat?\nB: That sounds great. I'm absolutely starving! What kind of food are you in the mood for?\nA: I'd love something spicy. Maybe we could get some Sichuan Hotpot [interrupt] from that authentic restaurant downtown that uses traditional Sichuan peppercorns and has that amazing dipping sauce selection.\nB: You're a woman after my own heart. I don't know many people who can handle spicy food. Are you sure you are up for the level of heat that Sichuan Hotpot is famous for?\nA: Hotpot? Absolutely! If I could, I would eat hotpot every day!\nB: Ok, you're really all eyes when it comes to talking about food, aren't you?\nA: Well, let's stop dragging our feet and find a Sichuan Hotpot restaurant for dinner!\nB: Let me think about it for a minute. Let's see. . . oh the name of the restaurant is on the tip of my tongue, but I just can't seem to remember it right now.\nA: Wait, are you talking about that place near the China World Trade Towers on Chang An Street? Have you been there?\nB: That's it! That's the one I was thinking of! I told you I'd remember it!", + "cleaned_text": "A: I don't know about you, but I'm famished. Are you interested in getting a bite to eat?\nB: That sounds great. I'm absolutely starving! What kind of food are you in the mood for?\nA:I'd love something spicy. Maybe we could get some Sichuan Hotpot from that authentic restaurant downtown that uses traditional Sichuan peppercorns and has that amazing dipping sauce selection.\nB: You're a woman after my own heart. I don't know many people who can handle spicy food. Are you sure you are up for the level of heat that Sichuan Hotpot is famous for?\nA: Hotpot? Absolutely! If I could, I would eat hotpot every day!\nB: Ok, you're really all eyes when it comes to talking about food, aren't you?\nA: Well, let's stop dragging our feet and find a Sichuan Hotpot restaurant for dinner!\nB: Let me think about it for a minute. Let's see. . . oh the name of the restaurant is on the tip of my tongue, but I just can't seem to remember it right now.\nA: Wait, are you talking about that place near the China World Trade Towers on Chang An Street? Have you been there?\nB: That's it! That's the one I was thinking of! I told you I'd remember it!", + "total_duration": 54.5437641723356, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I don't know about you, but I'm famished. Are you interested in getting a bite to eat?", + "original_text": "I don't know about you, but I'm famished. Are you interested in getting a bite to eat?", + "start_time": 0, + "end_time": 4.85297052154195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds great. I'm absolutely starving! What kind of food are you in the mood for?", + "original_text": "That sounds great. I'm absolutely starving! What kind of food are you in the mood for?", + "start_time": 5.343115075781946, + "end_time": 9.917446141541582, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_1_B.wav", + "silence_duration": 0.49014455423999626, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'd love something spicy. Maybe we could get some Sichuan Hotpot", + "original_text": "I'd love something spicy. Maybe we could get some Sichuan Hotpot [interrupt] from that authentic restaurant downtown that uses traditional Sichuan peppercorns and has that amazing dipping sauce selection.", + "start_time": 10.430335235442483, + "end_time": 22.086752469002576, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_2_A.wav", + "silence_duration": 0.5128890939009012, + "is_interrupted": true, + "text_after_interrupt": "from that authentic restaurant downtown that uses traditional Sichuan peppercorns and has that amazing dipping sauce selection." + }, + { + "speaker": "B", + "text": "You're a woman after my own heart. I don't know many people who can handle spicy food. Are you sure you are up for the level of heat that Sichuan Hotpot is famous for?", + "original_text": "You're a woman after my own heart. I don't know many people who can handle spicy food. Are you sure you are up for the level of heat that Sichuan Hotpot is famous for?", + "start_time": 14.38933750301618, + "end_time": 23.34063002002298, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_3_B.wav", + "silence_duration": 0.552022638386326, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hotpot? Absolutely! If I could, I would eat hotpot every day!", + "original_text": "Hotpot? Absolutely! If I could, I would eat hotpot every day!", + "start_time": 23.650623180088356, + "end_time": 27.806995062174522, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_4_A.wav", + "silence_duration": 0.3099931600653752, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ok, you're really all eyes when it comes to talking about food, aren't you?", + "original_text": "Ok, you're really all eyes when it comes to talking about food, aren't you?", + "start_time": 28.12762835517013, + "end_time": 31.645451484421834, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_5_B.wav", + "silence_duration": 0.3206332929956104, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, let's stop dragging our feet and find a Sichuan Hotpot restaurant for dinner!", + "original_text": "Well, let's stop dragging our feet and find a Sichuan Hotpot restaurant for dinner!", + "start_time": 32.200806691958675, + "end_time": 36.33395861939632, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_6_A.wav", + "silence_duration": 0.555355207536843, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let me think about it for a minute. Let's see. . . oh the name of the restaurant is on the tip of my tongue, but I just can't seem to remember it right now.", + "original_text": "Let me think about it for a minute. Let's see. . . oh the name of the restaurant is on the tip of my tongue, but I just can't seem to remember it right now.", + "start_time": 36.8280550114163, + "end_time": 43.95658108851381, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_7_B.wav", + "silence_duration": 0.49409639201998423, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, are you talking about that place near the China World Trade Towers on Chang An Street? Have you been there?", + "original_text": "Wait, are you talking about that place near the China World Trade Towers on Chang An Street? Have you been there?", + "start_time": 44.32376491457226, + "end_time": 50.95306196672645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_8_A.wav", + "silence_duration": 0.36718382605845223, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's it! That's the one I was thinking of! I told you I'd remember it!", + "original_text": "That's it! That's the one I was thinking of! I told you I'd remember it!", + "start_time": 51.46712264532651, + "end_time": 54.543766636256215, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--319/temp/line_9_B.wav", + "silence_duration": 0.5140606786000637, + "is_interrupted": false + } + ] + }, + "DialogSum--val--321": { + "original_text": "A: Hello, Is this room service? \nB: Yes, May I help you? \nA: This is room 1425, we asked for the room service an hour ago. \nB: We are very sorry to cause you a lot of [interrupt] inconvenience due to the delay in service and we understand how frustrating this must be for you, especially since you've been waiting for so long already. \nA: What's the matter? Is there a specific issue that's causing the delay? \nB: We're rather busy right now. It will take another 15 minutes. \nA: Is it really going to take that long? Could you please rush the order? \nB: I'm afraid it will take 15 minutes at most. Again, we apologize for the inconvenience.", + "cleaned_text": "A: Hello, Is this room service? \nB: Yes, May I help you? \nA: This is room 1425, we asked for the room service an hour ago. \nB:We are very sorry to cause you a lot of inconvenience due to the delay in service and we understand how frustrating this must be for you, especially since you've been waiting for so long already.\nA: What's the matter? Is there a specific issue that's causing the delay? \nB: We're rather busy right now. It will take another 15 minutes. \nA: Is it really going to take that long? Could you please rush the order? \nB: I'm afraid it will take 15 minutes at most. Again, we apologize for the inconvenience.", + "total_duration": 32.13165532879819, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, Is this room service?", + "original_text": "Hello, Is this room service?", + "start_time": 0, + "end_time": 2.078185941043084, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, May I help you?", + "original_text": "Yes, May I help you?", + "start_time": 2.563907463283079, + "end_time": 3.817785014303487, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_1_B.wav", + "silence_duration": 0.4857215222399952, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "This is room 1425, we asked for the room service an hour ago.", + "original_text": "This is room 1425, we asked for the room service an hour ago.", + "start_time": 4.134156216623074, + "end_time": 8.464677758573188, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_2_A.wav", + "silence_duration": 0.31637120231958715, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We are very sorry to cause you a lot of", + "original_text": "We are very sorry to cause you a lot of [interrupt] inconvenience due to the delay in service and we understand how frustrating this must be for you, especially since you've been waiting for so long already.", + "start_time": 8.866157040560937, + "end_time": 18.23540874124121, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_3_B.wav", + "silence_duration": 0.4014792819877496, + "is_interrupted": true, + "text_after_interrupt": "inconvenience due to the delay in service and we understand how frustrating this must be for you, especially since you've been waiting for so long already." + }, + { + "speaker": "A", + "text": "What's the matter? Is there a specific issue that's causing the delay?", + "original_text": "What's the matter? Is there a specific issue that's causing the delay?", + "start_time": 11.16493255076502, + "end_time": 15.576723933984974, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_4_A.wav", + "silence_duration": 0.495136289911122, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We're rather busy right now. It will take another 15 minutes.", + "original_text": "We're rather busy right now. It will take another 15 minutes.", + "start_time": 18.55233944796214, + "end_time": 21.849573008052843, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_5_B.wav", + "silence_duration": 0.31693070672093204, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is it really going to take that long? Could you please rush the order?", + "original_text": "Is it really going to take that long? Could you please rush the order?", + "start_time": 22.21126208489649, + "end_time": 26.53017364952234, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_6_A.wav", + "silence_duration": 0.3616890768436458, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm afraid it will take 15 minutes at most. Again, we apologize for the inconvenience.", + "original_text": "I'm afraid it will take 15 minutes at most. Again, we apologize for the inconvenience.", + "start_time": 27.011670869136385, + "end_time": 32.131670869136386, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--321/temp/line_7_B.wav", + "silence_duration": 0.48149721961404357, + "is_interrupted": false + } + ] + }, + "DialogSum--val--322": { + "original_text": "A: Excuse me, sir. Didn't you see the red light?\nB: Oh, I thought I could make a right turn on red [interrupt] if there was no oncoming traffic, which is usually permitted unless specifically prohibited by signage like in this situation.\nA: No, sir. The sign says No Turn on Red.\nB: Oh, I guess I didn't see it.\nA: I am sorry, sir. But may I see your driver's license and insurance policy, PLS? I have to give you a [interrupt] citation for the violation which will include details about the fine amount and instructions for how to contest it if you choose to do so.\nB: Wait, before you issue the ticket, I just want to confirm—will this affect my insurance rate?\nA: That's something your insurance company will decide, but I still need to issue the ticket. Here they are.\nB: Oh, right. Here are my documents.\nA: Sign here, PLS. You can appeal to the court within 14 days. This slip has all the information you need. Pls drive safely, sir.\nB: Thank you, Ma'am.", + "cleaned_text": "A: Excuse me, sir. Didn't you see the red light?\nB:Oh, I thought I could make a right turn on red if there was no oncoming traffic, which is usually permitted unless specifically prohibited by signage like in this situation.\nA: No, sir. The sign says No Turn on Red.\nB: Oh, I guess I didn't see it.\nA:I am sorry, sir. But may I see your driver's license and insurance policy, PLS? I have to give you a citation for the violation which will include details about the fine amount and instructions for how to contest it if you choose to do so.\nB: Wait, before you issue the ticket, I just want to confirm—will this affect my insurance rate?\nA: That's something your insurance company will decide, but I still need to issue the ticket. Here they are.\nB: Oh, right. Here are my documents.\nA: Sign here, PLS. You can appeal to the court within 14 days. This slip has all the information you need. Pls drive safely, sir.\nB: Thank you, Ma'am.", + "total_duration": 49.97106575963719, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, sir. Didn't you see the red light?", + "original_text": "Excuse me, sir. Didn't you see the red light?", + "start_time": 0, + "end_time": 2.716734693877551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I thought I could make a right turn on red", + "original_text": "Oh, I thought I could make a right turn on red [interrupt] if there was no oncoming traffic, which is usually permitted unless specifically prohibited by signage like in this situation.", + "start_time": 3.301683317891128, + "end_time": 12.02077628841267, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_1_B.wav", + "silence_duration": 0.5849486240135766, + "is_interrupted": true, + "text_after_interrupt": "if there was no oncoming traffic, which is usually permitted unless specifically prohibited by signage like in this situation." + }, + { + "speaker": "A", + "text": "No, sir. The sign says No Turn on Red.", + "original_text": "No, sir. The sign says No Turn on Red.", + "start_time": 5.774608487959155, + "end_time": 8.688712796349177, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_2_A.wav", + "silence_duration": 0.37559378577015545, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I guess I didn't see it.", + "original_text": "Oh, I guess I didn't see it.", + "start_time": 12.402924448016357, + "end_time": 13.958661409467604, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_3_B.wav", + "silence_duration": 0.3821481596036879, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I am sorry, sir. But may I see your driver's license and insurance policy, PLS? I have to give you a", + "original_text": "I am sorry, sir. But may I see your driver's license and insurance policy, PLS? I have to give you a [interrupt] citation for the violation which will include details about the fine amount and instructions for how to contest it if you choose to do so.", + "start_time": 14.381079824798542, + "end_time": 29.79912971141986, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_4_A.wav", + "silence_duration": 0.4224184153309384, + "is_interrupted": true, + "text_after_interrupt": "citation for the violation which will include details about the fine amount and instructions for how to contest it if you choose to do so." + }, + { + "speaker": "B", + "text": "Wait, before you issue the ticket, I just want to confirm—will this affect my insurance rate?", + "original_text": "Wait, before you issue the ticket, I just want to confirm—will this affect my insurance rate?", + "start_time": 25.48966271593637, + "end_time": 30.505172920018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_5_B.wav", + "silence_duration": 0.43526337607935195, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's something your insurance company will decide, but I still need to issue the ticket. Here they are.", + "original_text": "That's something your insurance company will decide, but I still need to issue the ticket. Here they are.", + "start_time": 30.850657571391803, + "end_time": 36.806575938738746, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_6_A.wav", + "silence_duration": 0.34548465137380235, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right. Here are my documents.", + "original_text": "Oh, right. Here are my documents.", + "start_time": 37.115538522300646, + "end_time": 39.205334440668, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_7_B.wav", + "silence_duration": 0.30896258356190043, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sign here, PLS. You can appeal to the court within 14 days. This slip has all the information you need. Pls drive safely, sir.", + "original_text": "Sign here, PLS. You can appeal to the court within 14 days. This slip has all the information you need. Pls drive safely, sir.", + "start_time": 39.65154904871787, + "end_time": 48.660891452345986, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_8_A.wav", + "silence_duration": 0.4462146080498681, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you, Ma'am.", + "original_text": "Thank you, Ma'am.", + "start_time": 49.1583915007126, + "end_time": 49.97108991341101, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--322/temp/line_9_B.wav", + "silence_duration": 0.4975000483666095, + "is_interrupted": false + } + ] + }, + "DialogSum--val--323": { + "original_text": "A: What are you waiting for? Get on that bus quickly. \nB: But where do I get a [interrupt] ticket from? I've never taken this bus line before and I'm not sure about the payment procedures or if there are any special requirements for boarding. \nA: Sorry, I should have mentioned it earlier—the driver collects the fares on the bus. \nB: Okay, and I'll have to take my luggage on board, right? \nA: Yes, you'll have to take it on board. By the way, you were asking where to get a ticket, right? \nB: Oh, right. I guess I just pay the driver directly. I wish I didn't have so much to carry.", + "cleaned_text": "A: What are you waiting for? Get on that bus quickly. \nB:But where do I get a ticket from? I've never taken this bus line before and I'm not sure about the payment procedures or if there are any special requirements for boarding.\nA: Sorry, I should have mentioned it earlier—the driver collects the fares on the bus. \nB: Okay, and I'll have to take my luggage on board, right? \nA: Yes, you'll have to take it on board. By the way, you were asking where to get a ticket, right? \nB: Oh, right. I guess I just pay the driver directly. I wish I didn't have so much to carry.", + "total_duration": 25.94426303854875, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What are you waiting for? Get on that bus quickly.", + "original_text": "What are you waiting for? Get on that bus quickly.", + "start_time": 0, + "end_time": 3.575873015873016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But where do I get a", + "original_text": "But where do I get a [interrupt] ticket from? I've never taken this bus line before and I'm not sure about the payment procedures or if there are any special requirements for boarding.", + "start_time": 3.9368355837734454, + "end_time": 12.296019257242834, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/temp/line_1_B.wav", + "silence_duration": 0.3609625679004294, + "is_interrupted": true, + "text_after_interrupt": "ticket from? I've never taken this bus line before and I'm not sure about the payment procedures or if there are any special requirements for boarding." + }, + { + "speaker": "A", + "text": "Sorry, I should have mentioned it earlier—the driver collects the fares on the bus.", + "original_text": "Sorry, I should have mentioned it earlier—the driver collects the fares on the bus.", + "start_time": 5.016563474929908, + "end_time": 9.915973905768912, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/temp/line_2_A.wav", + "silence_duration": 0.5482632374783776, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Okay, and I'll have to take my luggage on board, right?", + "original_text": "Okay, and I'll have to take my luggage on board, right?", + "start_time": 12.653339874130147, + "end_time": 15.764813797032641, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/temp/line_3_B.wav", + "silence_duration": 0.35732061688731176, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, you'll have to take it on board. By the way, you were asking where to get a ticket, right?", + "original_text": "Yes, you'll have to take it on board. By the way, you were asking where to get a ticket, right?", + "start_time": 16.33981864758706, + "end_time": 21.192789169129007, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/temp/line_4_A.wav", + "silence_duration": 0.5750048505544194, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right. I guess I just pay the driver directly. I wish I didn't have so much to carry.", + "original_text": "Oh, right. I guess I just pay the driver directly. I wish I didn't have so much to carry.", + "start_time": 21.613750658579196, + "end_time": 25.94427220052931, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--323/temp/line_5_B.wav", + "silence_duration": 0.4209614894501876, + "is_interrupted": false + } + ] + }, + "DialogSum--val--324": { + "original_text": "A: Excuse me. I'm your new neighbor, Jack. I just moved [interrupt] into the apartment next door and wanted to introduce myself properly since we'll be seeing each other around the building quite often.\nB: Sorry to interrupt, welcome to the neighborhood! Have you settled in okay?\nA: Thank you! Yes, mostly. I was actually looking for a grocery store. Are there any around here?\nB: Yes, there are some on Pine Street.\nA: OK. And is there a laundromat near [interrupt] here that you'd recommend, or will I need to go further out to find one with good machines and reasonable prices?\nB: Oh, before I forget, do you need any help with finding other places nearby? Like maybe a pharmacy or a coffee shop?\nA: Thanks for asking! Actually, I was going to ask about a laundromat. Is there one near here?\nB: Well, I think there's one across from the shopping center.\nA: Great, thank you.\nB: By the way, there's a barber shop in the shopping center, too.", + "cleaned_text": "A:Excuse me. I'm your new neighbor, Jack. I just moved into the apartment next door and wanted to introduce myself properly since we'll be seeing each other around the building quite often.\nB: Sorry to interrupt, welcome to the neighborhood! Have you settled in okay?\nA: Thank you! Yes, mostly. I was actually looking for a grocery store. Are there any around here?\nB: Yes, there are some on Pine Street.\nA:OK. And is there a laundromat near here that you'd recommend, or will I need to go further out to find one with good machines and reasonable prices?\nB: Oh, before I forget, do you need any help with finding other places nearby? Like maybe a pharmacy or a coffee shop?\nA: Thanks for asking! Actually, I was going to ask about a laundromat. Is there one near here?\nB: Well, I think there's one across from the shopping center.\nA: Great, thank you.\nB: By the way, there's a barber shop in the shopping center, too.", + "total_duration": 47.964444444444446, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. I'm your new neighbor, Jack. I just moved", + "original_text": "Excuse me. I'm your new neighbor, Jack. I just moved [interrupt] into the apartment next door and wanted to introduce myself properly since we'll be seeing each other around the building quite often.", + "start_time": 0, + "end_time": 10.832108843537416, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "into the apartment next door and wanted to introduce myself properly since we'll be seeing each other around the building quite often." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, welcome to the neighborhood! Have you settled in okay?", + "original_text": "Sorry to interrupt, welcome to the neighborhood! Have you settled in okay?", + "start_time": 3.8312925170068026, + "end_time": 7.186575963718821, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_1_B.wav", + "silence_duration": 0.4978944078543781, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you! Yes, mostly. I was actually looking for a grocery store. Are there any around here?", + "original_text": "Thank you! Yes, mostly. I was actually looking for a grocery store. Are there any around here?", + "start_time": 11.163127144993581, + "end_time": 16.712696305991315, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_2_A.wav", + "silence_duration": 0.3310183014561644, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, there are some on Pine Street.", + "original_text": "Yes, there are some on Pine Street.", + "start_time": 17.26468822638099, + "end_time": 19.157114530235866, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_3_B.wav", + "silence_duration": 0.5519919203896761, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. And is there a laundromat near", + "original_text": "OK. And is there a laundromat near [interrupt] here that you'd recommend, or will I need to go further out to find one with good machines and reasonable prices?", + "start_time": 19.567222491747163, + "end_time": 28.65783473664512, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_4_A.wav", + "silence_duration": 0.41010796151129725, + "is_interrupted": true, + "text_after_interrupt": "here that you'd recommend, or will I need to go further out to find one with good machines and reasonable prices?" + }, + { + "speaker": "B", + "text": "Oh, before I forget, do you need any help with finding other places nearby? Like maybe a pharmacy or a coffee shop?", + "original_text": "Oh, before I forget, do you need any help with finding other places nearby? Like maybe a pharmacy or a coffee shop?", + "start_time": 26.060151387259893, + "end_time": 32.6546185074413, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_5_B.wav", + "silence_duration": 0.46000508906949733, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks for asking! Actually, I was going to ask about a laundromat. Is there one near here?", + "original_text": "Thanks for asking! Actually, I was going to ask about a laundromat. Is there one near here?", + "start_time": 33.18382141231407, + "end_time": 38.44314114020523, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_6_A.wav", + "silence_duration": 0.5292029048727693, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I think there's one across from the shopping center.", + "original_text": "Well, I think there's one across from the shopping center.", + "start_time": 39.0338814924511, + "end_time": 42.47043478043296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_7_B.wav", + "silence_duration": 0.5907403522458725, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Great, thank you.", + "original_text": "Great, thank you.", + "start_time": 42.898654836945006, + "end_time": 44.11770245599263, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_8_A.wav", + "silence_duration": 0.42822005651204703, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "By the way, there's a barber shop in the shopping center, too.", + "original_text": "By the way, there's a barber shop in the shopping center, too.", + "start_time": 44.65560541822792, + "end_time": 47.96444895564289, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--324/temp/line_9_B.wav", + "silence_duration": 0.5379029622352904, + "is_interrupted": false + } + ] + }, + "DialogSum--val--326": { + "original_text": "A: Is there anything I can do for you? \nB: Yes, I joined your group bus tour this morning. You promised the journey would last 3 hours and we would visit 15 sightseeing spots. \nA: Yes, sir. We promised [interrupt] to cover all the major attractions within the given time frame, including the historical landmarks, cultural hotspots, and scenic viewpoints that make this tour so special. \nB: But the journey only lasted 2 hours. Why was it shorter than expected? \nA: I apologize for that. There was an unforeseen issue with traffic that shortened the trip. However, I haven't mentioned yet that we also had to skip some stops due to time constraints and a road closure that occurred unexpectedly. \nB: Skipping stops? That explains the fewer sightseeing spots. But could you clarify which stops were skipped and why? \n", + "cleaned_text": "A: Is there anything I can do for you? \nB: Yes, I joined your group bus tour this morning. You promised the journey would last 3 hours and we would visit 15 sightseeing spots. \nA:Yes, sir. We promised to cover all the major attractions within the given time frame, including the historical landmarks, cultural hotspots, and scenic viewpoints that make this tour so special.\nB: But the journey only lasted 2 hours. Why was it shorter than expected? \nA: I apologize for that. There was an unforeseen issue with traffic that shortened the trip. However, I haven't mentioned yet that we also had to skip some stops due to time constraints and a road closure that occurred unexpectedly. \nB: Skipping stops? That explains the fewer sightseeing spots. But could you clarify which stops were skipped and why? \n", + "total_duration": 42.45133786848073, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is there anything I can do for you?", + "original_text": "Is there anything I can do for you?", + "start_time": 0, + "end_time": 1.7298866213151927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I joined your group bus tour this morning. You promised the journey would last 3 hours and we would visit 15 sightseeing spots.", + "original_text": "Yes, I joined your group bus tour this morning. You promised the journey would last 3 hours and we would visit 15 sightseeing spots.", + "start_time": 2.2101448040116227, + "end_time": 9.0019815387055, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/temp/line_1_B.wav", + "silence_duration": 0.4802581826964301, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, sir. We promised", + "original_text": "Yes, sir. We promised [interrupt] to cover all the major attractions within the given time frame, including the historical landmarks, cultural hotspots, and scenic viewpoints that make this tour so special.", + "start_time": 9.330581605794224, + "end_time": 21.370128091054994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/temp/line_2_A.wav", + "silence_duration": 0.3286000670887244, + "is_interrupted": true, + "text_after_interrupt": "to cover all the major attractions within the given time frame, including the historical landmarks, cultural hotspots, and scenic viewpoints that make this tour so special." + }, + { + "speaker": "B", + "text": "But the journey only lasted 2 hours. Why was it shorter than expected?", + "original_text": "But the journey only lasted 2 hours. Why was it shorter than expected?", + "start_time": 10.944368453866787, + "end_time": 15.356159837086741, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/temp/line_3_B.wav", + "silence_duration": 0.5574649180655832, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I apologize for that. There was an unforeseen issue with traffic that shortened the trip. However, I haven't mentioned yet that we also had to skip some stops due to time constraints and a road closure that occurred unexpectedly.", + "original_text": "I apologize for that. There was an unforeseen issue with traffic that shortened the trip. However, I haven't mentioned yet that we also had to skip some stops due to time constraints and a road closure that occurred unexpectedly.", + "start_time": 21.925958348373676, + "end_time": 35.18455245268207, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/temp/line_4_A.wav", + "silence_duration": 0.555830257318684, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Skipping stops? That explains the fewer sightseeing spots. But could you clarify which stops were skipped and why?", + "original_text": "Skipping stops? That explains the fewer sightseeing spots. But could you clarify which stops were skipped and why?", + "start_time": 35.68272595629116, + "end_time": 42.45134273633651, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--326/temp/line_5_B.wav", + "silence_duration": 0.49817350360908763, + "is_interrupted": false + } + ] + }, + "DialogSum--val--327": { + "original_text": "A: Can I help you, sir? \nB: Yes, what sort of warranty comes with this stereo? \nA: Well, our store offers a 90-day return policy and the manufacturer offers a one-year warranty on any factory [interrupt] defects, such as malfunctioning parts or issues that arise from normal use, and this includes free repairs or replacements depending on the severity of the issue. \nB: Sorry, can you clarify what exactly the store's return policy covers? \nA: Sure, we'll give you your money back as long as the stereo is returned in the original packaging and with a receipt. But to finish what I was saying earlier, the manufacturer's warranty covers any factory defects for one year. \nB: O.K. How do I get the manufacturer's warranty? \nA: Just send in the warranty card with a copy of your receipt. \nB: All right, those sound good. I'll take it.", + "cleaned_text": "A: Can I help you, sir? \nB: Yes, what sort of warranty comes with this stereo? \nA:Well, our store offers a 90-day return policy and the manufacturer offers a one-year warranty on any factory defects, such as malfunctioning parts or issues that arise from normal use, and this includes free repairs or replacements depending on the severity of the issue.\nB: Sorry, can you clarify what exactly the store's return policy covers? \nA: Sure, we'll give you your money back as long as the stereo is returned in the original packaging and with a receipt. But to finish what I was saying earlier, the manufacturer's warranty covers any factory defects for one year. \nB: O.K. How do I get the manufacturer's warranty? \nA: Just send in the warranty card with a copy of your receipt. \nB: All right, those sound good. I'll take it.", + "total_duration": 45.58249433106576, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can I help you, sir?", + "original_text": "Can I help you, sir?", + "start_time": 0, + "end_time": 1.253877551020408, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, what sort of warranty comes with this stereo?", + "original_text": "Yes, what sort of warranty comes with this stereo?", + "start_time": 1.8068679579582025, + "end_time": 4.3262330373232825, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_1_B.wav", + "silence_duration": 0.5529904069377944, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, our store offers a 90-day return policy and the manufacturer offers a one-year warranty on any factory", + "original_text": "Well, our store offers a 90-day return policy and the manufacturer offers a one-year warranty on any factory [interrupt] defects, such as malfunctioning parts or issues that arise from normal use, and this includes free repairs or replacements depending on the severity of the issue.", + "start_time": 4.6484117268571055, + "end_time": 21.70346841619951, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_2_A.wav", + "silence_duration": 0.3221786895338228, + "is_interrupted": true, + "text_after_interrupt": "defects, such as malfunctioning parts or issues that arise from normal use, and this includes free repairs or replacements depending on the severity of the issue." + }, + { + "speaker": "B", + "text": "Sorry, can you clarify what exactly the store's return policy covers?", + "original_text": "Sorry, can you clarify what exactly the store's return policy covers?", + "start_time": 12.102017169033976, + "end_time": 16.23516909647162, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_3_B.wav", + "silence_duration": 0.34656082250621567, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, we'll give you your money back as long as the stereo is returned in the original packaging and with a receipt. But to finish what I was saying earlier, the manufacturer's warranty covers any factory defects for one year.", + "original_text": "Sure, we'll give you your money back as long as the stereo is returned in the original packaging and with a receipt. But to finish what I was saying earlier, the manufacturer's warranty covers any factory defects for one year.", + "start_time": 22.12886277143279, + "end_time": 35.5383865809566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_4_A.wav", + "silence_duration": 0.425394355233281, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "O.K. How do I get the manufacturer's warranty?", + "original_text": "O.K. How do I get the manufacturer's warranty?", + "start_time": 36.07527224631148, + "end_time": 38.71073709891919, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_5_B.wav", + "silence_duration": 0.5368856653548801, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Just send in the warranty card with a copy of your receipt.", + "original_text": "Just send in the warranty card with a copy of your receipt.", + "start_time": 39.11897549847533, + "end_time": 42.39298910391751, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_6_A.wav", + "silence_duration": 0.40823839955613883, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right, those sound good. I'll take it.", + "original_text": "All right, those sound good. I'll take it.", + "start_time": 42.70323136586521, + "end_time": 45.58250574228244, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--327/temp/line_7_B.wav", + "silence_duration": 0.31024226194769994, + "is_interrupted": false + } + ] + }, + "DialogSum--val--328": { + "original_text": "A: I have to do some shopping. \nB: What are you going to look for? \nA: I'm trying to buy a new bedroom set. \nB: What store are you going to? \nA: I'm not [interrupt] completely sure yet, but I was thinking of checking out a few places downtown that specialize in modern furniture designs and have good customer reviews. \nB: Sorry to jump in, but if you're not sure, have you considered checking online first? Sometimes you can find better deals or at least get an idea of what stores have what you need. \nA: That's a good idea. I was actually going to say I'm not sure where to start. Would you like me to tell you where I got mine? \nB: I would appreciate that. \nA: I went to get mine from IKEA. \nB: Is the furniture at IKEA cheap? \nA: They're not cheap, but neither is their [interrupt] design. They have some really stylish options that are worth the price, especially when you consider the durability and functionality of their modular pieces. \nB: Oh, I get what you mean. The quality matches the price, right? \nA: Exactly!", + "cleaned_text": "A: I have to do some shopping. \nB: What are you going to look for? \nA: I'm trying to buy a new bedroom set. \nB: What store are you going to? \nA:I'm not completely sure yet, but I was thinking of checking out a few places downtown that specialize in modern furniture designs and have good customer reviews.\nB: Sorry to jump in, but if you're not sure, have you considered checking online first? Sometimes you can find better deals or at least get an idea of what stores have what you need. \nA: That's a good idea. I was actually going to say I'm not sure where to start. Would you like me to tell you where I got mine? \nB: I would appreciate that. \nA: I went to get mine from IKEA. \nB: Is the furniture at IKEA cheap? \nA:They're not cheap, but neither is their design. They have some really stylish options that are worth the price, especially when you consider the durability and functionality of their modular pieces.\nB: Oh, I get what you mean. The quality matches the price, right? \nA: Exactly!", + "total_duration": 49.48789115646259, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I have to do some shopping.", + "original_text": "I have to do some shopping.", + "start_time": 0, + "end_time": 1.6486167800453515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What are you going to look for?", + "original_text": "What are you going to look for?", + "start_time": 1.9592083777308675, + "end_time": 3.155036042129961, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_1_B.wav", + "silence_duration": 0.3105915976855161, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm trying to buy a new bedroom set.", + "original_text": "I'm trying to buy a new bedroom set.", + "start_time": 3.517172922906408, + "end_time": 5.873998319731805, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_2_A.wav", + "silence_duration": 0.3621368807764474, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What store are you going to?", + "original_text": "What store are you going to?", + "start_time": 6.427716444051304, + "end_time": 7.704813949720238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_3_B.wav", + "silence_duration": 0.5537181243194997, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm not", + "original_text": "I'm not [interrupt] completely sure yet, but I was thinking of checking out a few places downtown that specialize in modern furniture designs and have good customer reviews.", + "start_time": 8.19722737581776, + "end_time": 18.35595753454792, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_4_A.wav", + "silence_duration": 0.4924134260975235, + "is_interrupted": true, + "text_after_interrupt": "completely sure yet, but I was thinking of checking out a few places downtown that specialize in modern furniture designs and have good customer reviews." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but if you're not sure, have you considered checking online first? Sometimes you can find better deals or at least get an idea of what stores have what you need.", + "original_text": "Sorry to jump in, but if you're not sure, have you considered checking online first? Sometimes you can find better deals or at least get an idea of what stores have what you need.", + "start_time": 9.195685425704383, + "end_time": 18.36756751187218, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_5_B.wav", + "silence_duration": 0.3261085104579388, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a good idea. I was actually going to say I'm not sure where to start. Would you like me to tell you where I got mine?", + "original_text": "That's a good idea. I was actually going to say I'm not sure where to start. Would you like me to tell you where I got mine?", + "start_time": 18.962458928683567, + "end_time": 26.334794529590596, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_6_A.wav", + "silence_duration": 0.5948914168113857, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I would appreciate that.", + "original_text": "I would appreciate that.", + "start_time": 26.914223115831827, + "end_time": 28.249370508122077, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_7_B.wav", + "silence_duration": 0.5794285862412316, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I went to get mine from IKEA.", + "original_text": "I went to get mine from IKEA.", + "start_time": 28.778744739291668, + "end_time": 30.555071269903912, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_8_A.wav", + "silence_duration": 0.5293742311695909, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is the furniture at IKEA cheap?", + "original_text": "Is the furniture at IKEA cheap?", + "start_time": 31.046114826089287, + "end_time": 32.54380190091922, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_9_B.wav", + "silence_duration": 0.49104355618537426, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They're not cheap, but neither is their", + "original_text": "They're not cheap, but neither is their [interrupt] design. They have some really stylish options that are worth the price, especially when you consider the durability and functionality of their modular pieces.", + "start_time": 32.85149314889264, + "end_time": 44.14800108540057, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_10_A.wav", + "silence_duration": 0.30769124797341296, + "is_interrupted": true, + "text_after_interrupt": "design. They have some really stylish options that are worth the price, especially when you consider the durability and functionality of their modular pieces." + }, + { + "speaker": "B", + "text": "Oh, I get what you mean. The quality matches the price, right?", + "original_text": "Oh, I get what you mean. The quality matches the price, right?", + "start_time": 44.55000302937138, + "end_time": 47.9052864760834, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_11_B.wav", + "silence_duration": 0.5248916908300998, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Exactly!", + "original_text": "Exactly!", + "start_time": 48.39658381000756, + "end_time": 49.48792167848829, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--328/temp/line_12_A.wav", + "silence_duration": 0.4912973339241677, + "is_interrupted": false + } + ] + }, + "DialogSum--val--329": { + "original_text": "A: What's the matter with me, Doctor? I feel so tired these days. \nB: It's your blood pressure, I'm afraid. It's far too [interrupt] high, and that's something we need to address immediately with a comprehensive treatment plan including medication and lifestyle changes. \nA: Too high? Oh no, that sounds serious. What's the cause of that? \nB: Overwork—amongst other things. You can't work 24 hours a day. You've got to slow down your pace and give your body the rest it needs. \nA: Slow down? But I can't just slow down, Doctor. There's too much on my plate right now. \nB: You've got to, I'm afraid. And look at this. You weigh 200 stones. That's too much for a man of your size. \nA: Wait, did you say 200 stones? That's... shocking. You mean I've got to lose weight? \nB: Yes. You've got to cut down on bread and potatoes and take more [interrupt] exercise, starting with gentle activities like walking or swimming before gradually increasing intensity as your health improves.", + "cleaned_text": "A: What's the matter with me, Doctor? I feel so tired these days. \nB:It's your blood pressure, I'm afraid. It's far too high, and that's something we need to address immediately with a comprehensive treatment plan including medication and lifestyle changes.\nA: Too high? Oh no, that sounds serious. What's the cause of that? \nB: Overwork—amongst other things. You can't work 24 hours a day. You've got to slow down your pace and give your body the rest it needs. \nA: Slow down? But I can't just slow down, Doctor. There's too much on my plate right now. \nB: You've got to, I'm afraid. And look at this. You weigh 200 stones. That's too much for a man of your size. \nA: Wait, did you say 200 stones? That's... shocking. You mean I've got to lose weight? \nB:Yes. You've got to cut down on bread and potatoes and take more exercise, starting with gentle activities like walking or swimming before gradually increasing intensity as your health improves.", + "total_duration": 51.44390022675737, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What's the matter with me, Doctor? I feel so tired these days.", + "original_text": "What's the matter with me, Doctor? I feel so tired these days.", + "start_time": 0, + "end_time": 3.7732426303854876, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's your blood pressure, I'm afraid. It's far too", + "original_text": "It's your blood pressure, I'm afraid. It's far too [interrupt] high, and that's something we need to address immediately with a comprehensive treatment plan including medication and lifestyle changes.", + "start_time": 4.256579449921412, + "end_time": 13.892860629059733, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_1_B.wav", + "silence_duration": 0.4833368195359239, + "is_interrupted": true, + "text_after_interrupt": "high, and that's something we need to address immediately with a comprehensive treatment plan including medication and lifestyle changes." + }, + { + "speaker": "A", + "text": "Too high? Oh no, that sounds serious. What's the cause of that?", + "original_text": "Too high? Oh no, that sounds serious. What's the cause of that?", + "start_time": 7.251953599581276, + "end_time": 11.686964937449757, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_2_A.wav", + "silence_duration": 0.33993914328340513, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Overwork—amongst other things. You can't work 24 hours a day. You've got to slow down your pace and give your body the rest it needs.", + "original_text": "Overwork—amongst other things. You can't work 24 hours a day. You've got to slow down your pace and give your body the rest it needs.", + "start_time": 14.45124483334201, + "end_time": 21.87002034354609, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_3_B.wav", + "silence_duration": 0.5583842042822775, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Slow down? But I can't just slow down, Doctor. There's too much on my plate right now.", + "original_text": "Slow down? But I can't just slow down, Doctor. There's too much on my plate right now.", + "start_time": 22.288526619920187, + "end_time": 28.999093513344224, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_4_A.wav", + "silence_duration": 0.41850627637409676, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You've got to, I'm afraid. And look at this. You weigh 200 stones. That's too much for a man of your size.", + "original_text": "You've got to, I'm afraid. And look at this. You weigh 200 stones. That's too much for a man of your size.", + "start_time": 29.536232270843016, + "end_time": 35.387660842271586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_5_B.wav", + "silence_duration": 0.5371387574987909, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, did you say 200 stones? That's... shocking. You mean I've got to lose weight?", + "original_text": "Wait, did you say 200 stones? That's... shocking. You mean I've got to lose weight?", + "start_time": 35.832226379564474, + "end_time": 41.5095052911291, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_6_A.wav", + "silence_duration": 0.4445655372928857, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. You've got to cut down on bread and potatoes and take more", + "original_text": "Yes. You've got to cut down on bread and potatoes and take more [interrupt] exercise, starting with gentle activities like walking or swimming before gradually increasing intensity as your health improves.", + "start_time": 41.93534531975223, + "end_time": 51.44391674832366, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--329/temp/line_7_B.wav", + "silence_duration": 0.4258400286231269, + "is_interrupted": true, + "text_after_interrupt": "exercise, starting with gentle activities like walking or swimming before gradually increasing intensity as your health improves." + } + ] + }, + "DialogSum--val--331": { + "original_text": "A: Hi, Martin. How are you? \nB: Fine, but busy. We've got some exams next week, remember? \nA: I know. How much work did you do last night? \nB: None. I went to the cinema. What about you? \nA: I had no time last night. It was my sister's birthday, so we all went out to [interrupt] celebrate at her favorite restaurant which had this amazing live band playing and the food was absolutely delicious, though I probably ate too much cake! \nB: Oh, that sounds nice! But speaking of last night, did you manage to find your physics book? \nA: Actually, I was just about to ask you that. I couldn't find it anywhere. Do you know where it might be? \nB: I've got no idea, but you can borrow mine if you want. \nA: Thanks. Let's meet outside Natbank in High Street at lunch time. I'll bring your book back then. \nB: Sure, and I'll bring my physics book for you. By the way, I'm really worried about the physics exam. Have you got any old exam papers? I'd really like to look through them. \nA: I haven't, but my brother's got some. I'll bring them with me at lunch time.", + "cleaned_text": "A: Hi, Martin. How are you? \nB: Fine, but busy. We've got some exams next week, remember? \nA: I know. How much work did you do last night? \nB: None. I went to the cinema. What about you? \nA:I had no time last night. It was my sister's birthday, so we all went out to celebrate at her favorite restaurant which had this amazing live band playing and the food was absolutely delicious, though I probably ate too much cake!\nB: Oh, that sounds nice! But speaking of last night, did you manage to find your physics book? \nA: Actually, I was just about to ask you that. I couldn't find it anywhere. Do you know where it might be? \nB: I've got no idea, but you can borrow mine if you want. \nA: Thanks. Let's meet outside Natbank in High Street at lunch time. I'll bring your book back then. \nB: Sure, and I'll bring my physics book for you. By the way, I'm really worried about the physics exam. Have you got any old exam papers? I'd really like to look through them. \nA: I haven't, but my brother's got some. I'll bring them with me at lunch time.", + "total_duration": 55.620816326530615, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, Martin. How are you?", + "original_text": "Hi, Martin. How are you?", + "start_time": 0, + "end_time": 1.7182766439909296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fine, but busy. We've got some exams next week, remember?", + "original_text": "Fine, but busy. We've got some exams next week, remember?", + "start_time": 2.2825076254243633, + "end_time": 5.614571117487856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_1_B.wav", + "silence_duration": 0.5642309814334336, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I know. How much work did you do last night?", + "original_text": "I know. How much work did you do last night?", + "start_time": 6.024351593350765, + "end_time": 8.555326650040108, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_2_A.wav", + "silence_duration": 0.4097804758629096, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "None. I went to the cinema. What about you?", + "original_text": "None. I went to the cinema. What about you?", + "start_time": 8.947000647476482, + "end_time": 11.257386135004827, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_3_B.wav", + "silence_duration": 0.39167399743637454, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I had no time last night. It was my sister's birthday, so we all went out to", + "original_text": "I had no time last night. It was my sister's birthday, so we all went out to [interrupt] celebrate at her favorite restaurant which had this amazing live band playing and the food was absolutely delicious, though I probably ate too much cake!", + "start_time": 11.77102881793495, + "end_time": 25.703001607050595, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_4_A.wav", + "silence_duration": 0.5136426829301215, + "is_interrupted": true, + "text_after_interrupt": "celebrate at her favorite restaurant which had this amazing live band playing and the food was absolutely delicious, though I probably ate too much cake!" + }, + { + "speaker": "B", + "text": "Oh, that sounds nice! But speaking of last night, did you manage to find your physics book?", + "original_text": "Oh, that sounds nice! But speaking of last night, did you manage to find your physics book?", + "start_time": 16.949078704556264, + "end_time": 22.185178477798893, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_5_B.wav", + "silence_duration": 0.42076327550353687, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, I was just about to ask you that. I couldn't find it anywhere. Do you know where it might be?", + "original_text": "Actually, I was just about to ask you that. I couldn't find it anywhere. Do you know where it might be?", + "start_time": 26.171079898701237, + "end_time": 31.523279445186496, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_6_A.wav", + "silence_duration": 0.4680782916506431, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've got no idea, but you can borrow mine if you want.", + "original_text": "I've got no idea, but you can borrow mine if you want.", + "start_time": 31.972333553237913, + "end_time": 34.88643786162794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_7_B.wav", + "silence_duration": 0.44905410805141616, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks. Let's meet outside Natbank in High Street at lunch time. I'll bring your book back then.", + "original_text": "Thanks. Let's meet outside Natbank in High Street at lunch time. I'll bring your book back then.", + "start_time": 35.361128989475134, + "end_time": 40.875868218500074, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_8_A.wav", + "silence_duration": 0.47469112784719736, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, and I'll bring my physics book for you. By the way, I'm really worried about the physics exam. Have you got any old exam papers? I'd really like to look through them.", + "original_text": "Sure, and I'll bring my physics book for you. By the way, I'm really worried about the physics exam. Have you got any old exam papers? I'd really like to look through them.", + "start_time": 41.35440656125118, + "end_time": 50.71204828460719, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_9_B.wav", + "silence_duration": 0.47853834275110774, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I haven't, but my brother's got some. I'll bring them with me at lunch time.", + "original_text": "I haven't, but my brother's got some. I'll bring them with me at lunch time.", + "start_time": 51.10454571806854, + "end_time": 55.62082689720687, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--331/temp/line_10_A.wav", + "silence_duration": 0.3924974334613528, + "is_interrupted": false + } + ] + }, + "DialogSum--val--332": { + "original_text": "A: Hello, my name's David Parker. I'm calling about the apartment advertised in the paper. Can you tell me something about it? \nB: Yes, it's a one-bedroom apartment, with a living room, a kitchen, a bathroom and a [interrupt] small storage space that could be useful for keeping extra items like seasonal decorations, luggage, or other belongings you don't need daily access to. \nA: Sorry to cut in, but could you clarify whether it's in a quiet neighborhood? I'm particularly concerned about noise levels. \nB: It's actually in a very quiet area, which is one of its best features. Now, as I was saying, it also has a balcony. \nA: That sounds good. Where is it located? \nB: It's on Montreal Road. \nA: Is it furnished? \nB: Yes, it is furnished with sofas, a dining table, chairs and [interrupt] a bed in the bedroom, which is quite convenient if you don't have your own furniture and want to move in without the hassle of buying and transporting large items. \nA: And what about appliances? Are those included too? \nB: Yes, some appliances are included as well. \nA: How much is the rent? \nB: It's five hundred dollars per month, including utilities. \nA: You mean gas, electricity and heat? \nB: Yes, that's right. \nA: Is there anything like management fee or parking fee? \nB: The management fee is included in the rent. But parking is fifty dollars a month.", + "cleaned_text": "A: Hello, my name's David Parker. I'm calling about the apartment advertised in the paper. Can you tell me something about it? \nB:Yes, it's a one-bedroom apartment, with a living room, a kitchen, a bathroom and a small storage space that could be useful for keeping extra items like seasonal decorations, luggage, or other belongings you don't need daily access to.\nA: Sorry to cut in, but could you clarify whether it's in a quiet neighborhood? I'm particularly concerned about noise levels. \nB: It's actually in a very quiet area, which is one of its best features. Now, as I was saying, it also has a balcony. \nA: That sounds good. Where is it located? \nB: It's on Montreal Road. \nA: Is it furnished? \nB:Yes, it is furnished with sofas, a dining table, chairs and a bed in the bedroom, which is quite convenient if you don't have your own furniture and want to move in without the hassle of buying and transporting large items.\nA: And what about appliances? Are those included too? \nB: Yes, some appliances are included as well. \nA: How much is the rent? \nB: It's five hundred dollars per month, including utilities. \nA: You mean gas, electricity and heat? \nB: Yes, that's right. \nA: Is there anything like management fee or parking fee? \nB: The management fee is included in the rent. But parking is fifty dollars a month.", + "total_duration": 72.17301587301587, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, my name's David Parker. I'm calling about the apartment advertised in the paper. Can you tell me something about it?", + "original_text": "Hello, my name's David Parker. I'm calling about the apartment advertised in the paper. Can you tell me something about it?", + "start_time": 0, + "end_time": 7.569705215419501, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it's a one-bedroom apartment, with a living room, a kitchen, a bathroom and a", + "original_text": "Yes, it's a one-bedroom apartment, with a living room, a kitchen, a bathroom and a [interrupt] small storage space that could be useful for keeping extra items like seasonal decorations, luggage, or other belongings you don't need daily access to.", + "start_time": 8.110037441511185, + "end_time": 20.405003427905744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_1_B.wav", + "silence_duration": 0.5403322260916846, + "is_interrupted": true, + "text_after_interrupt": "small storage space that could be useful for keeping extra items like seasonal decorations, luggage, or other belongings you don't need daily access to." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but could you clarify whether it's in a quiet neighborhood? I'm particularly concerned about noise levels.", + "original_text": "Sorry to cut in, but could you clarify whether it's in a quiet neighborhood? I'm particularly concerned about noise levels.", + "start_time": 12.765638348540664, + "end_time": 20.822962611579214, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_2_A.wav", + "silence_duration": 0.5976759389474726, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's actually in a very quiet area, which is one of its best features. Now, as I was saying, it also has a balcony.", + "original_text": "It's actually in a very quiet area, which is one of its best features. Now, as I was saying, it also has a balcony.", + "start_time": 21.1241753037017, + "end_time": 27.521272809370636, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_3_B.wav", + "silence_duration": 0.30121269212248825, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds good. Where is it located?", + "original_text": "That sounds good. Where is it located?", + "start_time": 27.93473391133275, + "end_time": 30.709518491831616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_4_A.wav", + "silence_duration": 0.41346110196211244, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's on Montreal Road.", + "original_text": "It's on Montreal Road.", + "start_time": 31.06636301824412, + "end_time": 32.43634034250716, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_5_B.wav", + "silence_duration": 0.3568445264125053, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is it furnished?", + "original_text": "Is it furnished?", + "start_time": 32.798385770891755, + "end_time": 33.831673752751165, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_6_A.wav", + "silence_duration": 0.3620454283845985, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it is furnished with sofas, a dining table, chairs and", + "original_text": "Yes, it is furnished with sofas, a dining table, chairs and [interrupt] a bed in the bedroom, which is quite convenient if you don't have your own furniture and want to move in without the hassle of buying and transporting large items.", + "start_time": 34.285170636424276, + "end_time": 44.560000568397065, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_7_B.wav", + "silence_duration": 0.453496883673113, + "is_interrupted": true, + "text_after_interrupt": "a bed in the bedroom, which is quite convenient if you don't have your own furniture and want to move in without the hassle of buying and transporting large items." + }, + { + "speaker": "A", + "text": "And what about appliances? Are those included too?", + "original_text": "And what about appliances? Are those included too?", + "start_time": 46.40256521761226, + "end_time": 49.8158985509456, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_8_A.wav", + "silence_duration": 0.3055241922543854, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, some appliances are included as well.", + "original_text": "Yes, some appliances are included as well.", + "start_time": 50.381728092950745, + "end_time": 53.214562560070924, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_9_B.wav", + "silence_duration": 0.5658295420051501, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How much is the rent?", + "original_text": "How much is the rent?", + "start_time": 53.540475975910994, + "end_time": 54.875623368201246, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_10_A.wav", + "silence_duration": 0.3259134158400684, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's five hundred dollars per month, including utilities.", + "original_text": "It's five hundred dollars per month, including utilities.", + "start_time": 55.408446515451764, + "end_time": 58.961099576676254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_11_B.wav", + "silence_duration": 0.5328231472505205, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You mean gas, electricity and heat?", + "original_text": "You mean gas, electricity and heat?", + "start_time": 59.36443903892529, + "end_time": 62.46430298450352, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_12_A.wav", + "silence_duration": 0.40333946224903455, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that's right.", + "original_text": "Yes, that's right.", + "start_time": 63.01088621932817, + "end_time": 64.0093442692148, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_13_B.wav", + "silence_duration": 0.5465832348246488, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is there anything like management fee or parking fee?", + "original_text": "Is there anything like management fee or parking fee?", + "start_time": 64.37691586365452, + "end_time": 67.39550996796291, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_14_A.wav", + "silence_duration": 0.36757159443973, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The management fee is included in the rent. But parking is fifty dollars a month.", + "original_text": "The management fee is included in the rent. But parking is fifty dollars a month.", + "start_time": 67.87736048567423, + "end_time": 72.17305209565156, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--332/temp/line_15_B.wav", + "silence_duration": 0.48185051771132575, + "is_interrupted": false + } + ] + }, + "DialogSum--val--333": { + "original_text": "A: Hello, Barbara, welcome back. You look great. \nB: Rod, it's lovely to see you again. \nA: How was your trip? \nB: Fine but tiring. Milan was interesting, it's bigger than I expected, noisier and [interrupt] busier than I imagined, especially in the city center where the streets were constantly packed with people rushing to work and tourists exploring the historic landmarks. \nA: Sorry to cut you off, but did you manage to visit Florence as well? \nB: Well, I didn't go there. Have you been there? \nA: No, I've never been to Italy. I'd really like to go to Roma. Well, the cars are in the car park. Is this all your luggage? \nB: Yes, but the suitcase is very heavy. \nA: Barbara, what's in it? Books or [interrupt] souvenirs from all the amazing shops you must have visited during your time in Milan? \nB: Just 20 pairs of shoes. \nA: Oh wow, that's a lot of shoes! But you mentioned Milan was noisier and busier—what did you mean by that?", + "cleaned_text": "A: Hello, Barbara, welcome back. You look great. \nB: Rod, it's lovely to see you again. \nA: How was your trip? \nB:Fine but tiring. Milan was interesting, it's bigger than I expected, noisier and busier than I imagined, especially in the city center where the streets were constantly packed with people rushing to work and tourists exploring the historic landmarks.\nA: Sorry to cut you off, but did you manage to visit Florence as well? \nB: Well, I didn't go there. Have you been there? \nA: No, I've never been to Italy. I'd really like to go to Roma. Well, the cars are in the car park. Is this all your luggage? \nB: Yes, but the suitcase is very heavy. \nA:Barbara, what's in it? Books or souvenirs from all the amazing shops you must have visited during your time in Milan?\nB: Just 20 pairs of shoes. \nA: Oh wow, that's a lot of shoes! But you mentioned Milan was noisier and busier—what did you mean by that?", + "total_duration": 51.20829931972789, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, Barbara, welcome back. You look great.", + "original_text": "Hello, Barbara, welcome back. You look great.", + "start_time": 0, + "end_time": 2.75156462585034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Rod, it's lovely to see you again.", + "original_text": "Rod, it's lovely to see you again.", + "start_time": 3.272729779200624, + "end_time": 5.66438510799881, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_1_B.wav", + "silence_duration": 0.5211651533502839, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How was your trip?", + "original_text": "How was your trip?", + "start_time": 6.222668252348356, + "end_time": 7.221126302234977, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_2_A.wav", + "silence_duration": 0.5582831443495462, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fine but tiring. Milan was interesting, it's bigger than I expected, noisier and", + "original_text": "Fine but tiring. Milan was interesting, it's bigger than I expected, noisier and [interrupt] busier than I imagined, especially in the city center where the streets were constantly packed with people rushing to work and tourists exploring the historic landmarks.", + "start_time": 7.651113443176085, + "end_time": 20.422088499865428, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_3_B.wav", + "silence_duration": 0.4299871409411072, + "is_interrupted": true, + "text_after_interrupt": "busier than I imagined, especially in the city center where the streets were constantly packed with people rushing to work and tourists exploring the historic landmarks." + }, + { + "speaker": "A", + "text": "Sorry to cut you off, but did you manage to visit Florence as well?", + "original_text": "Sorry to cut you off, but did you manage to visit Florence as well?", + "start_time": 13.200682604173817, + "end_time": 17.473154259502614, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_4_A.wav", + "silence_duration": 0.4351564240286421, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I didn't go there. Have you been there?", + "original_text": "Well, I didn't go there. Have you been there?", + "start_time": 20.77478790203359, + "end_time": 23.189663185480303, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_5_B.wav", + "silence_duration": 0.3526994021681631, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, I've never been to Italy. I'd really like to go to Roma. Well, the cars are in the car park. Is this all your luggage?", + "original_text": "No, I've never been to Italy. I'd really like to go to Roma. Well, the cars are in the car park. Is this all your luggage?", + "start_time": 23.51931485192087, + "end_time": 31.79722868412042, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_6_A.wav", + "silence_duration": 0.329651666440567, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, but the suitcase is very heavy.", + "original_text": "Yes, but the suitcase is very heavy.", + "start_time": 32.196724380492356, + "end_time": 34.14720057096854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_7_B.wav", + "silence_duration": 0.39949569637193544, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Barbara, what's in it? Books or", + "original_text": "Barbara, what's in it? Books or [interrupt] souvenirs from all the amazing shops you must have visited during your time in Milan?", + "start_time": 34.666508239085324, + "end_time": 41.620884656318886, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_8_A.wav", + "silence_duration": 0.5193076681167836, + "is_interrupted": true, + "text_after_interrupt": "souvenirs from all the amazing shops you must have visited during your time in Milan?" + }, + { + "speaker": "B", + "text": "Just 20 pairs of shoes.", + "original_text": "Just 20 pairs of shoes.", + "start_time": 42.59570644448001, + "end_time": 44.18627333790405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_9_B.wav", + "silence_duration": 0.5547321337410251, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh wow, that's a lot of shoes! But you mentioned Milan was noisier and busier—what did you mean by that?", + "original_text": "Oh wow, that's a lot of shoes! But you mentioned Milan was noisier and busier—what did you mean by that?", + "start_time": 44.53259786062069, + "end_time": 51.20833482207194, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--333/temp/line_10_A.wav", + "silence_duration": 0.34632452271664343, + "is_interrupted": false + } + ] + }, + "DialogSum--val--335": { + "original_text": "A: Well, it WAS going to be a surprise, but look in the back of the [interrupt] truck. There's something special back there for you - a beautiful golden retriever puppy with the most adorable face you've ever seen!\nB: Wait, are you serious? You bought a dog? Without even asking me first?\nA: I was just about to show you. Look in the back of the truck.\nB: What?\nA: Ah, ha, hah. Speechless. I knew you'd love him.\nB: That thing? That dog's as big as a horse. He probably eats like one, too.\nA: Ah, but he's sure friendly. And someone was giving him away at the supermarket, and I... I... I couldn't let that poor thing pass another day without a loving home.\nB: Whatever. Where was I? Eighteen dollars and nineteen cents ($18.19) for twenty-four cans of tomato juice? You don't even like that stuff!\nA: Ahhhh. Not yet. I've decided to change my eating habits.\nB: Hold on, before we move on—what were you saying about the dog? How did you end up with him?\nA: Oh, right. I was saying that someone at the supermarket was giving him away, and I couldn't resist bringing him home.", + "cleaned_text": "A:Well, it WAS going to be a surprise, but look in the back of the truck. There's something special back there for you - a beautiful golden retriever puppy with the most adorable face you've ever seen!\nB: Wait, are you serious? You bought a dog? Without even asking me first?\nA: I was just about to show you. Look in the back of the truck.\nB: What?\nA: Ah, ha, hah. Speechless. I knew you'd love him.\nB: That thing? That dog's as big as a horse. He probably eats like one, too.\nA: Ah, but he's sure friendly. And someone was giving him away at the supermarket, and I... I... I couldn't let that poor thing pass another day without a loving home.\nB: Whatever. Where was I? Eighteen dollars and nineteen cents ($18.19) for twenty-four cans of tomato juice? You don't even like that stuff!\nA: Ahhhh. Not yet. I've decided to change my eating habits.\nB: Hold on, before we move on—what were you saying about the dog? How did you end up with him?\nA: Oh, right. I was saying that someone at the supermarket was giving him away, and I couldn't resist bringing him home.", + "total_duration": 60.895873015873015, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Well, it WAS going to be a surprise, but look in the back of the", + "original_text": "Well, it WAS going to be a surprise, but look in the back of the [interrupt] truck. There's something special back there for you - a beautiful golden retriever puppy with the most adorable face you've ever seen!", + "start_time": 0, + "end_time": 12.87546485260771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "truck. There's something special back there for you - a beautiful golden retriever puppy with the most adorable face you've ever seen!" + }, + { + "speaker": "B", + "text": "Wait, are you serious? You bought a dog? Without even asking me first?", + "original_text": "Wait, are you serious? You bought a dog? Without even asking me first?", + "start_time": 4.4117913832199545, + "end_time": 8.626213151927438, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_1_B.wav", + "silence_duration": 0.487872778263373, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was just about to show you. Look in the back of the truck.", + "original_text": "I was just about to show you. Look in the back of the truck.", + "start_time": 13.469039135611315, + "end_time": 16.77788267302628, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_2_A.wav", + "silence_duration": 0.5935742830036039, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What?", + "original_text": "What?", + "start_time": 17.24297621094174, + "end_time": 17.742205235885052, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_3_B.wav", + "silence_duration": 0.46509353791545993, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah, ha, hah. Speechless. I knew you'd love him.", + "original_text": "Ah, ha, hah. Speechless. I knew you'd love him.", + "start_time": 18.078097310984734, + "end_time": 21.352110916426913, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_4_A.wav", + "silence_duration": 0.3358920750996825, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That thing? That dog's as big as a horse. He probably eats like one, too.", + "original_text": "That thing? That dog's as big as a horse. He probably eats like one, too.", + "start_time": 21.81058973851371, + "end_time": 25.630272278196248, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_5_B.wav", + "silence_duration": 0.4584788220867956, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah, but he's sure friendly. And someone was giving him away at the supermarket, and I... I... I couldn't let that poor thing pass another day without a loving home.", + "original_text": "Ah, but he's sure friendly. And someone was giving him away at the supermarket, and I... I... I couldn't let that poor thing pass another day without a loving home.", + "start_time": 26.114950725443848, + "end_time": 36.64520015855042, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_6_A.wav", + "silence_duration": 0.484678447247598, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Whatever. Where was I? Eighteen dollars and nineteen cents ($18.19) for twenty-four cans of tomato juice? You don't even like that stuff!", + "original_text": "Whatever. Where was I? Eighteen dollars and nineteen cents ($18.19) for twenty-four cans of tomato juice? You don't even like that stuff!", + "start_time": 36.95678232893378, + "end_time": 45.315966002403165, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_7_B.wav", + "silence_duration": 0.31158217038335606, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ahhhh. Not yet. I've decided to change my eating habits.", + "original_text": "Ahhhh. Not yet. I've decided to change my eating habits.", + "start_time": 45.656978113533725, + "end_time": 49.56954047181037, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_8_A.wav", + "silence_duration": 0.34101211113056046, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hold on, before we move on—what were you saying about the dog? How did you end up with him?", + "original_text": "Hold on, before we move on—what were you saying about the dog? How did you end up with him?", + "start_time": 49.877988487672326, + "end_time": 54.11563021102833, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_9_B.wav", + "silence_duration": 0.30844801586195847, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right. I was saying that someone at the supermarket was giving him away, and I couldn't resist bringing him home.", + "original_text": "Oh, right. I was saying that someone at the supermarket was giving him away, and I couldn't resist bringing him home.", + "start_time": 54.55684330540995, + "end_time": 60.89589092445757, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--335/temp/line_10_A.wav", + "silence_duration": 0.4412130943816137, + "is_interrupted": false + } + ] + }, + "DialogSum--val--336": { + "original_text": "A: Err. what about the next two days? \nB: Let me see. Tomorrow at 8:30 a.m. in the meeting room, meet managers from 4 departments. At lunch, host Mr. Turner from the MG Company. Nothing special in the afternoon and evening. You can have a good rest. \nA: Mmm, not bad. \nB: But the day after tomorrow you'll have a busy day. Visit the products exhibition in the morning, have a quick lunch, and attend your management classes at 1:30 [interrupt] which will cover some new strategies we've been discussing and provide hands-on exercises to implement them effectively in our current projects.\nA: Wait, about the products exhibition—do I need to prepare anything specific for that? \nB: No special preparation needed, just your presence. As I was saying, your management classes are from 1:30 through to 5:00. Don't forget the party at the Century Palace at 6:00. The whole of your family are going [interrupt] and it might be a good idea to prepare a brief speech since the CEO will be expecting a few words from you about our recent successes.\nA: Right, and the party—should I be aware of anything particular for that?", + "cleaned_text": "A: Err. what about the next two days? \nB: Let me see. Tomorrow at 8:30 a.m. in the meeting room, meet managers from 4 departments. At lunch, host Mr. Turner from the MG Company. Nothing special in the afternoon and evening. You can have a good rest. \nA: Mmm, not bad. \nB:But the day after tomorrow you'll have a busy day. Visit the products exhibition in the morning, have a quick lunch, and attend your management classes at 1:30 which will cover some new strategies we've been discussing and provide hands-on exercises to implement them effectively in our current projects.\nA: Wait, about the products exhibition—do I need to prepare anything specific for that? \nB:No special preparation needed, just your presence. As I was saying, your management classes are from 1:30 through to 5:00. Don't forget the party at the Century Palace at 6:00. The whole of your family are going and it might be a good idea to prepare a brief speech since the CEO will be expecting a few words from you about our recent successes.\nA: Right, and the party—should I be aware of anything particular for that?", + "total_duration": 54.4291156462585, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Err. what about the next two days?", + "original_text": "Err. what about the next two days?", + "start_time": 0, + "end_time": 2.4961451247165534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let me see. Tomorrow at 8:30 a.m. in the meeting room, meet managers from 4 departments. At lunch, host Mr. Turner from the MG Company. Nothing special in the afternoon and evening. You can have a good rest.", + "original_text": "Let me see. Tomorrow at 8:30 a.m. in the meeting room, meet managers from 4 departments. At lunch, host Mr. Turner from the MG Company. Nothing special in the afternoon and evening. You can have a good rest.", + "start_time": 2.8450057793599997, + "end_time": 14.733622559405351, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/temp/line_1_B.wav", + "silence_duration": 0.34886065464344634, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Mmm, not bad.", + "original_text": "Mmm, not bad.", + "start_time": 15.150229786595121, + "end_time": 16.647916861425053, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/temp/line_2_A.wav", + "silence_duration": 0.4166072271897695, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But the day after tomorrow you'll have a busy day. Visit the products exhibition in the morning, have a quick lunch, and attend your management classes at 1:30", + "original_text": "But the day after tomorrow you'll have a busy day. Visit the products exhibition in the morning, have a quick lunch, and attend your management classes at 1:30 [interrupt] which will cover some new strategies we've been discussing and provide hands-on exercises to implement them effectively in our current projects.", + "start_time": 17.009403897192342, + "end_time": 32.8221930128386, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/temp/line_3_B.wav", + "silence_duration": 0.3614870357672889, + "is_interrupted": true, + "text_after_interrupt": "which will cover some new strategies we've been discussing and provide hands-on exercises to implement them effectively in our current projects." + }, + { + "speaker": "A", + "text": "Wait, about the products exhibition—do I need to prepare anything specific for that?", + "original_text": "Wait, about the products exhibition—do I need to prepare anything specific for that?", + "start_time": 24.98545831896105, + "end_time": 29.67588915796332, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/temp/line_4_A.wav", + "silence_duration": 0.43420144968197305, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No special preparation needed, just your presence. As I was saying, your management classes are from 1:30 through to 5:00. Don't forget the party at the Century Palace at 6:00. The whole of your family are going", + "original_text": "No special preparation needed, just your presence. As I was saying, your management classes are from 1:30 through to 5:00. Don't forget the party at the Century Palace at 6:00. The whole of your family are going [interrupt] and it might be a good idea to prepare a brief speech since the CEO will be expecting a few words from you about our recent successes.", + "start_time": 33.278124353781635, + "end_time": 51.714768344711345, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/temp/line_5_B.wav", + "silence_duration": 0.455931340943035, + "is_interrupted": true, + "text_after_interrupt": "and it might be a good idea to prepare a brief speech since the CEO will be expecting a few words from you about our recent successes." + }, + { + "speaker": "A", + "text": "Right, and the party—should I be aware of anything particular for that?", + "original_text": "Right, and the party—should I be aware of anything particular for that?", + "start_time": 50.21471566755406, + "end_time": 54.42913743626154, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--336/temp/line_6_A.wav", + "silence_duration": 0.51155512358773, + "is_interrupted": false + } + ] + }, + "DialogSum--val--337": { + "original_text": "A: That's my alarm. I have an appointment back at the hotel at eleven o'clock. \nB: Is it eleven already? \nA: No, no. Actually, it's 10:30. I set my watch half an hour [interrupt] ahead so I always feel like I have a buffer and can account for unexpected delays like traffic or last-minute preparations that might otherwise make me late.\nB: Oh, I do that too sometimes! It helps me stay on top of things. But do you always manage to keep up with that, or do you find it confusing at times? \nA: It can be a bit confusing, but it usually works for me. Speaking of which, I haven't mentioned— \nB: You're never late, are you? \nA: I try not to be, but I was about to say, I haven't mentioned yet why I set it that way. It's just a trick to make sure I'm always ahead of schedule.", + "cleaned_text": "A: That's my alarm. I have an appointment back at the hotel at eleven o'clock. \nB: Is it eleven already? \nA:No, no. Actually, it's 10:30. I set my watch half an hour ahead so I always feel like I have a buffer and can account for unexpected delays like traffic or last-minute preparations that might otherwise make me late.\nB: Oh, I do that too sometimes! It helps me stay on top of things. But do you always manage to keep up with that, or do you find it confusing at times? \nA: It can be a bit confusing, but it usually works for me. Speaking of which, I haven't mentioned— \nB: You're never late, are you? \nA: I try not to be, but I was about to say, I haven't mentioned yet why I set it that way. It's just a trick to make sure I'm always ahead of schedule.", + "total_duration": 38.81292517006803, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "That's my alarm. I have an appointment back at the hotel at eleven o'clock.", + "original_text": "That's my alarm. I have an appointment back at the hotel at eleven o'clock.", + "start_time": 0, + "end_time": 4.133151927437642, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is it eleven already?", + "original_text": "Is it eleven already?", + "start_time": 4.4345067969122525, + "end_time": 5.630334461311346, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/temp/line_1_B.wav", + "silence_duration": 0.30135486947461076, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, no. Actually, it's 10:30. I set my watch half an hour", + "original_text": "No, no. Actually, it's 10:30. I set my watch half an hour [interrupt] ahead so I always feel like I have a buffer and can account for unexpected delays like traffic or last-minute preparations that might otherwise make me late.", + "start_time": 5.9608851816848185, + "end_time": 19.939297880097516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/temp/line_2_A.wav", + "silence_duration": 0.3305507203734722, + "is_interrupted": true, + "text_after_interrupt": "ahead so I always feel like I have a buffer and can account for unexpected delays like traffic or last-minute preparations that might otherwise make me late." + }, + { + "speaker": "B", + "text": "Oh, I do that too sometimes! It helps me stay on top of things. But do you always manage to keep up with that, or do you find it confusing at times?", + "original_text": "Oh, I do that too sometimes! It helps me stay on top of things. But do you always manage to keep up with that, or do you find it confusing at times?", + "start_time": 10.570046179417245, + "end_time": 18.00043166694559, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/temp/line_3_B.wav", + "silence_duration": 0.34746968100747416, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It can be a bit confusing, but it usually works for me. Speaking of which, I haven't mentioned—", + "original_text": "It can be a bit confusing, but it usually works for me. Speaking of which, I haven't mentioned—", + "start_time": 20.39480800241391, + "end_time": 26.43199621103069, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/temp/line_4_A.wav", + "silence_duration": 0.4555101223163931, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You're never late, are you?", + "original_text": "You're never late, are you?", + "start_time": 26.734054861421715, + "end_time": 27.848612684550968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/temp/line_5_B.wav", + "silence_duration": 0.30205865039102603, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I try not to be, but I was about to say, I haven't mentioned yet why I set it that way. It's just a trick to make sure I'm always ahead of schedule.", + "original_text": "I try not to be, but I was about to say, I haven't mentioned yet why I set it that way. It's just a trick to make sure I'm always ahead of schedule.", + "start_time": 28.3407403731496, + "end_time": 38.81293991963486, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--337/temp/line_6_A.wav", + "silence_duration": 0.4921276885986332, + "is_interrupted": false + } + ] + }, + "DialogSum--val--338": { + "original_text": "A: Excuse me, I'd like to make a suit of this material. \nB: Well, sir. Can I take your measurements [interrupt]? I just need to ensure everything is accurate before we proceed with the cutting and stitching process, which requires precise measurements for the perfect fit.\nA: Oh, before we start, should I take off my coat? \nB: That'll be helpful. All right, thank you. \nA: Please make a single-breasted. \nB: No problem. If you'll wait one moment, I'll make out your [interrupt] order form with all the necessary specifications including fabric choice, style preferences, and delivery timeline for your review and approval.\nA: Sorry to interrupt, but how much does it cost? \nB: Let me see, with padding and lining cloth, it comes to 357 dollars altogether. I was just about to make out your receipt. \nA: All right. When can I get it? \nB: In two weeks.", + "cleaned_text": "A: Excuse me, I'd like to make a suit of this material. \nB:Well, sir. Can I take your measurements ? I just need to ensure everything is accurate before we proceed with the cutting and stitching process, which requires precise measurements for the perfect fit.\nA: Oh, before we start, should I take off my coat? \nB: That'll be helpful. All right, thank you. \nA: Please make a single-breasted. \nB:No problem. If you'll wait one moment, I'll make out your order form with all the necessary specifications including fabric choice, style preferences, and delivery timeline for your review and approval.\nA: Sorry to interrupt, but how much does it cost? \nB: Let me see, with padding and lining cloth, it comes to 357 dollars altogether. I was just about to make out your receipt. \nA: All right. When can I get it? \nB: In two weeks.", + "total_duration": 41.14054421768707, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, I'd like to make a suit of this material.", + "original_text": "Excuse me, I'd like to make a suit of this material.", + "start_time": 0, + "end_time": 3.076643990929705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, sir. Can I take your measurements", + "original_text": "Well, sir. Can I take your measurements [interrupt]? I just need to ensure everything is accurate before we proceed with the cutting and stitching process, which requires precise measurements for the perfect fit.", + "start_time": 3.582202601312414, + "end_time": 13.973132306527834, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_1_B.wav", + "silence_duration": 0.5055586103827089, + "is_interrupted": true, + "text_after_interrupt": "? I just need to ensure everything is accurate before we proceed with the cutting and stitching process, which requires precise measurements for the perfect fit." + }, + { + "speaker": "A", + "text": "Oh, before we start, should I take off my coat?", + "original_text": "Oh, before we start, should I take off my coat?", + "start_time": 6.171227544623072, + "end_time": 9.050501921040306, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_2_A.wav", + "silence_duration": 0.5534730189045973, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That'll be helpful. All right, thank you.", + "original_text": "That'll be helpful. All right, thank you.", + "start_time": 14.307005481282909, + "end_time": 15.978842215976787, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_3_B.wav", + "silence_duration": 0.33387317475507416, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Please make a single-breasted.", + "original_text": "Please make a single-breasted.", + "start_time": 16.364879063783047, + "end_time": 18.164425549043816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_4_A.wav", + "silence_duration": 0.3860368478062584, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem. If you'll wait one moment, I'll make out your", + "original_text": "No problem. If you'll wait one moment, I'll make out your [interrupt] order form with all the necessary specifications including fabric choice, style preferences, and delivery timeline for your review and approval.", + "start_time": 18.54527557211448, + "end_time": 29.93466332721652, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_5_B.wav", + "silence_duration": 0.3808500230706644, + "is_interrupted": true, + "text_after_interrupt": "order form with all the necessary specifications including fabric choice, style preferences, and delivery timeline for your review and approval." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but how much does it cost?", + "original_text": "Sorry to interrupt, but how much does it cost?", + "start_time": 25.83026011417941, + "end_time": 28.906904105109113, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_6_A.wav", + "silence_duration": 0.3178293647644626, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let me see, with padding and lining cloth, it comes to 357 dollars altogether. I was just about to make out your receipt.", + "original_text": "Let me see, with padding and lining cloth, it comes to 357 dollars altogether. I was just about to make out your receipt.", + "start_time": 30.389459731261155, + "end_time": 37.5992556496285, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_7_B.wav", + "silence_duration": 0.45479640404463506, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "All right. When can I get it?", + "original_text": "All right. When can I get it?", + "start_time": 37.96410470572949, + "end_time": 39.79848112296305, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_8_A.wav", + "silence_duration": 0.3648490561009866, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "In two weeks.", + "original_text": "In two weeks.", + "start_time": 40.21175939469707, + "end_time": 41.14055758063811, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--338/temp/line_9_B.wav", + "silence_duration": 0.413278271734025, + "is_interrupted": false + } + ] + }, + "DialogSum--val--339": { + "original_text": "A: Did you go to university? \nB: Yes, I graduated with a BA in English from Qingdao University. \nA: When did you graduate? \nB: Just a few years ago. What about [interrupt] your plans after high school? I'm particularly interested in hearing about your academic aspirations and how you're navigating the decision-making process. \nA: Sorry to interrupt, but I'm curious—why did you choose Qingdao University for your BA? \nB: Oh, it was mainly because of its strong English program and the location. But you were asking about my graduation, right? \nA: Yes, I was. When did you graduate? \nB: Just a few years ago. What about you? \nA: I just graduated from high school. \nB: Are you planning on going to university? \nA: I'd like to get a BA, but I don't know where I should go. \nB: Have you applied anywhere yet? \nA: Yes, I've applied to four universities and have been accepted into all of them. \nB: Congratulations! Which one is the cheapest? \nA: The tuition is the same for all of them. \nB: Which one has the most interesting course offerings?", + "cleaned_text": "A: Did you go to university? \nB: Yes, I graduated with a BA in English from Qingdao University. \nA: When did you graduate? \nB:Just a few years ago. What about your plans after high school? I'm particularly interested in hearing about your academic aspirations and how you're navigating the decision-making process.\nA: Sorry to interrupt, but I'm curious—why did you choose Qingdao University for your BA? \nB: Oh, it was mainly because of its strong English program and the location. But you were asking about my graduation, right? \nA: Yes, I was. When did you graduate? \nB: Just a few years ago. What about you? \nA: I just graduated from high school. \nB: Are you planning on going to university? \nA: I'd like to get a BA, but I don't know where I should go. \nB: Have you applied anywhere yet? \nA: Yes, I've applied to four universities and have been accepted into all of them. \nB: Congratulations! Which one is the cheapest? \nA: The tuition is the same for all of them. \nB: Which one has the most interesting course offerings?", + "total_duration": 56.108979591836736, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Did you go to university?", + "original_text": "Did you go to university?", + "start_time": 0, + "end_time": 1.6370068027210884, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I graduated with a BA in English from Qingdao University.", + "original_text": "Yes, I graduated with a BA in English from Qingdao University.", + "start_time": 2.1172649854175187, + "end_time": 5.855677683830217, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_1_B.wav", + "silence_duration": 0.4802581826964301, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "When did you graduate?", + "original_text": "When did you graduate?", + "start_time": 6.184277750918942, + "end_time": 7.519425143209191, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_2_A.wav", + "silence_duration": 0.3286000670887244, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just a few years ago. What about", + "original_text": "Just a few years ago. What about [interrupt] your plans after high school? I'm particularly interested in hearing about your academic aspirations and how you're navigating the decision-making process.", + "start_time": 8.076890061274774, + "end_time": 18.90899890481219, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_3_B.wav", + "silence_duration": 0.5574649180655832, + "is_interrupted": true, + "text_after_interrupt": "your plans after high school? I'm particularly interested in hearing about your academic aspirations and how you're navigating the decision-making process." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but I'm curious—why did you choose Qingdao University for your BA?", + "original_text": "Sorry to interrupt, but I'm curious—why did you choose Qingdao University for your BA?", + "start_time": 10.247955820911962, + "end_time": 16.4244637574199, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_4_A.wav", + "silence_duration": 0.3212840379259968, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, it was mainly because of its strong English program and the location. But you were asking about my graduation, right?", + "original_text": "Oh, it was mainly because of its strong English program and the location. But you were asking about my graduation, right?", + "start_time": 19.472434796357646, + "end_time": 26.090121871187577, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_5_B.wav", + "silence_duration": 0.5634358915454571, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I was. When did you graduate?", + "original_text": "Yes, I was. When did you graduate?", + "start_time": 26.589822210387467, + "end_time": 29.30655690426502, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_6_A.wav", + "silence_duration": 0.49970033919988865, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just a few years ago. What about you?", + "original_text": "Just a few years ago. What about you?", + "start_time": 29.677338068957678, + "end_time": 31.534934440839763, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_7_B.wav", + "silence_duration": 0.37078116469265715, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I just graduated from high school.", + "original_text": "I just graduated from high school.", + "start_time": 31.963135586401002, + "end_time": 33.91361177687719, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_8_A.wav", + "silence_duration": 0.4282011455612389, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Are you planning on going to university?", + "original_text": "Are you planning on going to university?", + "start_time": 34.28569522333958, + "end_time": 36.2593913684643, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_9_B.wav", + "silence_duration": 0.3720834464623898, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'd like to get a BA, but I don't know where I should go.", + "original_text": "I'd like to get a BA, but I don't know where I should go.", + "start_time": 36.73663139641453, + "end_time": 39.95259511523539, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_10_A.wav", + "silence_duration": 0.4772400279502338, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Have you applied anywhere yet?", + "original_text": "Have you applied anywhere yet?", + "start_time": 40.51541676986598, + "end_time": 42.12920361793854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_11_B.wav", + "silence_duration": 0.5628216546305873, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I've applied to four universities and have been accepted into all of them.", + "original_text": "Yes, I've applied to four universities and have been accepted into all of them.", + "start_time": 42.527788424056055, + "end_time": 46.99762969389732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_12_A.wav", + "silence_duration": 0.3985848061175154, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Congratulations! Which one is the cheapest?", + "original_text": "Congratulations! Which one is the cheapest?", + "start_time": 47.48513520156102, + "end_time": 50.294749714032676, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_13_B.wav", + "silence_duration": 0.48750550766370077, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The tuition is the same for all of them.", + "original_text": "The tuition is the same for all of them.", + "start_time": 50.8498785043389, + "end_time": 53.28797374243414, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_14_A.wav", + "silence_duration": 0.5551287903062289, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Which one has the most interesting course offerings?", + "original_text": "Which one has the most interesting course offerings?", + "start_time": 53.63609396580989, + "end_time": 56.109019135877915, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--339/temp/line_15_B.wav", + "silence_duration": 0.3481202233757518, + "is_interrupted": false + } + ] + }, + "DialogSum--val--340": { + "original_text": "A: Have you read the new rules about using cell phone at work? \nB: Yes, not bad. Like turn your cell phone ringer off and find a private place to make calls which it's showing your respect to your [interrupt] co-workers and maintaining a professional environment by minimizing distractions and fostering better focus on collaborative tasks. \nA: Sorry to interrupt, but I was just thinking, what about the rule on not bringing your cell phone to meetings? I think it is not reasonable. What if there are some important calls? \nB: Well, this one is not compulsory. It is just a suggestion. But you mentioned respect to co-workers earlier—what were you going to say about that? \n\n", + "cleaned_text": "A: Have you read the new rules about using cell phone at work? \nB:Yes, not bad. Like turn your cell phone ringer off and find a private place to make calls which it's showing your respect to your co-workers and maintaining a professional environment by minimizing distractions and fostering better focus on collaborative tasks.\nA: Sorry to interrupt, but I was just thinking, what about the rule on not bringing your cell phone to meetings? I think it is not reasonable. What if there are some important calls? \nB: Well, this one is not compulsory. It is just a suggestion. But you mentioned respect to co-workers earlier—what were you going to say about that? \n\n", + "total_duration": 28.72331065759637, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--340/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--340/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--340/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you read the new rules about using cell phone at work?", + "original_text": "Have you read the new rules about using cell phone at work?", + "start_time": 0, + "end_time": 3.053424036281179, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--340/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, not bad. Like turn your cell phone ringer off and find a private place to make calls which it's showing your respect to your", + "original_text": "Yes, not bad. Like turn your cell phone ringer off and find a private place to make calls which it's showing your respect to your [interrupt] co-workers and maintaining a professional environment by minimizing distractions and fostering better focus on collaborative tasks.", + "start_time": 3.5002005171029253, + "end_time": 16.97938419057231, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--340/temp/line_1_B.wav", + "silence_duration": 0.44677648082174626, + "is_interrupted": true, + "text_after_interrupt": "co-workers and maintaining a professional environment by minimizing distractions and fostering better focus on collaborative tasks." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but I was just thinking, what about the rule on not bringing your cell phone to meetings? I think it is not reasonable. What if there are some important calls?", + "original_text": "Sorry to interrupt, but I was just thinking, what about the rule on not bringing your cell phone to meetings? I think it is not reasonable. What if there are some important calls?", + "start_time": 10.489406866309274, + "end_time": 21.042876254064375, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--340/temp/line_2_A.wav", + "silence_duration": 0.3207631409668338, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, this one is not compulsory. It is just a suggestion. But you mentioned respect to co-workers earlier—what were you going to say about that?", + "original_text": "Well, this one is not compulsory. It is just a suggestion. But you mentioned respect to co-workers earlier—what were you going to say about that?", + "start_time": 21.467106202380013, + "end_time": 28.723342030044414, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--340/temp/line_3_B.wav", + "silence_duration": 0.42422994831563887, + "is_interrupted": false + } + ] + }, + "DialogSum--val--341": { + "original_text": "A: Hi! Is that the new laptop you brought last week? It looks very nice. \nB: Yes, it is. Thanks. I'm just surfing on the internet. \nA: Here? In this cafe? How can you [interrupt] connect to the internet? I didn't see any cables and I'm really curious about how this wireless technology actually works. Does it use some kind of invisible signals? \nB: Oh, this cafe offers a wireless internet connection. That means I can get on the net for free while I'm here. Of course, I have to buy a cup of coffee! \nA: That's great. Can you do it anywhere? \nB: No, you can only do it when the cafe offers a wireless connection. There are only about 10 or 12 places that offer it in this city. \nA: So, what programs do you have on your laptop? \nB: I've got all the usual ones for word processing and then I have a few for creating and editing [interrupt] videos as well. I find them really useful for my projects, especially when I need to add special effects or combine different clips into one cohesive story. \nA: Editing photographs? I remember you mentioned before that you love photography. It's very useful for you to be able to download photos from your digital camera. Then you attach the picture files to emails and send them to anyone, anywhere, at anytime! \nB: Absolutely, it's wonderful! By the way, I was about to tell you I also have some software for video editing. Would you like to see some photos that I took recently?", + "cleaned_text": "A: Hi! Is that the new laptop you brought last week? It looks very nice. \nB: Yes, it is. Thanks. I'm just surfing on the internet. \nA:Here? In this cafe? How can you connect to the internet? I didn't see any cables and I'm really curious about how this wireless technology actually works. Does it use some kind of invisible signals?\nB: Oh, this cafe offers a wireless internet connection. That means I can get on the net for free while I'm here. Of course, I have to buy a cup of coffee! \nA: That's great. Can you do it anywhere? \nB: No, you can only do it when the cafe offers a wireless connection. There are only about 10 or 12 places that offer it in this city. \nA: So, what programs do you have on your laptop? \nB:I've got all the usual ones for word processing and then I have a few for creating and editing videos as well. I find them really useful for my projects, especially when I need to add special effects or combine different clips into one cohesive story.\nA: Editing photographs? I remember you mentioned before that you love photography. It's very useful for you to be able to download photos from your digital camera. Then you attach the picture files to emails and send them to anyone, anywhere, at anytime! \nB: Absolutely, it's wonderful! By the way, I was about to tell you I also have some software for video editing. Would you like to see some photos that I took recently?", + "total_duration": 74.399410430839, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi! Is that the new laptop you brought last week? It looks very nice.", + "original_text": "Hi! Is that the new laptop you brought last week? It looks very nice.", + "start_time": 0, + "end_time": 5.050340136054421, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it is. Thanks. I'm just surfing on the internet.", + "original_text": "Yes, it is. Thanks. I'm just surfing on the internet.", + "start_time": 5.463863622272958, + "end_time": 9.202276320685657, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_1_B.wav", + "silence_duration": 0.4135234862185375, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Here? In this cafe? How can you", + "original_text": "Here? In this cafe? How can you [interrupt] connect to the internet? I didn't see any cables and I'm really curious about how this wireless technology actually works. Does it use some kind of invisible signals?", + "start_time": 9.673401521668263, + "end_time": 22.943605603300917, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_2_A.wav", + "silence_duration": 0.4711252009826048, + "is_interrupted": true, + "text_after_interrupt": "connect to the internet? I didn't see any cables and I'm really curious about how this wireless technology actually works. Does it use some kind of invisible signals?" + }, + { + "speaker": "B", + "text": "Oh, this cafe offers a wireless internet connection. That means I can get on the net for free while I'm here. Of course, I have to buy a cup of coffee!", + "original_text": "Oh, this cafe offers a wireless internet connection. That means I can get on the net for free while I'm here. Of course, I have to buy a cup of coffee!", + "start_time": 11.76319744003561, + "end_time": 19.994671362938107, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_3_B.wav", + "silence_duration": 0.38355017326305973, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's great. Can you do it anywhere?", + "original_text": "That's great. Can you do it anywhere?", + "start_time": 23.321424997497015, + "end_time": 25.689860371646674, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_4_A.wav", + "silence_duration": 0.37781939419609917, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, you can only do it when the cafe offers a wireless connection. There are only about 10 or 12 places that offer it in this city.", + "original_text": "No, you can only do it when the cafe offers a wireless connection. There are only about 10 or 12 places that offer it in this city.", + "start_time": 26.166718093004757, + "end_time": 33.225584306156684, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_5_B.wav", + "silence_duration": 0.47685772135808424, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So, what programs do you have on your laptop?", + "original_text": "So, what programs do you have on your laptop?", + "start_time": 33.59534940464331, + "end_time": 36.12632446133265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_6_A.wav", + "silence_duration": 0.36976509848662187, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've got all the usual ones for word processing and then I have a few for creating and editing", + "original_text": "I've got all the usual ones for word processing and then I have a few for creating and editing [interrupt] videos as well. I find them really useful for my projects, especially when I need to add special effects or combine different clips into one cohesive story.", + "start_time": 36.69950882841559, + "end_time": 49.71429340891446, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_7_B.wav", + "silence_duration": 0.5731843670829371, + "is_interrupted": true, + "text_after_interrupt": "videos as well. I find them really useful for my projects, especially when I need to add special effects or combine different clips into one cohesive story." + }, + { + "speaker": "A", + "text": "Editing photographs? I remember you mentioned before that you love photography. It's very useful for you to be able to download photos from your digital camera. Then you attach the picture files to emails and send them to anyone, anywhere, at anytime!", + "original_text": "Editing photographs? I remember you mentioned before that you love photography. It's very useful for you to be able to download photos from your digital camera. Then you attach the picture files to emails and send them to anyone, anywhere, at anytime!", + "start_time": 49.819848353320374, + "end_time": 64.95925878415937, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_8_A.wav", + "silence_duration": 0.5765268452837535, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Absolutely, it's wonderful! By the way, I was about to tell you I also have some software for video editing. Would you like to see some photos that I took recently?", + "original_text": "Absolutely, it's wonderful! By the way, I was about to tell you I also have some software for video editing. Would you like to see some photos that I took recently?", + "start_time": 65.36685399303745, + "end_time": 74.3994163513141, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--341/temp/line_9_B.wav", + "silence_duration": 0.40759520887807205, + "is_interrupted": false + } + ] + }, + "DialogSum--val--343": { + "original_text": "A: Are you ready to order, sir? \nB: Yes. I'll have the beef stew for starters and my wife would like tomato soup. \nA: One beef stew and one tomato soup. What would you like for the main course? \nB: I'll have the Cayenne Pepper Steak and my wife would like the Fried Trout with [interrupt] a side of mashed potatoes and steamed vegetables, along with your house specialty sauce if that's possible, please. \nA: I'm afraid the trout is off. \nB: Oh dear. Err. . . What else do you recommend? \nA: The sole is very good. \nB: OK. I'll have that. Do you have any coleslaw? \nA: No, I'm sorry, we don't. \nB: Just give me a small mixed salad then. Same for me. \nA: Certainly. Oh, you were saying Fried Trout with something earlier? \nB: Oh yes, with mashed potatoes. But since the trout is off, we'll stick with the sole. Would you like something to drink? \nA: Yes, please. May I see the wine list?", + "cleaned_text": "A: Are you ready to order, sir? \nB: Yes. I'll have the beef stew for starters and my wife would like tomato soup. \nA: One beef stew and one tomato soup. What would you like for the main course? \nB:I'll have the Cayenne Pepper Steak and my wife would like the Fried Trout with a side of mashed potatoes and steamed vegetables, along with your house specialty sauce if that's possible, please.\nA: I'm afraid the trout is off. \nB: Oh dear. Err. . . What else do you recommend? \nA: The sole is very good. \nB: OK. I'll have that. Do you have any coleslaw? \nA: No, I'm sorry, we don't. \nB: Just give me a small mixed salad then. Same for me. \nA: Certainly. Oh, you were saying Fried Trout with something earlier? \nB: Oh yes, with mashed potatoes. But since the trout is off, we'll stick with the sole. Would you like something to drink? \nA: Yes, please. May I see the wine list?", + "total_duration": 48.83061224489796, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you ready to order, sir?", + "original_text": "Are you ready to order, sir?", + "start_time": 0, + "end_time": 1.509297052154195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. I'll have the beef stew for starters and my wife would like tomato soup.", + "original_text": "Yes. I'll have the beef stew for starters and my wife would like tomato soup.", + "start_time": 2.0676812564364724, + "end_time": 6.026683524010169, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_1_B.wav", + "silence_duration": 0.5583842042822775, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "One beef stew and one tomato soup. What would you like for the main course?", + "original_text": "One beef stew and one tomato soup. What would you like for the main course?", + "start_time": 6.445189800384266, + "end_time": 11.298160321926215, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_2_A.wav", + "silence_duration": 0.41850627637409676, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll have the Cayenne Pepper Steak and my wife would like the Fried Trout with", + "original_text": "I'll have the Cayenne Pepper Steak and my wife would like the Fried Trout with [interrupt] a side of mashed potatoes and steamed vegetables, along with your house specialty sauce if that's possible, please.", + "start_time": 11.835299079425006, + "end_time": 20.415072322055394, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_3_B.wav", + "silence_duration": 0.5371387574987909, + "is_interrupted": true, + "text_after_interrupt": "a side of mashed potatoes and steamed vegetables, along with your house specialty sauce if that's possible, please." + }, + { + "speaker": "A", + "text": "I'm afraid the trout is off.", + "original_text": "I'm afraid the trout is off.", + "start_time": 15.144142616839972, + "end_time": 16.792759396885323, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_4_A.wav", + "silence_duration": 0.4445655372928857, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh dear. Err. . . What else do you recommend?", + "original_text": "Oh dear. Err. . . What else do you recommend?", + "start_time": 20.74462315888304, + "end_time": 23.658727467273064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_5_B.wav", + "silence_duration": 0.3295508368276475, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The sole is very good.", + "original_text": "The sole is very good.", + "start_time": 24.17130762639352, + "end_time": 25.6225547919264, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_6_A.wav", + "silence_duration": 0.5125801591204564, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. I'll have that. Do you have any coleslaw?", + "original_text": "OK. I'll have that. Do you have any coleslaw?", + "start_time": 25.995168570702376, + "end_time": 29.234352244171763, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_7_B.wav", + "silence_duration": 0.3726137787759739, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, I'm sorry, we don't.", + "original_text": "No, I'm sorry, we don't.", + "start_time": 29.765910768793375, + "end_time": 31.635117117999727, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_8_A.wav", + "silence_duration": 0.5315585246216125, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Just give me a small mixed salad then. Same for me.", + "original_text": "Just give me a small mixed salad then. Same for me.", + "start_time": 32.10319540965037, + "end_time": 34.93602987677055, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_9_B.wav", + "silence_duration": 0.4680782916506431, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Certainly. Oh, you were saying Fried Trout with something earlier?", + "original_text": "Certainly. Oh, you were saying Fried Trout with something earlier?", + "start_time": 35.38508398482196, + "end_time": 39.41374611634124, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_10_A.wav", + "silence_duration": 0.44905410805141616, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh yes, with mashed potatoes. But since the trout is off, we'll stick with the sole. Would you like something to drink?", + "original_text": "Oh yes, with mashed potatoes. But since the trout is off, we'll stick with the sole. Would you like something to drink?", + "start_time": 39.88843724418843, + "end_time": 45.57732613307732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_11_B.wav", + "silence_duration": 0.47469112784719736, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, please. May I see the wine list?", + "original_text": "Yes, please. May I see the wine list?", + "start_time": 46.05586447582843, + "end_time": 48.830649056327296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--343/temp/line_12_A.wav", + "silence_duration": 0.47853834275110774, + "is_interrupted": false + } + ] + }, + "DialogSum--val--344": { + "original_text": "A: Ah, that's the fourth ad that appears suddenly on my computer screen since I started working on my paper. It's so distracting.\nB: You can buy an app that will stop those ads.\nA: I can't afford to buy some fancy $10 software just so I can [interrupt] get a few more hours of peace while I work on this paper, especially when I'm already struggling to make ends meet as a student with limited financial resources.\nB: It's not that expensive. It's $1 per month.\nA: So that's $12 a year. But I still don't see the point if I can just close the ads manually.\nB: Is it going to take you a whole year to finish that essay?\nA: Well, no, Harriet. It'll be done in 3 weeks. But I'll be doing school work on this computer for 4 years before I graduate. I just don't want to commit to another expense right now.\nB: I think it's worth it, John. And if you spend $30, you don't have to [interrupt] worry about ads ever again because the software automatically updates itself and works across all your devices including your phone and tablet without any additional charges.\nA: Wait, $30? Does that mean I pay once and can use it forever, or is there some kind of catch? Because that sounds like a pretty good deal if it's true.", + "cleaned_text": "A: Ah, that's the fourth ad that appears suddenly on my computer screen since I started working on my paper. It's so distracting.\nB: You can buy an app that will stop those ads.\nA:I can't afford to buy some fancy $10 software just so I can get a few more hours of peace while I work on this paper, especially when I'm already struggling to make ends meet as a student with limited financial resources.\nB: It's not that expensive. It's $1 per month.\nA: So that's $12 a year. But I still don't see the point if I can just close the ads manually.\nB: Is it going to take you a whole year to finish that essay?\nA: Well, no, Harriet. It'll be done in 3 weeks. But I'll be doing school work on this computer for 4 years before I graduate. I just don't want to commit to another expense right now.\nB:I think it's worth it, John. And if you spend $30, you don't have to worry about ads ever again because the software automatically updates itself and works across all your devices including your phone and tablet without any additional charges.\nA: Wait, $30? Does that mean I pay once and can use it forever, or is there some kind of catch? Because that sounds like a pretty good deal if it's true.", + "total_duration": 63.42557823129252, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Ah, that's the fourth ad that appears suddenly on my computer screen since I started working on my paper. It's so distracting.", + "original_text": "Ah, that's the fourth ad that appears suddenly on my computer screen since I started working on my paper. It's so distracting.", + "start_time": 0, + "end_time": 7.349115646258503, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You can buy an app that will stop those ads.", + "original_text": "You can buy an app that will stop those ads.", + "start_time": 7.714129599624393, + "end_time": 9.931635268558633, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_1_B.wav", + "silence_duration": 0.36501395336588993, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I can't afford to buy some fancy $10 software just so I can", + "original_text": "I can't afford to buy some fancy $10 software just so I can [interrupt] get a few more hours of peace while I work on this paper, especially when I'm already struggling to make ends meet as a student with limited financial resources.", + "start_time": 10.471967494650318, + "end_time": 24.020811032065282, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_2_A.wav", + "silence_duration": 0.5403322260916846, + "is_interrupted": true, + "text_after_interrupt": "get a few more hours of peace while I work on this paper, especially when I'm already struggling to make ends meet as a student with limited financial resources." + }, + { + "speaker": "B", + "text": "It's not that expensive. It's $1 per month.", + "original_text": "It's not that expensive. It's $1 per month.", + "start_time": 14.744439149979115, + "end_time": 18.099722596691134, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_3_B.wav", + "silence_duration": 0.5976759389474726, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So that's $12 a year. But I still don't see the point if I can just close the ads manually.", + "original_text": "So that's $12 a year. But I still don't see the point if I can just close the ads manually.", + "start_time": 24.40102269093221, + "end_time": 30.97226985646509, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_4_A.wav", + "silence_duration": 0.38021165886692576, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is it going to take you a whole year to finish that essay?", + "original_text": "Is it going to take you a whole year to finish that essay?", + "start_time": 31.44202103666492, + "end_time": 34.07748588927263, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_5_B.wav", + "silence_duration": 0.46975118019982787, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, no, Harriet. It'll be done in 3 weeks. But I'll be doing school work on this computer for 4 years before I graduate. I just don't want to commit to another expense right now.", + "original_text": "Well, no, Harriet. It'll be done in 3 weeks. But I'll be doing school work on this computer for 4 years before I graduate. I just don't want to commit to another expense right now.", + "start_time": 34.487987771368594, + "end_time": 45.40136645617585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_6_A.wav", + "silence_duration": 0.4105018820959613, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think it's worth it, John. And if you spend $30, you don't have to", + "original_text": "I think it's worth it, John. And if you spend $30, you don't have to [interrupt] worry about ads ever again because the software automatically updates itself and works across all your devices including your phone and tablet without any additional charges.", + "start_time": 45.878701240523164, + "end_time": 59.114075390183025, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_7_B.wav", + "silence_duration": 0.477334784347311, + "is_interrupted": true, + "text_after_interrupt": "worry about ads ever again because the software automatically updates itself and works across all your devices including your phone and tablet without any additional charges." + }, + { + "speaker": "A", + "text": "Wait, $30? Does that mean I pay once and can use it forever, or is there some kind of catch? Because that sounds like a pretty good deal if it's true.", + "original_text": "Wait, $30? Does that mean I pay once and can use it forever, or is there some kind of catch? Because that sounds like a pretty good deal if it's true.", + "start_time": 53.95184857998739, + "end_time": 63.42559007658603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--344/temp/line_8_A.wav", + "silence_duration": 0.5687408622669254, + "is_interrupted": false + } + ] + }, + "DialogSum--val--345": { + "original_text": "A: Thank you. The tea smells good. What is it called? \nB: It's called Tie Guanyin, and is a kind of Wu[interrupt] fermented tea, also known as oolong tea, which originates from China's Fujian province and is famous for its complex floral aroma and rich cultural history. \n\nA: Oh, Tie Guanyin! I've heard this name before, but I could never understand the tea classification. \n\nB: It's confusing and there is no agreement on it. Generally speaking, there are 4 kinds of tea based on processing methods. They're green tea, black tea, Wu long tea, and white tea. \n\nA: Sorry to cut in, you mentioned 4 kinds of tea—what about their health benefits? I've heard that different kinds of tea have different health benefits, isn't it? \n\nB: Yes, it is. But there are also considerations of time and personal health. For example, green tea is good in summer. It seems to drive away the heat and bring a feeling of relaxation. However, pregnant women should not drink it. \n\nA: That's interesting. By the way, you were saying something about the types of tea before I interrupted. What was the fourth one? \n\nB: Oh, right! The fourth one is scented tea. There seems to be a lot to know about tea. You must tell me more about tea culture in the future. \nA: Sure, I'll be glad to.", + "cleaned_text": "A: Thank you. The tea smells good. What is it called? \nB:It's called Tie Guanyin, and is a kind of Wu fermented tea, also known as oolong tea, which originates from China's Fujian province and is famous for its complex floral aroma and rich cultural history.\n\nA: Oh, Tie Guanyin! I've heard this name before, but I could never understand the tea classification. \n\nB: It's confusing and there is no agreement on it. Generally speaking, there are 4 kinds of tea based on processing methods. They're green tea, black tea, Wu long tea, and white tea. \n\nA: Sorry to cut in, you mentioned 4 kinds of tea—what about their health benefits? I've heard that different kinds of tea have different health benefits, isn't it? \n\nB: Yes, it is. But there are also considerations of time and personal health. For example, green tea is good in summer. It seems to drive away the heat and bring a feeling of relaxation. However, pregnant women should not drink it. \n\nA: That's interesting. By the way, you were saying something about the types of tea before I interrupted. What was the fourth one? \n\nB: Oh, right! The fourth one is scented tea. There seems to be a lot to know about tea. You must tell me more about tea culture in the future. \nA: Sure, I'll be glad to.", + "total_duration": 67.0469387755102, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Thank you. The tea smells good. What is it called?", + "original_text": "Thank you. The tea smells good. What is it called?", + "start_time": 0, + "end_time": 3.575873015873016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's called Tie Guanyin, and is a kind of Wu", + "original_text": "It's called Tie Guanyin, and is a kind of Wu[interrupt] fermented tea, also known as oolong tea, which originates from China's Fujian province and is famous for its complex floral aroma and rich cultural history.", + "start_time": 4.012706358046806, + "end_time": 16.34250227641415, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_1_B.wav", + "silence_duration": 0.4368333421737901, + "is_interrupted": true, + "text_after_interrupt": "fermented tea, also known as oolong tea, which originates from China's Fujian province and is famous for its complex floral aroma and rich cultural history." + }, + { + "speaker": "A", + "text": "Oh, Tie Guanyin! I've heard this name before, but I could never understand the tea classification.", + "original_text": "Oh, Tie Guanyin! I've heard this name before, but I could never understand the tea classification.", + "start_time": 6.950030621085355, + "end_time": 13.207808398863133, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_2_A.wav", + "silence_duration": 0.38144386942283137, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's confusing and there is no agreement on it. Generally speaking, there are 4 kinds of tea based on processing methods. They're green tea, black tea, Wu long tea, and white tea.", + "original_text": "It's confusing and there is no agreement on it. Generally speaking, there are 4 kinds of tea based on processing methods. They're green tea, black tea, Wu long tea, and white tea.", + "start_time": 16.861457943989837, + "end_time": 27.19433776258394, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_3_B.wav", + "silence_duration": 0.518955667575685, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry to cut in, you mentioned 4 kinds of tea—what about their health benefits? I've heard that different kinds of tea have different health benefits, isn't it?", + "original_text": "Sorry to cut in, you mentioned 4 kinds of tea—what about their health benefits? I've heard that different kinds of tea have different health benefits, isn't it?", + "start_time": 27.598157526904284, + "end_time": 36.93257929561177, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_4_A.wav", + "silence_duration": 0.40381976432034283, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it is. But there are also considerations of time and personal health. For example, green tea is good in summer. It seems to drive away the heat and bring a feeling of relaxation. However, pregnant women should not drink it.", + "original_text": "Yes, it is. But there are also considerations of time and personal health. For example, green tea is good in summer. It seems to drive away the heat and bring a feeling of relaxation. However, pregnant women should not drink it.", + "start_time": 37.23456368183395, + "end_time": 49.92426889725345, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_5_B.wav", + "silence_duration": 0.30198438622218016, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's interesting. By the way, you were saying something about the types of tea before I interrupted. What was the fourth one?", + "original_text": "That's interesting. By the way, you were saying something about the types of tea before I interrupted. What was the fourth one?", + "start_time": 50.40804453806183, + "end_time": 57.25793115937702, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_6_A.wav", + "silence_duration": 0.48377564080838126, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! The fourth one is scented tea. There seems to be a lot to know about tea. You must tell me more about tea culture in the future.", + "original_text": "Oh, right! The fourth one is scented tea. There seems to be a lot to know about tea. You must tell me more about tea culture in the future.", + "start_time": 57.604408164815695, + "end_time": 65.02318367501978, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_7_B.wav", + "silence_duration": 0.3464770054386732, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, I'll be glad to.", + "original_text": "Sure, I'll be glad to.", + "start_time": 65.53765389884767, + "end_time": 67.04695095100186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--345/temp/line_8_A.wav", + "silence_duration": 0.5144702238278801, + "is_interrupted": false + } + ] + }, + "DialogSum--val--346": { + "original_text": "A: What time is it? We're going to be late! \nB: It's a quarter after 7. We're on time. Don't panic. \nA: But I thought we had to be at the restaurant by 7:30 for the surprise party, we will never make it there with all this evening [interrupt] traffic and possible delays along the main highway which is notorious for congestion during peak dining hours. \nB: Sorry, but I think we should check the GPS first. It might show a faster route, considering the traffic. \nA: Sure, but even if we find a faster route, do you know where we park our car? I was going to ask you to call the restaurant for that [interrupt] information because I remember the parking situation there can be tricky especially on weekends when they have special events and the valet service gets overwhelmed. \nB: Oh, right! I'll call them now to find out about parking options and maybe reserve a spot if possible.", + "cleaned_text": "A: What time is it? We're going to be late! \nB: It's a quarter after 7. We're on time. Don't panic. \nA:But I thought we had to be at the restaurant by 7:30 for the surprise party, we will never make it there with all this evening traffic and possible delays along the main highway which is notorious for congestion during peak dining hours.\nB: Sorry, but I think we should check the GPS first. It might show a faster route, considering the traffic. \nA:Sure, but even if we find a faster route, do you know where we park our car? I was going to ask you to call the restaurant for that information because I remember the parking situation there can be tricky especially on weekends when they have special events and the valet service gets overwhelmed.\nB: Oh, right! I'll call them now to find out about parking options and maybe reserve a spot if possible.", + "total_duration": 41.56, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What time is it? We're going to be late!", + "original_text": "What time is it? We're going to be late!", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's a quarter after 7. We're on time. Don't panic.", + "original_text": "It's a quarter after 7. We're on time. Don't panic.", + "start_time": 3.1877981361695262, + "end_time": 5.985802671316918, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/temp/line_1_B.wav", + "silence_duration": 0.5987731928588684, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But I thought we had to be at the restaurant by 7:30 for the surprise party, we will never make it there with all this evening", + "original_text": "But I thought we had to be at the restaurant by 7:30 for the surprise party, we will never make it there with all this evening [interrupt] traffic and possible delays along the main highway which is notorious for congestion during peak dining hours.", + "start_time": 6.535576980589531, + "end_time": 21.268638205079327, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/temp/line_2_A.wav", + "silence_duration": 0.5497743092726131, + "is_interrupted": true, + "text_after_interrupt": "traffic and possible delays along the main highway which is notorious for congestion during peak dining hours." + }, + { + "speaker": "B", + "text": "Sorry, but I think we should check the GPS first. It might show a faster route, considering the traffic.", + "original_text": "Sorry, but I think we should check the GPS first. It might show a faster route, considering the traffic.", + "start_time": 13.489953397823092, + "end_time": 19.26011212798182, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/temp/line_3_B.wav", + "silence_duration": 0.5358071963979545, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, but even if we find a faster route, do you know where we park our car? I was going to ask you to call the restaurant for that", + "original_text": "Sure, but even if we find a faster route, do you know where we park our car? I was going to ask you to call the restaurant for that [interrupt] information because I remember the parking situation there can be tricky especially on weekends when they have special events and the valet service gets overwhelmed.", + "start_time": 21.691476111691077, + "end_time": 39.32703166724663, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/temp/line_4_A.wav", + "silence_duration": 0.4228379066117495, + "is_interrupted": true, + "text_after_interrupt": "information because I remember the parking situation there can be tricky especially on weekends when they have special events and the valet service gets overwhelmed." + }, + { + "speaker": "B", + "text": "Oh, right! I'll call them now to find out about parking options and maybe reserve a spot if possible.", + "original_text": "Oh, right! I'll call them now to find out about parking options and maybe reserve a spot if possible.", + "start_time": 36.23103311771489, + "end_time": 41.56001270955162, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--346/temp/line_5_B.wav", + "silence_duration": 0.5211651533502839, + "is_interrupted": false + } + ] + }, + "DialogSum--val--347": { + "original_text": "A: I saw a beautiful fish in the market the other day, it was orange and blue. I'm thinking of buying some next [interrupt] week when I have more time to set up the tank properly with all the necessary equipment and decorations to create a comfortable environment for them.\nB: Where would you keep them?\nA: In that round bottle over there.\nB: It's a bit small, isn't it?\nA: So are the fish.\nB: I think you should get a tank if you want to keep fish.\nA: Really?\nB: Yes, you should never keep fish in a small round bottle. They don't get enough air. I suggest we go shopping together and look for a nice tank.\nA: That might be quite expensive.\nB: Check the prices before you buy one and you ought to put a few large rocks in the tank. Fish love swimming around the rocks and through holes in them.\nA: Is there anything else that I ought to get? Oh, I was going to ask earlier—what about the plants? Should I get some for the tank?\nB: Yes, you need to get some underwater plants, for one thing, they keep the water clean, also they make the tank look much prettier.", + "cleaned_text": "A:I saw a beautiful fish in the market the other day, it was orange and blue. I'm thinking of buying some next week when I have more time to set up the tank properly with all the necessary equipment and decorations to create a comfortable environment for them.\nB: Where would you keep them?\nA: In that round bottle over there.\nB: It's a bit small, isn't it?\nA: So are the fish.\nB: I think you should get a tank if you want to keep fish.\nA: Really?\nB: Yes, you should never keep fish in a small round bottle. They don't get enough air. I suggest we go shopping together and look for a nice tank.\nA: That might be quite expensive.\nB: Check the prices before you buy one and you ought to put a few large rocks in the tank. Fish love swimming around the rocks and through holes in them.\nA: Is there anything else that I ought to get? Oh, I was going to ask earlier—what about the plants? Should I get some for the tank?\nB: Yes, you need to get some underwater plants, for one thing, they keep the water clean, also they make the tank look much prettier.", + "total_duration": 58.65750566893424, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I saw a beautiful fish in the market the other day, it was orange and blue. I'm thinking of buying some next", + "original_text": "I saw a beautiful fish in the market the other day, it was orange and blue. I'm thinking of buying some next [interrupt] week when I have more time to set up the tank properly with all the necessary equipment and decorations to create a comfortable environment for them.", + "start_time": 0, + "end_time": 15.394829931972788, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "week when I have more time to set up the tank properly with all the necessary equipment and decorations to create a comfortable environment for them." + }, + { + "speaker": "B", + "text": "Where would you keep them?", + "original_text": "Where would you keep them?", + "start_time": 6.873106575963718, + "end_time": 7.964444444444444, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_1_B.wav", + "silence_duration": 0.426331194007072, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "In that round bottle over there.", + "original_text": "In that round bottle over there.", + "start_time": 15.942442676950353, + "end_time": 17.61427941164423, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_2_A.wav", + "silence_duration": 0.5476127449775645, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's a bit small, isn't it?", + "original_text": "It's a bit small, isn't it?", + "start_time": 18.053591961586648, + "end_time": 19.55127903641658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_3_B.wav", + "silence_duration": 0.439312549942418, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So are the fish.", + "original_text": "So are the fish.", + "start_time": 20.05862652292987, + "end_time": 21.20801427803191, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_4_A.wav", + "silence_duration": 0.5073474865132908, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think you should get a tank if you want to keep fish.", + "original_text": "I think you should get a tank if you want to keep fish.", + "start_time": 21.697726551101542, + "end_time": 24.309971449060725, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_5_B.wav", + "silence_duration": 0.48971227306963083, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Really?", + "original_text": "Really?", + "start_time": 24.7978442273241, + "end_time": 25.49444286677988, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_6_A.wav", + "silence_duration": 0.487872778263373, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, you should never keep fish in a small round bottle. They don't get enough air. I suggest we go shopping together and look for a nice tank.", + "original_text": "Yes, you should never keep fish in a small round bottle. They don't get enough air. I suggest we go shopping together and look for a nice tank.", + "start_time": 26.02587990903595, + "end_time": 32.94542639429672, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_7_B.wav", + "silence_duration": 0.5314370422560686, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That might be quite expensive.", + "original_text": "That might be quite expensive.", + "start_time": 33.39198199833336, + "end_time": 35.12186861964855, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_8_A.wav", + "silence_duration": 0.44655560403664124, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Check the prices before you buy one and you ought to put a few large rocks in the tank. Fish love swimming around the rocks and through holes in them.", + "original_text": "Check the prices before you buy one and you ought to put a few large rocks in the tank. Fish love swimming around the rocks and through holes in them.", + "start_time": 35.707175693037506, + "end_time": 43.125951203241584, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_9_B.wav", + "silence_duration": 0.5853070733889535, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is there anything else that I ought to get? Oh, I was going to ask earlier—what about the plants? Should I get some for the tank?", + "original_text": "Is there anything else that I ought to get? Oh, I was going to ask earlier—what about the plants? Should I get some for the tank?", + "start_time": 43.60408148491064, + "end_time": 51.66140574794919, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_10_A.wav", + "silence_duration": 0.47813028166905325, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, you need to get some underwater plants, for one thing, they keep the water clean, also they make the tank look much prettier.", + "original_text": "Yes, you need to get some underwater plants, for one thing, they keep the water clean, also they make the tank look much prettier.", + "start_time": 52.00502794422194, + "end_time": 58.65754495102466, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--347/temp/line_11_B.wav", + "silence_duration": 0.3436221962727513, + "is_interrupted": false + } + ] + }, + "DialogSum--val--349": { + "original_text": "A: Hi Joe, many people in our Department are leaving for Thanksgiving. What are you going to do? \nB: I think I'll just stay at home. I may see some friends and watch a few DVDs and I probably would go to the auto [interrupt] showroom to check out some new car models that I've been interested in, particularly the latest electric vehicles with their advanced battery technology and sleek designs. \nA: Sorry to interrupt, but did you say you might go to a car show? That sounds interesting! \nB: Yes, exactly. There's a car show in town that I've been wanting to check out. What about you Alexia? What's your plan? \nA: I am going to do some traveling with my family. \nB: Oh? Where to? \nA: Toronto and on our way we're going to visit my aunt Betty in Kingston. \nB: That's exciting. How long do you plan to stay? \nA: 2 days. I have a get-together party with my college friends in Toronto. Oh, I'm afraid I've got to go now. My husband is waiting for me and we'll have to pick up Daniel from school. Have a nice holiday, Joe. \nB: Thank you. You too. By the way, you mentioned something about a car show earlier—what kind of cars are you hoping to see?", + "cleaned_text": "A: Hi Joe, many people in our Department are leaving for Thanksgiving. What are you going to do? \nB:I think I'll just stay at home. I may see some friends and watch a few DVDs and I probably would go to the auto showroom to check out some new car models that I've been interested in, particularly the latest electric vehicles with their advanced battery technology and sleek designs.\nA: Sorry to interrupt, but did you say you might go to a car show? That sounds interesting! \nB: Yes, exactly. There's a car show in town that I've been wanting to check out. What about you Alexia? What's your plan? \nA: I am going to do some traveling with my family. \nB: Oh? Where to? \nA: Toronto and on our way we're going to visit my aunt Betty in Kingston. \nB: That's exciting. How long do you plan to stay? \nA: 2 days. I have a get-together party with my college friends in Toronto. Oh, I'm afraid I've got to go now. My husband is waiting for me and we'll have to pick up Daniel from school. Have a nice holiday, Joe. \nB: Thank you. You too. By the way, you mentioned something about a car show earlier—what kind of cars are you hoping to see?", + "total_duration": 59.198095238095235, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi Joe, many people in our Department are leaving for Thanksgiving. What are you going to do?", + "original_text": "Hi Joe, many people in our Department are leaving for Thanksgiving. What are you going to do?", + "start_time": 0, + "end_time": 5.270929705215419, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think I'll just stay at home. I may see some friends and watch a few DVDs and I probably would go to the auto", + "original_text": "I think I'll just stay at home. I may see some friends and watch a few DVDs and I probably would go to the auto [interrupt] showroom to check out some new car models that I've been interested in, particularly the latest electric vehicles with their advanced battery technology and sleek designs.", + "start_time": 5.864503988219023, + "end_time": 19.87774661860451, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_1_B.wav", + "silence_duration": 0.5935742830036039, + "is_interrupted": true, + "text_after_interrupt": "showroom to check out some new car models that I've been interested in, particularly the latest electric vehicles with their advanced battery technology and sleek designs." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but did you say you might go to a car show? That sounds interesting!", + "original_text": "Sorry to interrupt, but did you say you might go to a car show? That sounds interesting!", + "start_time": 11.762372468944648, + "end_time": 18.101420087992267, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_2_A.wav", + "silence_duration": 0.46509353791545993, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, exactly. There's a car show in town that I've been wanting to check out. What about you Alexia? What's your plan?", + "original_text": "Yes, exactly. There's a car show in town that I've been wanting to check out. What about you Alexia? What's your plan?", + "start_time": 20.44367627921334, + "end_time": 27.432882628419687, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_3_B.wav", + "silence_duration": 0.565929660608826, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I am going to do some traveling with my family.", + "original_text": "I am going to do some traveling with my family.", + "start_time": 27.781743283063133, + "end_time": 30.393988181022316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_4_A.wav", + "silence_duration": 0.34886065464344634, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh? Where to?", + "original_text": "Oh? Where to?", + "start_time": 30.810595408212084, + "end_time": 31.762613548801653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_5_B.wav", + "silence_duration": 0.4166072271897695, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Toronto and on our way we're going to visit my aunt Betty in Kingston.", + "original_text": "Toronto and on our way we're going to visit my aunt Betty in Kingston.", + "start_time": 32.12410058456894, + "end_time": 36.175982670736744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_6_A.wav", + "silence_duration": 0.3614870357672889, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's exciting. How long do you plan to stay?", + "original_text": "That's exciting. How long do you plan to stay?", + "start_time": 36.610184120418715, + "end_time": 39.280478904999214, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_7_B.wav", + "silence_duration": 0.43420144968197305, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "2 days. I have a get-together party with my college friends in Toronto. Oh, I'm afraid I've got to go now. My husband is waiting for me and we'll have to pick up Daniel from school. Have a nice holiday, Joe.", + "original_text": "2 days. I have a get-together party with my college friends in Toronto. Oh, I'm afraid I've got to go now. My husband is waiting for me and we'll have to pick up Daniel from school. Have a nice holiday, Joe.", + "start_time": 39.67136246830935, + "end_time": 52.662927094159684, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_8_A.wav", + "silence_duration": 0.3908835633101311, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you. You too. By the way, you mentioned something about a car show earlier—what kind of cars are you hoping to see?", + "original_text": "Thank you. You too. By the way, you mentioned something about a car show earlier—what kind of cars are you hoping to see?", + "start_time": 53.02163082238071, + "end_time": 59.198138758888646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--349/temp/line_9_B.wav", + "silence_duration": 0.3587037282210253, + "is_interrupted": false + } + ] + }, + "DialogSum--val--350": { + "original_text": "A: Lisa, hi! \nB: Hi, Net! \nA: Don't you usually drive to work? \nB: Usually, but not in bad weather. \nA: Why is [interrupt] it that you avoid driving in bad weather? I've always wondered if it's just about the traffic or if there are other factors involved like visibility or road conditions. \nB: The traffic gets a lot worse when it rains or snows. \nA: Oh, I see. I always take the train. It's a lot faster for me than driving. \nB: It's faster for me, too. But the time isn't always convenient. \nA: Yeah, but think of all the things you can do on the train. You can read a book or [interrupt] listen to a podcast to make the commute more enjoyable and productive, maybe even learn something new while you're traveling to work. \nB: Or catch up on emails! But you were saying about reading? \nA: Right, or the newspaper. It's a nice way to start the day.", + "cleaned_text": "A: Lisa, hi! \nB: Hi, Net! \nA: Don't you usually drive to work? \nB: Usually, but not in bad weather. \nA:Why is it that you avoid driving in bad weather? I've always wondered if it's just about the traffic or if there are other factors involved like visibility or road conditions.\nB: The traffic gets a lot worse when it rains or snows. \nA: Oh, I see. I always take the train. It's a lot faster for me than driving. \nB: It's faster for me, too. But the time isn't always convenient. \nA:Yeah, but think of all the things you can do on the train. You can read a book or listen to a podcast to make the commute more enjoyable and productive, maybe even learn something new while you're traveling to work.\nB: Or catch up on emails! But you were saying about reading? \nA: Right, or the newspaper. It's a nice way to start the day.", + "total_duration": 44.02063492063492, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Lisa, hi!", + "original_text": "Lisa, hi!", + "start_time": 0, + "end_time": 0.9520181405895691, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hi, Net!", + "original_text": "Hi, Net!", + "start_time": 1.4635732641772992, + "end_time": 2.4968612460367097, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_1_B.wav", + "silence_duration": 0.51155512358773, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Don't you usually drive to work?", + "original_text": "Don't you usually drive to work?", + "start_time": 3.043593248475903, + "end_time": 4.796699824439622, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_2_A.wav", + "silence_duration": 0.5467320024391933, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Usually, but not in bad weather.", + "original_text": "Usually, but not in bad weather.", + "start_time": 5.098054693914232, + "end_time": 6.9672610431205815, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_3_B.wav", + "silence_duration": 0.30135486947461076, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why is", + "original_text": "Why is [interrupt] it that you avoid driving in bad weather? I've always wondered if it's just about the traffic or if there are other factors involved like visibility or road conditions.", + "start_time": 7.297811763494054, + "end_time": 17.909331037870473, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_4_A.wav", + "silence_duration": 0.3305507203734722, + "is_interrupted": true, + "text_after_interrupt": "it that you avoid driving in bad weather? I've always wondered if it's just about the traffic or if there are other factors involved like visibility or road conditions." + }, + { + "speaker": "B", + "text": "The traffic gets a lot worse when it rains or snows.", + "original_text": "The traffic gets a lot worse when it rains or snows.", + "start_time": 8.273049858732149, + "end_time": 11.013004507258227, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_5_B.wav", + "silence_duration": 0.34746968100747416, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. I always take the train. It's a lot faster for me than driving.", + "original_text": "Oh, I see. I always take the train. It's a lot faster for me than driving.", + "start_time": 18.401458726469105, + "end_time": 23.08027958814711, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_6_A.wav", + "silence_duration": 0.4921276885986332, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's faster for me, too. But the time isn't always convenient.", + "original_text": "It's faster for me, too. But the time isn't always convenient.", + "start_time": 23.679735768617796, + "end_time": 26.953749374059974, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_7_B.wav", + "silence_duration": 0.5994561804706837, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, but think of all the things you can do on the train. You can read a book or", + "original_text": "Yeah, but think of all the things you can do on the train. You can read a book or [interrupt] listen to a podcast to make the commute more enjoyable and productive, maybe even learn something new while you're traveling to work.", + "start_time": 27.459307984442685, + "end_time": 39.87037374407987, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_8_A.wav", + "silence_duration": 0.5055586103827089, + "is_interrupted": true, + "text_after_interrupt": "listen to a podcast to make the commute more enjoyable and productive, maybe even learn something new while you're traveling to work." + }, + { + "speaker": "B", + "text": "Or catch up on emails! But you were saying about reading?", + "original_text": "Or catch up on emails! But you were saying about reading?", + "start_time": 36.100769957315784, + "end_time": 39.25868378951533, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_9_B.wav", + "silence_duration": 0.5534730189045973, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Right, or the newspaper. It's a nice way to start the day.", + "original_text": "Right, or the newspaper. It's a nice way to start the day.", + "start_time": 40.305481981098644, + "end_time": 44.020674724862815, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--350/temp/line_10_A.wav", + "silence_duration": 0.43510823701877155, + "is_interrupted": false + } + ] + }, + "DialogSum--val--351": { + "original_text": "A: Hello, how can I help you today? \nB: I'd like to withdraw some money from my account. \nA: Please fill out this slip stating how much you wish to withdraw. \nB: Well, actually, it's quite a substantial amount. Here's my Bank Book. Will that cause a [interrupt] delay in processing or any issues with my account balance, especially considering the recent changes in banking regulations regarding large withdrawals? \nA: Sorry to interrupt, but just to clarify, how much are you planning to withdraw? \nB: Oh, it's 10,000 RMB. \nA: On your account there is no limit to over-the-counter withdrawals, it won't cause a problem. Here's your money, 10,000 RMB. Please count it before you leave the counter, as we want to ensure everything is correct. \nB: Oh, before I go, I just realized I didn't ask—will this withdrawal affect any of my other transactions or account balance? \nA: No, your account balance is still sufficient for other transactions. Please count the money before you leave. \nB: Yes, that seems to be all in order. Thanks very much.", + "cleaned_text": "A: Hello, how can I help you today? \nB: I'd like to withdraw some money from my account. \nA: Please fill out this slip stating how much you wish to withdraw. \nB:Well, actually, it's quite a substantial amount. Here's my Bank Book. Will that cause a delay in processing or any issues with my account balance, especially considering the recent changes in banking regulations regarding large withdrawals?\nA: Sorry to interrupt, but just to clarify, how much are you planning to withdraw? \nB: Oh, it's 10,000 RMB. \nA: On your account there is no limit to over-the-counter withdrawals, it won't cause a problem. Here's your money, 10,000 RMB. Please count it before you leave the counter, as we want to ensure everything is correct. \nB: Oh, before I go, I just realized I didn't ask—will this withdrawal affect any of my other transactions or account balance? \nA: No, your account balance is still sufficient for other transactions. Please count the money before you leave. \nB: Yes, that seems to be all in order. Thanks very much.", + "total_duration": 55.0233560090703, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, how can I help you today?", + "original_text": "Hello, how can I help you today?", + "start_time": 0, + "end_time": 2.2291156462585033, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like to withdraw some money from my account.", + "original_text": "I'd like to withdraw some money from my account.", + "start_time": 2.7401106040714587, + "end_time": 4.899566386384384, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_1_B.wav", + "silence_duration": 0.5109949578129555, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Please fill out this slip stating how much you wish to withdraw.", + "original_text": "Please fill out this slip stating how much you wish to withdraw.", + "start_time": 5.463908825741055, + "end_time": 9.063001796262597, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_2_A.wav", + "silence_duration": 0.5643424393566712, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, actually, it's quite a substantial amount. Here's my Bank Book. Will that cause a", + "original_text": "Well, actually, it's quite a substantial amount. Here's my Bank Book. Will that cause a [interrupt] delay in processing or any issues with my account balance, especially considering the recent changes in banking regulations regarding large withdrawals?", + "start_time": 9.484329604210462, + "end_time": 21.721245703983705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_3_B.wav", + "silence_duration": 0.42132780794786545, + "is_interrupted": true, + "text_after_interrupt": "delay in processing or any issues with my account balance, especially considering the recent changes in banking regulations regarding large withdrawals?" + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but just to clarify, how much are you planning to withdraw?", + "original_text": "Sorry to interrupt, but just to clarify, how much are you planning to withdraw?", + "start_time": 14.55788969491341, + "end_time": 19.213490601942887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_4_A.wav", + "silence_duration": 0.5800424695241806, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, it's 10,000 RMB.", + "original_text": "Oh, it's 10,000 RMB.", + "start_time": 22.036683159253613, + "end_time": 23.975549372405542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_5_B.wav", + "silence_duration": 0.3154374552699074, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "On your account there is no limit to over-the-counter withdrawals, it won't cause a problem. Here's your money, 10,000 RMB. Please count it before you leave the counter, as we want to ensure everything is correct.", + "original_text": "On your account there is no limit to over-the-counter withdrawals, it won't cause a problem. Here's your money, 10,000 RMB. Please count it before you leave the counter, as we want to ensure everything is correct.", + "start_time": 24.391792594543805, + "end_time": 37.73165654012204, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_6_A.wav", + "silence_duration": 0.4162432221382618, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, before I go, I just realized I didn't ask—will this withdrawal affect any of my other transactions or account balance?", + "original_text": "Oh, before I go, I just realized I didn't ask—will this withdrawal affect any of my other transactions or account balance?", + "start_time": 38.21917389963804, + "end_time": 44.20992219895776, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_7_B.wav", + "silence_duration": 0.48751735951599773, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, your account balance is still sufficient for other transactions. Please count the money before you leave.", + "original_text": "No, your account balance is still sufficient for other transactions. Please count the money before you leave.", + "start_time": 44.76336313460562, + "end_time": 51.3346103001385, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_8_A.wav", + "silence_duration": 0.5534409356478531, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that seems to be all in order. Thanks very much.", + "original_text": "Yes, that seems to be all in order. Thanks very much.", + "start_time": 51.80742926570226, + "end_time": 55.02339298452312, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--351/temp/line_9_B.wav", + "silence_duration": 0.47281896556376124, + "is_interrupted": false + } + ] + }, + "DialogSum--val--352": { + "original_text": "A: I can't make out anything, the words are too light. I thought they have already changed the toner cartridge this month [interrupt] but apparently it needs to be replaced again which is quite unusual for such a short period of time.\nB: It seems not or somebody has recently received a large fax.\nA: Ok, no problem. We do it ourselves.\nB: Do you know how to replace the toner cartridge? It might be a bit tricky if you haven't done it before.\nA: Actually, I was just about to ask if you knew how to do it. I'm not so good at machine things either.\nB: I will have somebody do it as soon as possible.", + "cleaned_text": "A:I can't make out anything, the words are too light. I thought they have already changed the toner cartridge this month but apparently it needs to be replaced again which is quite unusual for such a short period of time.\nB: It seems not or somebody has recently received a large fax.\nA: Ok, no problem. We do it ourselves.\nB: Do you know how to replace the toner cartridge? It might be a bit tricky if you haven't done it before.\nA: Actually, I was just about to ask if you knew how to do it. I'm not so good at machine things either.\nB: I will have somebody do it as soon as possible.", + "total_duration": 31.34566893424036, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I can't make out anything, the words are too light. I thought they have already changed the toner cartridge this month", + "original_text": "I can't make out anything, the words are too light. I thought they have already changed the toner cartridge this month [interrupt] but apparently it needs to be replaced again which is quite unusual for such a short period of time.", + "start_time": 0, + "end_time": 12.631655328798185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "but apparently it needs to be replaced again which is quite unusual for such a short period of time." + }, + { + "speaker": "B", + "text": "It seems not or somebody has recently received a large fax.", + "original_text": "It seems not or somebody has recently received a large fax.", + "start_time": 6.431927437641724, + "end_time": 9.845260770975058, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/temp/line_1_B.wav", + "silence_duration": 0.4345081214721259, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ok, no problem. We do it ourselves.", + "original_text": "Ok, no problem. We do it ourselves.", + "start_time": 13.163768671970985, + "end_time": 15.961773207118377, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/temp/line_2_A.wav", + "silence_duration": 0.5321133431727997, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you know how to replace the toner cartridge? It might be a bit tricky if you haven't done it before.", + "original_text": "Do you know how to replace the toner cartridge? It might be a bit tricky if you haven't done it before.", + "start_time": 16.468650729340652, + "end_time": 21.600260706664915, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/temp/line_3_B.wav", + "silence_duration": 0.5068775222222739, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, I was just about to ask if you knew how to do it. I'm not so good at machine things either.", + "original_text": "Actually, I was just about to ask if you knew how to do it. I'm not so good at machine things either.", + "start_time": 22.196071953273385, + "end_time": 28.546729549645267, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/temp/line_4_A.wav", + "silence_duration": 0.59581124660847, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I will have somebody do it as soon as possible.", + "original_text": "I will have somebody do it as soon as possible.", + "start_time": 29.07015015424157, + "end_time": 31.345705709797127, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--352/temp/line_5_B.wav", + "silence_duration": 0.5234206045963049, + "is_interrupted": false + } + ] + }, + "DialogSum--val--353": { + "original_text": "A: Welcome to China, Mr. Smith. \nB: Thank you. So pleasant to meet you here! \nA: I heard that you are interested in our silk skirts and new style of [interrupt] traditional Chinese dresses that we've recently launched, featuring innovative designs that blend modern aesthetics with centuries-old craftsmanship techniques. \nB: Sorry to jump in, but regarding the new styles, do you have any samples that we could review before making a final decision? \nA: Yes, we do have samples available. I was just about to mention that we've also brought a list of your recent products with us. We'd like to import some of your latest clothes for the second half of this year. We're ready to place an order with you. \nB: Great! Most of the items listed are available this year. I hope we can come to an agreement and sign the contracts, so as to enable our timely [interrupt] delivery to your stores and ensure that everything is in place for the upcoming season while maintaining the highest quality standards our customers expect. \nA: Speaking of contracts, I just realized we haven't discussed the payment terms yet. Should we clarify that before proceeding? \nB: Absolutely, payment terms are crucial. But I was going to suggest earlier that we allow some of our clients to join us in the discussions to better align with their needs. \nA: Good idea! In this way, our clients' needs will be met and disagreements between the two parties avoided. \nB: Sounds like we have the same idea.", + "cleaned_text": "A: Welcome to China, Mr. Smith. \nB: Thank you. So pleasant to meet you here! \nA:I heard that you are interested in our silk skirts and new style of traditional Chinese dresses that we've recently launched, featuring innovative designs that blend modern aesthetics with centuries-old craftsmanship techniques.\nB: Sorry to jump in, but regarding the new styles, do you have any samples that we could review before making a final decision? \nA: Yes, we do have samples available. I was just about to mention that we've also brought a list of your recent products with us. We'd like to import some of your latest clothes for the second half of this year. We're ready to place an order with you. \nB:Great! Most of the items listed are available this year. I hope we can come to an agreement and sign the contracts, so as to enable our timely delivery to your stores and ensure that everything is in place for the upcoming season while maintaining the highest quality standards our customers expect.\nA: Speaking of contracts, I just realized we haven't discussed the payment terms yet. Should we clarify that before proceeding? \nB: Absolutely, payment terms are crucial. But I was going to suggest earlier that we allow some of our clients to join us in the discussions to better align with their needs. \nA: Good idea! In this way, our clients' needs will be met and disagreements between the two parties avoided. \nB: Sounds like we have the same idea.", + "total_duration": 72.99238095238096, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Welcome to China, Mr. Smith.", + "original_text": "Welcome to China, Mr. Smith.", + "start_time": 0, + "end_time": 1.9504761904761905, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you. So pleasant to meet you here!", + "original_text": "Thank you. So pleasant to meet you here!", + "start_time": 2.425521009316284, + "end_time": 4.596586768953472, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_1_B.wav", + "silence_duration": 0.47504481884009353, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I heard that you are interested in our silk skirts and new style of", + "original_text": "I heard that you are interested in our silk skirts and new style of [interrupt] traditional Chinese dresses that we've recently launched, featuring innovative designs that blend modern aesthetics with centuries-old craftsmanship techniques.", + "start_time": 5.08504580411812, + "end_time": 17.995340588698618, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_2_A.wav", + "silence_duration": 0.4884590351646477, + "is_interrupted": true, + "text_after_interrupt": "traditional Chinese dresses that we've recently launched, featuring innovative designs that blend modern aesthetics with centuries-old craftsmanship techniques." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but regarding the new styles, do you have any samples that we could review before making a final decision?", + "original_text": "Sorry to jump in, but regarding the new styles, do you have any samples that we could review before making a final decision?", + "start_time": 9.241417686204286, + "end_time": 15.510805441306328, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_3_B.wav", + "silence_duration": 0.4836908622759285, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, we do have samples available. I was just about to mention that we've also brought a list of your recent products with us. We'd like to import some of your latest clothes for the second half of this year. We're ready to place an order with you.", + "original_text": "Yes, we do have samples available. I was just about to mention that we've also brought a list of your recent products with us. We'd like to import some of your latest clothes for the second half of this year. We're ready to place an order with you.", + "start_time": 18.304131410407777, + "end_time": 32.07356451698374, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_4_A.wav", + "silence_duration": 0.30879082170915917, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Great! Most of the items listed are available this year. I hope we can come to an agreement and sign the contracts, so as to enable our timely", + "original_text": "Great! Most of the items listed are available this year. I hope we can come to an agreement and sign the contracts, so as to enable our timely [interrupt] delivery to your stores and ensure that everything is in place for the upcoming season while maintaining the highest quality standards our customers expect.", + "start_time": 32.61123801252751, + "end_time": 47.42556907828715, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_5_B.wav", + "silence_duration": 0.537673495543773, + "is_interrupted": true, + "text_after_interrupt": "delivery to your stores and ensure that everything is in place for the upcoming season while maintaining the highest quality standards our customers expect." + }, + { + "speaker": "A", + "text": "Speaking of contracts, I just realized we haven't discussed the payment terms yet. Should we clarify that before proceeding?", + "original_text": "Speaking of contracts, I just realized we haven't discussed the payment terms yet. Should we clarify that before proceeding?", + "start_time": 47.307046463665245, + "end_time": 54.51684238203259, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_6_A.wav", + "silence_duration": 0.5510932826041002, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Absolutely, payment terms are crucial. But I was going to suggest earlier that we allow some of our clients to join us in the discussions to better align with their needs.", + "original_text": "Absolutely, payment terms are crucial. But I was going to suggest earlier that we allow some of our clients to join us in the discussions to better align with their needs.", + "start_time": 54.88169097974636, + "end_time": 63.75171365548332, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_7_B.wav", + "silence_duration": 0.36484859771376826, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good idea! In this way, our clients' needs will be met and disagreements between the two parties avoided.", + "original_text": "Good idea! In this way, our clients' needs will be met and disagreements between the two parties avoided.", + "start_time": 64.11250453494993, + "end_time": 70.67214172315855, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_8_A.wav", + "silence_duration": 0.3607908794666066, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sounds like we have the same idea.", + "original_text": "Sounds like we have the same idea.", + "start_time": 71.18125224254028, + "end_time": 72.99240870512531, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--353/temp/line_9_B.wav", + "silence_duration": 0.5091105193817291, + "is_interrupted": false + } + ] + }, + "DialogSum--val--355": { + "original_text": "A: Cigarette? \nB: Oh, uh. . . Thanks. Henry, do you have a light? \nA: Sorry, here. \nB: Thanks. Lovely day. Pity I'm on [interrupt] duty and can't enjoy it as much as I'd like, especially with this perfect weather making me wish I could just take a long walk in the park instead. \nA: Sorry to cut in, but I just remembered—are you still planning to take that weekend off you mentioned last week? \nB: Oh, right. I was going to say I'm on duty today, so I can't really think about time off. But I might take a break next month. Anyway, I'll stand in with you if you like. I've got nothing else to do this afternoon, so it wouldn't be a problem at all. \nA: Actually, I was wondering, what exactly does your duty today involve? I mean, are you expecting anything [interrupt] specific or unusual that might require extra attention or preparation on your part? \nB: Nothing too specific, just the usual rounds. But really, I couldn't possibly let you stand in with me. It's my responsibility, after all.", + "cleaned_text": "A: Cigarette? \nB: Oh, uh. . . Thanks. Henry, do you have a light? \nA: Sorry, here. \nB:Thanks. Lovely day. Pity I'm on duty and can't enjoy it as much as I'd like, especially with this perfect weather making me wish I could just take a long walk in the park instead.\nA: Sorry to cut in, but I just remembered—are you still planning to take that weekend off you mentioned last week? \nB: Oh, right. I was going to say I'm on duty today, so I can't really think about time off. But I might take a break next month. Anyway, I'll stand in with you if you like. I've got nothing else to do this afternoon, so it wouldn't be a problem at all. \nA:Actually, I was wondering, what exactly does your duty today involve? I mean, are you expecting anything specific or unusual that might require extra attention or preparation on your part?\nB: Nothing too specific, just the usual rounds. But really, I couldn't possibly let you stand in with me. It's my responsibility, after all.", + "total_duration": 51.010884353741496, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Cigarette?", + "original_text": "Cigarette?", + "start_time": 0, + "end_time": 0.8707482993197279, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, uh. . . Thanks. Henry, do you have a light?", + "original_text": "Oh, uh. . . Thanks. Henry, do you have a light?", + "start_time": 1.2509195702447147, + "end_time": 4.130193946661948, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_1_B.wav", + "silence_duration": 0.38017127092498687, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, here.", + "original_text": "Sorry, here.", + "start_time": 4.695013398745498, + "end_time": 5.774741289901961, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_2_A.wav", + "silence_duration": 0.5648194520835503, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks. Lovely day. Pity I'm on", + "original_text": "Thanks. Lovely day. Pity I'm on [interrupt] duty and can't enjoy it as much as I'd like, especially with this perfect weather making me wish I could just take a long walk in the park instead.", + "start_time": 6.171073717147173, + "end_time": 15.679645145718602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_3_B.wav", + "silence_duration": 0.3963324272452115, + "is_interrupted": true, + "text_after_interrupt": "duty and can't enjoy it as much as I'd like, especially with this perfect weather making me wish I could just take a long walk in the park instead." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but I just remembered—are you still planning to take that weekend off you mentioned last week?", + "original_text": "Sorry to cut in, but I just remembered—are you still planning to take that weekend off you mentioned last week?", + "start_time": 8.34213947678436, + "end_time": 14.541867367940824, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_4_A.wav", + "silence_duration": 0.5603023153147992, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right. I was going to say I'm on duty today, so I can't really think about time off. But I might take a break next month. Anyway, I'll stand in with you if you like. I've got nothing else to do this afternoon, so it wouldn't be a problem at all.", + "original_text": "Oh, right. I was going to say I'm on duty today, so I can't really think about time off. But I might take a break next month. Anyway, I'll stand in with you if you like. I've got nothing else to do this afternoon, so it wouldn't be a problem at all.", + "start_time": 16.051506946251703, + "end_time": 28.6483323430771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_5_B.wav", + "silence_duration": 0.37186180053310114, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, I was wondering, what exactly does your duty today involve? I mean, are you expecting anything", + "original_text": "Actually, I was wondering, what exactly does your duty today involve? I mean, are you expecting anything [interrupt] specific or unusual that might require extra attention or preparation on your part?", + "start_time": 29.219776650173262, + "end_time": 40.65560431457236, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_6_A.wav", + "silence_duration": 0.5714443070961623, + "is_interrupted": true, + "text_after_interrupt": "specific or unusual that might require extra attention or preparation on your part?" + }, + { + "speaker": "B", + "text": "Nothing too specific, just the usual rounds. But really, I couldn't possibly let you stand in with me. It's my responsibility, after all.", + "original_text": "Nothing too specific, just the usual rounds. But really, I couldn't possibly let you stand in with me. It's my responsibility, after all.", + "start_time": 43.01162275677327, + "end_time": 51.010897133190504, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--355/temp/line_7_B.wav", + "silence_duration": 0.37803939169195777, + "is_interrupted": false + } + ] + }, + "DialogSum--val--357": { + "original_text": "A: It's nice and bright today, isn't it? \nB: Yeah. The autumn is marvelous here. \nA: How about winter? \nB: That's a hard time. The air is cold and damp, and the road is often [interrupt] covered in ice, which makes it really difficult to drive safely especially during early mornings when temperatures drop below freezing point. \nA: I was just thinking, with the roads being icy, do you have to take any special precautions when driving? \nB: Yes, we do. We install winter tires and keep emergency kits in our cars just in case we get stranded during particularly bad snowstorms. \nA: That sounds tough. So, do you get much rain during the summer? \nB: Plenty. We never worry about lack of rainwater in our area as the summer showers are quite frequent and sometimes quite heavy. \nA: So you should bring an umbrella often. \nB: That's right. It's better to be prepared than caught in a sudden downpour while going about your daily activities.", + "cleaned_text": "A: It's nice and bright today, isn't it? \nB: Yeah. The autumn is marvelous here. \nA: How about winter? \nB:That's a hard time. The air is cold and damp, and the road is often covered in ice, which makes it really difficult to drive safely especially during early mornings when temperatures drop below freezing point.\nA: I was just thinking, with the roads being icy, do you have to take any special precautions when driving? \nB: Yes, we do. We install winter tires and keep emergency kits in our cars just in case we get stranded during particularly bad snowstorms. \nA: That sounds tough. So, do you get much rain during the summer? \nB: Plenty. We never worry about lack of rainwater in our area as the summer showers are quite frequent and sometimes quite heavy. \nA: So you should bring an umbrella often. \nB: That's right. It's better to be prepared than caught in a sudden downpour while going about your daily activities.", + "total_duration": 44.20235827664399, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "It's nice and bright today, isn't it?", + "original_text": "It's nice and bright today, isn't it?", + "start_time": 0, + "end_time": 2.078185941043084, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah. The autumn is marvelous here.", + "original_text": "Yeah. The autumn is marvelous here.", + "start_time": 2.511522641686634, + "end_time": 4.879958015836294, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_1_B.wav", + "silence_duration": 0.43333670064355023, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about winter?", + "original_text": "How about winter?", + "start_time": 5.278468938326003, + "end_time": 6.358196829482465, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_2_A.wav", + "silence_duration": 0.3985109224897083, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a hard time. The air is cold and damp, and the road is often", + "original_text": "That's a hard time. The air is cold and damp, and the road is often [interrupt] covered in ice, which makes it really difficult to drive safely especially during early mornings when temperatures drop below freezing point.", + "start_time": 6.674672232518462, + "end_time": 16.45027313954794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_3_B.wav", + "silence_duration": 0.3164754030359975, + "is_interrupted": true, + "text_after_interrupt": "covered in ice, which makes it really difficult to drive safely especially during early mornings when temperatures drop below freezing point." + }, + { + "speaker": "A", + "text": "I was just thinking, with the roads being icy, do you have to take any special precautions when driving?", + "original_text": "I was just thinking, with the roads being icy, do you have to take any special precautions when driving?", + "start_time": 10.192495361770163, + "end_time": 16.229683570386943, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_4_A.wav", + "silence_duration": 0.5083619608006916, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, we do. We install winter tires and keep emergency kits in our cars just in case we get stranded during particularly bad snowstorms.", + "original_text": "Yes, we do. We install winter tires and keep emergency kits in our cars just in case we get stranded during particularly bad snowstorms.", + "start_time": 16.982280651276817, + "end_time": 24.261736433589743, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_5_B.wav", + "silence_duration": 0.5320075117288774, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds tough. So, do you get much rain during the summer?", + "original_text": "That sounds tough. So, do you get much rain during the summer?", + "start_time": 24.775077585338277, + "end_time": 28.513490283750976, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_6_A.wav", + "silence_duration": 0.5133411517485332, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Plenty. We never worry about lack of rainwater in our area as the summer showers are quite frequent and sometimes quite heavy.", + "original_text": "Plenty. We never worry about lack of rainwater in our area as the summer showers are quite frequent and sometimes quite heavy.", + "start_time": 28.95106101451897, + "end_time": 35.87060749977974, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_7_B.wav", + "silence_duration": 0.4375707307679938, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So you should bring an umbrella often.", + "original_text": "So you should bring an umbrella often.", + "start_time": 36.341112986545774, + "end_time": 38.51217874618296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_8_A.wav", + "silence_duration": 0.47050548676603854, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's right. It's better to be prepared than caught in a sudden downpour while going about your daily activities.", + "original_text": "That's right. It's better to be prepared than caught in a sudden downpour while going about your daily activities.", + "start_time": 39.024315112424496, + "end_time": 44.20236499904581, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--357/temp/line_9_B.wav", + "silence_duration": 0.5121363662415375, + "is_interrupted": false + } + ] + }, + "DialogSum--val--358": { + "original_text": "A: Yes, But I couldn't help it. I was late getting off work for a start and then I missed the bus. The bus I did catch got stuck in the traffic jam. It was one thing after [interrupt] another, and everything just seemed to go wrong - first my computer crashed while I was typing the letters, then the printer ran out of ink right when I needed to print them.\nB: Wait, why were you getting off work so late? The office closes at six, doesn't it?\nA: Yes, but there was a rush at that moment, and my boss asked me to do some urgent letters.\nB: Didn't you tell him you had an appointment?\nA: Well, no. I thought I'd finish in five minutes, and I didn't want to be difficult about just a few minutes. If I hadn't missed the bus and got stuck in traffic, I wouldn't have been so late. I'm sorry.\nB: I understand. But just to clarify, you mentioned your boss asked you to handle urgent letters—did you manage to finish them on time?\nA: Yes, I did. But it took longer than expected. Anyway, I'm really sorry for being late.\nB: Well, you're here now.", + "cleaned_text": "A:Yes, But I couldn't help it. I was late getting off work for a start and then I missed the bus. The bus I did catch got stuck in the traffic jam. It was one thing after another, and everything just seemed to go wrong - first my computer crashed while I was typing the letters, then the printer ran out of ink right when I needed to print them.\nB: Wait, why were you getting off work so late? The office closes at six, doesn't it?\nA: Yes, but there was a rush at that moment, and my boss asked me to do some urgent letters.\nB: Didn't you tell him you had an appointment?\nA: Well, no. I thought I'd finish in five minutes, and I didn't want to be difficult about just a few minutes. If I hadn't missed the bus and got stuck in traffic, I wouldn't have been so late. I'm sorry.\nB: I understand. But just to clarify, you mentioned your boss asked you to handle urgent letters—did you manage to finish them on time?\nA: Yes, I did. But it took longer than expected. Anyway, I'm really sorry for being late.\nB: Well, you're here now.", + "total_duration": 57.72321995464853, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Yes, But I couldn't help it. I was late getting off work for a start and then I missed the bus. The bus I did catch got stuck in the traffic jam. It was one thing after", + "original_text": "Yes, But I couldn't help it. I was late getting off work for a start and then I missed the bus. The bus I did catch got stuck in the traffic jam. It was one thing after [interrupt] another, and everything just seemed to go wrong - first my computer crashed while I was typing the letters, then the printer ran out of ink right when I needed to print them.", + "start_time": 0, + "end_time": 20.538049886621316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "another, and everything just seemed to go wrong - first my computer crashed while I was typing the letters, then the printer ran out of ink right when I needed to print them." + }, + { + "speaker": "B", + "text": "Wait, why were you getting off work so late? The office closes at six, doesn't it?", + "original_text": "Wait, why were you getting off work so late? The office closes at six, doesn't it?", + "start_time": 10.193560090702947, + "end_time": 14.547301587301586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_1_B.wav", + "silence_duration": 0.39512661667910026, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, but there was a rush at that moment, and my boss asked me to do some urgent letters.", + "original_text": "Yes, but there was a rush at that moment, and my boss asked me to do some urgent letters.", + "start_time": 20.857916279399472, + "end_time": 26.11723600729063, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_2_A.wav", + "silence_duration": 0.3198663927781564, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Didn't you tell him you had an appointment?", + "original_text": "Didn't you tell him you had an appointment?", + "start_time": 26.476395049803944, + "end_time": 28.206281671119136, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_3_B.wav", + "silence_duration": 0.35915904251331576, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, no. I thought I'd finish in five minutes, and I didn't want to be difficult about just a few minutes. If I hadn't missed the bus and got stuck in traffic, I wouldn't have been so late. I'm sorry.", + "original_text": "Well, no. I thought I'd finish in five minutes, and I didn't want to be difficult about just a few minutes. If I hadn't missed the bus and got stuck in traffic, I wouldn't have been so late. I'm sorry.", + "start_time": 28.799338735510275, + "end_time": 41.31489429106583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_4_A.wav", + "silence_duration": 0.593057064391139, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I understand. But just to clarify, you mentioned your boss asked you to handle urgent letters—did you manage to finish them on time?", + "original_text": "I understand. But just to clarify, you mentioned your boss asked you to handle urgent letters—did you manage to finish them on time?", + "start_time": 41.75225192274586, + "end_time": 49.04331768238305, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_5_B.wav", + "silence_duration": 0.4373576316800315, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I did. But it took longer than expected. Anyway, I'm really sorry for being late.", + "original_text": "Yes, I did. But it took longer than expected. Anyway, I'm really sorry for being late.", + "start_time": 49.353104752071296, + "end_time": 55.84308207633433, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_6_A.wav", + "silence_duration": 0.309787069688246, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, you're here now.", + "original_text": "Well, you're here now.", + "start_time": 56.30681146470374, + "end_time": 57.72322869826383, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--358/temp/line_7_B.wav", + "silence_duration": 0.46372938836940825, + "is_interrupted": false + } + ] + }, + "DialogSum--val--359": { + "original_text": "A: Look! They are playing The Matrix today.\nB: You are right, look at the crowd. Do you think we will be able to [interrupt] get good seats if we manage to get tickets? The theater seems packed and I'm worried we might end up sitting in the very front row.\nA: Sorry to cut in, but if we can't, maybe we should consider buying from ticket scalpers?\nB: No way. I'd rather go to another movie house.\nA: Come on. We are already here. Besides, I really wanna see this picture.\nB: All right. Let's see when the next movie is playing?\nA: Seven thirty. There is only 10 minutes left and look at the long [interrupt] line stretching all the way to the parking lot. We might not make it in time unless we find some way to speed up the process.\nB: Oh, I just realized, did you check if the scalpers have tickets for this showing? We might not have time to wait in this line.\nA: I didn't, but I really don't want to buy from them. Shall we just take a chance and see if we can get in?\nB: Yeah, let's do so.\nA: It's moving so slow.\nB: What can you expect with this crowd? I am praying that no one will cut in the line.\nA: I don't think anyone will.", + "cleaned_text": "A: Look! They are playing The Matrix today.\nB:You are right, look at the crowd. Do you think we will be able to get good seats if we manage to get tickets? The theater seems packed and I'm worried we might end up sitting in the very front row.\nA: Sorry to cut in, but if we can't, maybe we should consider buying from ticket scalpers?\nB: No way. I'd rather go to another movie house.\nA: Come on. We are already here. Besides, I really wanna see this picture.\nB: All right. Let's see when the next movie is playing?\nA:Seven thirty. There is only 10 minutes left and look at the long line stretching all the way to the parking lot. We might not make it in time unless we find some way to speed up the process.\nB: Oh, I just realized, did you check if the scalpers have tickets for this showing? We might not have time to wait in this line.\nA: I didn't, but I really don't want to buy from them. Shall we just take a chance and see if we can get in?\nB: Yeah, let's do so.\nA: It's moving so slow.\nB: What can you expect with this crowd? I am praying that no one will cut in the line.\nA: I don't think anyone will.", + "total_duration": 58.63242630385488, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Look! They are playing The Matrix today.", + "original_text": "Look! They are playing The Matrix today.", + "start_time": 0, + "end_time": 2.6586848072562357, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You are right, look at the crowd. Do you think we will be able to", + "original_text": "You are right, look at the crowd. Do you think we will be able to [interrupt] get good seats if we manage to get tickets? The theater seems packed and I'm worried we might end up sitting in the very front row.", + "start_time": 3.0551410545246247, + "end_time": 12.470832664501948, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_1_B.wav", + "silence_duration": 0.396456247268389, + "is_interrupted": true, + "text_after_interrupt": "get good seats if we manage to get tickets? The theater seems packed and I'm worried we might end up sitting in the very front row." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but if we can't, maybe we should consider buying from ticket scalpers?", + "original_text": "Sorry to cut in, but if we can't, maybe we should consider buying from ticket scalpers?", + "start_time": 6.665844002370429, + "end_time": 12.180583231395373, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_2_A.wav", + "silence_duration": 0.49151380233654524, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No way. I'd rather go to another movie house.", + "original_text": "No way. I'd rather go to another movie house.", + "start_time": 12.795375808025975, + "end_time": 15.349570819363844, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_3_B.wav", + "silence_duration": 0.32454314352402636, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Come on. We are already here. Besides, I really wanna see this picture.", + "original_text": "Come on. We are already here. Besides, I really wanna see this picture.", + "start_time": 15.655707896952627, + "end_time": 20.17198907609095, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_4_A.wav", + "silence_duration": 0.3061370775887837, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "All right. Let's see when the next movie is playing?", + "original_text": "All right. Let's see when the next movie is playing?", + "start_time": 20.605749282837817, + "end_time": 23.05545449825732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_5_B.wav", + "silence_duration": 0.43376020674686633, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Seven thirty. There is only 10 minutes left and look at the long", + "original_text": "Seven thirty. There is only 10 minutes left and look at the long [interrupt] line stretching all the way to the parking lot. We might not make it in time unless we find some way to speed up the process.", + "start_time": 23.61899701876185, + "end_time": 35.27541425232194, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_6_A.wav", + "silence_duration": 0.5635425205045295, + "is_interrupted": true, + "text_after_interrupt": "line stretching all the way to the parking lot. We might not make it in time unless we find some way to speed up the process." + }, + { + "speaker": "B", + "text": "Oh, I just realized, did you check if the scalpers have tickets for this showing? We might not have time to wait in this line.", + "original_text": "Oh, I just realized, did you check if the scalpers have tickets for this showing? We might not have time to wait in this line.", + "start_time": 34.96849171373388, + "end_time": 41.45846903799692, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_7_B.wav", + "silence_duration": 0.41636619356626203, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I didn't, but I really don't want to buy from them. Shall we just take a chance and see if we can get in?", + "original_text": "I didn't, but I really don't want to buy from them. Shall we just take a chance and see if we can get in?", + "start_time": 42.03077951515783, + "end_time": 48.24211738363856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_8_A.wav", + "silence_duration": 0.5723104771609117, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, let's do so.", + "original_text": "Yeah, let's do so.", + "start_time": 48.63896752267371, + "end_time": 49.78835527777575, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_9_B.wav", + "silence_duration": 0.3968501390351494, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's moving so slow.", + "original_text": "It's moving so slow.", + "start_time": 50.18997793376708, + "end_time": 51.78054482719112, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_10_A.wav", + "silence_duration": 0.4016226559913295, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What can you expect with this crowd? I am praying that no one will cut in the line.", + "original_text": "What can you expect with this crowd? I am praying that no one will cut in the line.", + "start_time": 52.22999210654413, + "end_time": 56.46763382990014, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_11_B.wav", + "silence_duration": 0.4494472793530125, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't think anyone will.", + "original_text": "I don't think anyone will.", + "start_time": 56.99546216488536, + "end_time": 58.63246896760645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--359/temp/line_12_A.wav", + "silence_duration": 0.5278283349852235, + "is_interrupted": false + } + ] + }, + "DialogSum--val--360": { + "original_text": "A: What can I do for you today? \nB: I need to return a book. \nA: Can I do anything else for you? \nB: I want to check this magazine [interrupt] to see if there's an article I was looking for about sustainable architecture and urban planning, which I heard was featured in this month's issue. \nA: Oh, just to clarify, we don't allow people to check out magazines. \nB: Why not? \nA: It's just a policy of ours. \nB: So what am I allowed to check out? \nA: You may check out books or videos. By the way, you mentioned wanting to check out the magazine earlier. Unfortunately— \nB: You will have to just read it in the library, right? That doesn't make any sense.", + "cleaned_text": "A: What can I do for you today? \nB: I need to return a book. \nA: Can I do anything else for you? \nB:I want to check this magazine to see if there's an article I was looking for about sustainable architecture and urban planning, which I heard was featured in this month's issue.\nA: Oh, just to clarify, we don't allow people to check out magazines. \nB: Why not? \nA: It's just a policy of ours. \nB: So what am I allowed to check out? \nA: You may check out books or videos. By the way, you mentioned wanting to check out the magazine earlier. Unfortunately— \nB: You will have to just read it in the library, right? That doesn't make any sense.", + "total_duration": 32.83587301587301, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What can I do for you today?", + "original_text": "What can I do for you today?", + "start_time": 0, + "end_time": 1.7182766439909296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I need to return a book.", + "original_text": "I need to return a book.", + "start_time": 2.227689831344252, + "end_time": 3.400297541094819, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_1_B.wav", + "silence_duration": 0.5094131873533223, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can I do anything else for you?", + "original_text": "Can I do anything else for you?", + "start_time": 3.914482570413078, + "end_time": 5.6675891463767964, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_2_A.wav", + "silence_duration": 0.514185029318259, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I want to check this magazine", + "original_text": "I want to check this magazine [interrupt] to see if there's an article I was looking for about sustainable architecture and urban planning, which I heard was featured in this month's issue.", + "start_time": 6.033218843559572, + "end_time": 14.671041972811272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_3_B.wav", + "silence_duration": 0.36562969718277555, + "is_interrupted": true, + "text_after_interrupt": "to see if there's an article I was looking for about sustainable architecture and urban planning, which I heard was featured in this month's issue." + }, + { + "speaker": "A", + "text": "Oh, just to clarify, we don't allow people to check out magazines.", + "original_text": "Oh, just to clarify, we don't allow people to check out magazines.", + "start_time": 7.542515895713767, + "end_time": 11.931087324285196, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_4_A.wav", + "silence_duration": 0.5745357730491525, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Why not?", + "original_text": "Why not?", + "start_time": 15.19822364339209, + "end_time": 15.976092124117713, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_5_B.wav", + "silence_duration": 0.5271816705808179, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's just a policy of ours.", + "original_text": "It's just a policy of ours.", + "start_time": 16.43158151601765, + "end_time": 18.544597389033523, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_6_A.wav", + "silence_duration": 0.45548939189994, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "So what am I allowed to check out?", + "original_text": "So what am I allowed to check out?", + "start_time": 18.95162768599713, + "end_time": 20.58863448871822, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_7_B.wav", + "silence_duration": 0.40703029696360676, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You may check out books or videos. By the way, you mentioned wanting to check out the magazine earlier. Unfortunately—", + "original_text": "You may check out books or videos. By the way, you mentioned wanting to check out the magazine earlier. Unfortunately—", + "start_time": 21.09278892611849, + "end_time": 28.186485071243208, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_8_A.wav", + "silence_duration": 0.5041544374002715, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You will have to just read it in the library, right? That doesn't make any sense.", + "original_text": "You will have to just read it in the library, right? That doesn't make any sense.", + "start_time": 28.737575179331238, + "end_time": 32.83589717479609, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--360/temp/line_9_B.wav", + "silence_duration": 0.5510901080880277, + "is_interrupted": false + } + ] + }, + "DialogSum--val--361": { + "original_text": "A: Hey, Mary, nice to see you again. I heard you're going back home to the U.S. \nB: Yes. I'm leaving tomorrow. I came here just because I want to [interrupt] personally say goodbye and thank you for everything you've done during my stay here - your kindness and support made my experience truly unforgettable. \nA: Oh, before I forget, do you need any help with packing or getting to the airport? \nB: That's so kind of you! But I've already taken care of everything. I actually wanted to say good-bye to you. \nA: You're so thoughtful. Wish you a good trip home. And we'll miss you. \nB: I'll miss you too, my friends. Let's definitely keep in touch and maybe plan a reunion visit next year if possible.", + "cleaned_text": "A: Hey, Mary, nice to see you again. I heard you're going back home to the U.S. \nB:Yes. I'm leaving tomorrow. I came here just because I want to personally say goodbye and thank you for everything you've done during my stay here - your kindness and support made my experience truly unforgettable.\nA: Oh, before I forget, do you need any help with packing or getting to the airport? \nB: That's so kind of you! But I've already taken care of everything. I actually wanted to say good-bye to you. \nA: You're so thoughtful. Wish you a good trip home. And we'll miss you. \nB: I'll miss you too, my friends. Let's definitely keep in touch and maybe plan a reunion visit next year if possible.", + "total_duration": 32.60013605442177, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hey, Mary, nice to see you again. I heard you're going back home to the U.S.", + "original_text": "Hey, Mary, nice to see you again. I heard you're going back home to the U.S.", + "start_time": 0, + "end_time": 5.073560090702948, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. I'm leaving tomorrow. I came here just because I want to", + "original_text": "Yes. I'm leaving tomorrow. I came here just because I want to [interrupt] personally say goodbye and thank you for everything you've done during my stay here - your kindness and support made my experience truly unforgettable.", + "start_time": 5.3902219371739735, + "end_time": 16.524190191142228, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/temp/line_1_B.wav", + "silence_duration": 0.31666184647102563, + "is_interrupted": true, + "text_after_interrupt": "personally say goodbye and thank you for everything you've done during my stay here - your kindness and support made my experience truly unforgettable." + }, + { + "speaker": "A", + "text": "Oh, before I forget, do you need any help with packing or getting to the airport?", + "original_text": "Oh, before I forget, do you need any help with packing or getting to the airport?", + "start_time": 8.826775225155833, + "end_time": 13.726185655994836, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/temp/line_2_A.wav", + "silence_duration": 0.40058366157633163, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's so kind of you! But I've already taken care of everything. I actually wanted to say good-bye to you.", + "original_text": "That's so kind of you! But I've already taken care of everything. I actually wanted to say good-bye to you.", + "start_time": 16.84741117946913, + "end_time": 21.89775131552355, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/temp/line_3_B.wav", + "silence_duration": 0.3232209883269037, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're so thoughtful. Wish you a good trip home. And we'll miss you.", + "original_text": "You're so thoughtful. Wish you a good trip home. And we'll miss you.", + "start_time": 22.4196604413818, + "end_time": 26.297392867685655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/temp/line_4_A.wav", + "silence_duration": 0.5219091258582508, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll miss you too, my friends. Let's definitely keep in touch and maybe plan a reunion visit next year if possible.", + "original_text": "I'll miss you too, my friends. Let's definitely keep in touch and maybe plan a reunion visit next year if possible.", + "start_time": 26.644217771961106, + "end_time": 32.60013613930805, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--361/temp/line_5_B.wav", + "silence_duration": 0.3468249042754494, + "is_interrupted": false + } + ] + }, + "DialogSum--val--363": { + "original_text": "A: Are you alright, Ethan? You don't seem to be as cheerful as you normally are.\nB: To be honest, Ava, I've just had a really bad day.\nA: What happened?\nB: First, I slept through my alarm and ended up two hours late to [interrupt] an important meeting that I was supposed to lead, which completely threw off my entire schedule and made me look incredibly unprofessional in front of all the senior executives.\nA: Oh no, that sounds stressful! Did you manage to explain the situation to your boss?\nB: He told me that if I showed up late one more time, he'd fire me. He's so mean!\nA: That's horrible. Was that the first time you'd shown up late to work?\nB: That was my second time. The first time, I was in a car accident.\nA: Is your boss Chinese?\nB: No, he's from Australia. Before I met him, I thought Australians were supposed to be relaxed and easy-going. I had no idea he'd be so fussy about punctuality and deadlines.\nA: Wait, you mentioned earlier that you were in a car accident. Are you okay now? That must have been really tough.\nB: Yeah, I'm fine now, thanks for asking. But back to my boss—I was saying that I had no idea he'd be so fussy about [interrupt] things like arriving exactly on time or submitting reports days before they're actually due, even when there's no real urgency involved.\nA: What are you going to do?\nB: I think I'm going to look for another job. I need to find a boss that is a bit more sensitive and optimistic than my current boss.", + "cleaned_text": "A: Are you alright, Ethan? You don't seem to be as cheerful as you normally are.\nB: To be honest, Ava, I've just had a really bad day.\nA: What happened?\nB:First, I slept through my alarm and ended up two hours late to an important meeting that I was supposed to lead, which completely threw off my entire schedule and made me look incredibly unprofessional in front of all the senior executives.\nA: Oh no, that sounds stressful! Did you manage to explain the situation to your boss?\nB: He told me that if I showed up late one more time, he'd fire me. He's so mean!\nA: That's horrible. Was that the first time you'd shown up late to work?\nB: That was my second time. The first time, I was in a car accident.\nA: Is your boss Chinese?\nB: No, he's from Australia. Before I met him, I thought Australians were supposed to be relaxed and easy-going. I had no idea he'd be so fussy about punctuality and deadlines.\nA: Wait, you mentioned earlier that you were in a car accident. Are you okay now? That must have been really tough.\nB:Yeah, I'm fine now, thanks for asking. But back to my boss—I was saying that I had no idea he'd be so fussy about things like arriving exactly on time or submitting reports days before they're actually due, even when there's no real urgency involved.\nA: What are you going to do?\nB: I think I'm going to look for another job. I need to find a boss that is a bit more sensitive and optimistic than my current boss.", + "total_duration": 76.6267120181406, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you alright, Ethan? You don't seem to be as cheerful as you normally are.", + "original_text": "Are you alright, Ethan? You don't seem to be as cheerful as you normally are.", + "start_time": 0, + "end_time": 4.551111111111111, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "To be honest, Ava, I've just had a really bad day.", + "original_text": "To be honest, Ava, I've just had a really bad day.", + "start_time": 4.974911249013411, + "end_time": 7.970285398673275, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_1_B.wav", + "silence_duration": 0.4238001379023002, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What happened?", + "original_text": "What happened?", + "start_time": 8.455746732402389, + "end_time": 9.37293494101917, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_2_A.wav", + "silence_duration": 0.48546133372911393, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "First, I slept through my alarm and ended up two hours late to", + "original_text": "First, I slept through my alarm and ended up two hours late to [interrupt] an important meeting that I was supposed to lead, which completely threw off my entire schedule and made me look incredibly unprofessional in front of all the senior executives.", + "start_time": 9.933563307433479, + "end_time": 22.367849021719195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_3_B.wav", + "silence_duration": 0.5606283664143097, + "is_interrupted": true, + "text_after_interrupt": "an important meeting that I was supposed to lead, which completely threw off my entire schedule and made me look incredibly unprofessional in front of all the senior executives." + }, + { + "speaker": "A", + "text": "Oh no, that sounds stressful! Did you manage to explain the situation to your boss?", + "original_text": "Oh no, that sounds stressful! Did you manage to explain the situation to your boss?", + "start_time": 13.822905711061598, + "end_time": 18.815195960494705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_4_A.wav", + "silence_duration": 0.5708572379292192, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "He told me that if I showed up late one more time, he'd fire me. He's so mean!", + "original_text": "He told me that if I showed up late one more time, he'd fire me. He's so mean!", + "start_time": 22.680300500141744, + "end_time": 27.13853179265875, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_5_B.wav", + "silence_duration": 0.3124514784225481, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's horrible. Was that the first time you'd shown up late to work?", + "original_text": "That's horrible. Was that the first time you'd shown up late to work?", + "start_time": 27.625811012997502, + "end_time": 31.584813280571197, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_6_A.wav", + "silence_duration": 0.48727922033875337, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That was my second time. The first time, I was in a car accident.", + "original_text": "That was my second time. The first time, I was in a car accident.", + "start_time": 32.15930411863205, + "end_time": 35.688737225208016, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_7_B.wav", + "silence_duration": 0.5744908380608502, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is your boss Chinese?", + "original_text": "Is your boss Chinese?", + "start_time": 36.08107241922124, + "end_time": 37.55553953940265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_8_A.wav", + "silence_duration": 0.3923351940132267, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, he's from Australia. Before I met him, I thought Australians were supposed to be relaxed and easy-going. I had no idea he'd be so fussy about punctuality and deadlines.", + "original_text": "No, he's from Australia. Before I met him, I thought Australians were supposed to be relaxed and easy-going. I had no idea he'd be so fussy about punctuality and deadlines.", + "start_time": 38.03939936724196, + "end_time": 47.87305016089276, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_9_B.wav", + "silence_duration": 0.4838598278393126, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, you mentioned earlier that you were in a car accident. Are you okay now? That must have been really tough.", + "original_text": "Wait, you mentioned earlier that you were in a car accident. Are you okay now? That must have been really tough.", + "start_time": 48.303535932865564, + "end_time": 55.00249284896534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_10_A.wav", + "silence_duration": 0.4304857719728055, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I'm fine now, thanks for asking. But back to my boss—I was saying that I had no idea he'd be so fussy about", + "original_text": "Yeah, I'm fine now, thanks for asking. But back to my boss—I was saying that I had no idea he'd be so fussy about [interrupt] things like arriving exactly on time or submitting reports days before they're actually due, even when there's no real urgency involved.", + "start_time": 55.39599499932294, + "end_time": 69.5717773122481, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_11_B.wav", + "silence_duration": 0.3935021503575951, + "is_interrupted": true, + "text_after_interrupt": "things like arriving exactly on time or submitting reports days before they're actually due, even when there's no real urgency involved." + }, + { + "speaker": "A", + "text": "What are you going to do?", + "original_text": "What are you going to do?", + "start_time": 67.21694054936589, + "end_time": 68.4708181003863, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_12_A.wav", + "silence_duration": 0.5463325701034389, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think I'm going to look for another job. I need to find a boss that is a bit more sensitive and optimistic than my current boss.", + "original_text": "I think I'm going to look for another job. I need to find a boss that is a bit more sensitive and optimistic than my current boss.", + "start_time": 70.0090497642757, + "end_time": 76.62673683910563, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--363/temp/line_13_B.wav", + "silence_duration": 0.43727245202759746, + "is_interrupted": false + } + ] + }, + "DialogSum--val--364": { + "original_text": "A: So, Monica, what do you feel like doing this afternoon? \nB: Actually, I had a perfect plan for this afternoon, but it is totally ruined by the sand storm. I woke up this morning and found it was sunny. So I called Lucy and asked her to go shopping with me. We were going to look for a new purse. Now it turned out to be like this. Neither of us wants to go [interrupt] out in this weather, so we decided to postpone our shopping trip until the weather clears up and maybe grab some coffee at that new café near the mall when we finally get to go.\nA: Oh, I totally understand. The weather can really mess up plans. But I was wondering, have you noticed if these sand storms are happening more frequently than before? \nB: Yes, I think so. The sand storm happens more frequently these days than the years before. Can't people do something to stop it? \nA: It is not an easy job. The government is working on it. Lots of trees have been planted in the north of the capital. Also, methods of generating rain are being used by the government to fight against the drought. But of course, it will not work overnight. So, have you come out with a new plan for today? \nB: My new plan is to wait for the end of the sand storm and clean my apartment. Oh, and by the way, earlier you mentioned you were going to go shopping with Lucy. Were you planning to buy anything else besides the purse? \nA: Ah, I almost forgot to ask—what kind of purse were you looking for?", + "cleaned_text": "A: So, Monica, what do you feel like doing this afternoon? \nB:Actually, I had a perfect plan for this afternoon, but it is totally ruined by the sand storm. I woke up this morning and found it was sunny. So I called Lucy and asked her to go shopping with me. We were going to look for a new purse. Now it turned out to be like this. Neither of us wants to go out in this weather, so we decided to postpone our shopping trip until the weather clears up and maybe grab some coffee at that new café near the mall when we finally get to go.\nA: Oh, I totally understand. The weather can really mess up plans. But I was wondering, have you noticed if these sand storms are happening more frequently than before? \nB: Yes, I think so. The sand storm happens more frequently these days than the years before. Can't people do something to stop it? \nA: It is not an easy job. The government is working on it. Lots of trees have been planted in the north of the capital. Also, methods of generating rain are being used by the government to fight against the drought. But of course, it will not work overnight. So, have you come out with a new plan for today? \nB: My new plan is to wait for the end of the sand storm and clean my apartment. Oh, and by the way, earlier you mentioned you were going to go shopping with Lucy. Were you planning to buy anything else besides the purse? \nA: Ah, I almost forgot to ask—what kind of purse were you looking for?", + "total_duration": 69.96439909297052, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "So, Monica, what do you feel like doing this afternoon?", + "original_text": "So, Monica, what do you feel like doing this afternoon?", + "start_time": 0, + "end_time": 3.111473922902494, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Actually, I had a perfect plan for this afternoon, but it is totally ruined by the sand storm. I woke up this morning and found it was sunny. So I called Lucy and asked her to go shopping with me. We were going to look for a new purse. Now it turned out to be like this. Neither of us wants to go", + "original_text": "Actually, I had a perfect plan for this afternoon, but it is totally ruined by the sand storm. I woke up this morning and found it was sunny. So I called Lucy and asked her to go shopping with me. We were going to look for a new purse. Now it turned out to be like this. Neither of us wants to go [interrupt] out in this weather, so we decided to postpone our shopping trip until the weather clears up and maybe grab some coffee at that new café near the mall when we finally get to go.", + "start_time": 3.568626879522178, + "end_time": 27.392300348909934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/temp/line_1_B.wav", + "silence_duration": 0.4571529566196837, + "is_interrupted": true, + "text_after_interrupt": "out in this weather, so we decided to postpone our shopping trip until the weather clears up and maybe grab some coffee at that new café near the mall when we finally get to go." + }, + { + "speaker": "A", + "text": "Oh, I totally understand. The weather can really mess up plans. But I was wondering, have you noticed if these sand storms are happening more frequently than before?", + "original_text": "Oh, I totally understand. The weather can really mess up plans. But I was wondering, have you noticed if these sand storms are happening more frequently than before?", + "start_time": 18.545497627821497, + "end_time": 28.239828693581135, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/temp/line_2_A.wav", + "silence_duration": 0.43209947871138255, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I think so. The sand storm happens more frequently these days than the years before. Can't people do something to stop it?", + "original_text": "Yes, I think so. The sand storm happens more frequently these days than the years before. Can't people do something to stop it?", + "start_time": 28.798063859269682, + "end_time": 35.55507066199077, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/temp/line_3_B.wav", + "silence_duration": 0.5582351656885483, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It is not an easy job. The government is working on it. Lots of trees have been planted in the north of the capital. Also, methods of generating rain are being used by the government to fight against the drought. But of course, it will not work overnight. So, have you come out with a new plan for today?", + "original_text": "It is not an easy job. The government is working on it. Lots of trees have been planted in the north of the capital. Also, methods of generating rain are being used by the government to fight against the drought. But of course, it will not work overnight. So, have you come out with a new plan for today?", + "start_time": 35.9180707028905, + "end_time": 54.296664807198894, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/temp/line_4_A.wav", + "silence_duration": 0.3630000408997345, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My new plan is to wait for the end of the sand storm and clean my apartment. Oh, and by the way, earlier you mentioned you were going to go shopping with Lucy. Were you planning to buy anything else besides the purse?", + "original_text": "My new plan is to wait for the end of the sand storm and clean my apartment. Oh, and by the way, earlier you mentioned you were going to go shopping with Lucy. Were you planning to buy anything else besides the purse?", + "start_time": 54.871959422432326, + "end_time": 65.14678935440512, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/temp/line_5_B.wav", + "silence_duration": 0.5752946152334342, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah, I almost forgot to ask—what kind of purse were you looking for?", + "original_text": "Ah, I almost forgot to ask—what kind of purse were you looking for?", + "start_time": 65.72678220634462, + "end_time": 69.96442392970063, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--364/temp/line_6_A.wav", + "silence_duration": 0.5799928519395066, + "is_interrupted": false + } + ] + }, + "DialogSum--val--365": { + "original_text": "A: Elaine's back from school. I think it might be a nice gesture if you asked her out. I suppose she's not good enough for you, is that [interrupt] why you haven't considered giving her a chance despite knowing she's grown into a remarkable person with diverse interests and accomplishments?\n\nB: It's not about that. Elaine Robinson and I do not get along.\n\nA: How do you know? You haven't seen her since high school. I guess your evenings, whatever you do with them, are just too valuable.\n\nB: That has nothing to do with it. . .\n\nA: Then what is it? I mean, if you absolutely refuse to take her out [interrupt] just because of some old high school memories, maybe you're missing out on getting to know the wonderful person she's become over these years.\n\nB: I do. But wait, you mentioned something about my evenings being too valuable—what exactly are you trying to imply?", + "cleaned_text": "A:Elaine's back from school. I think it might be a nice gesture if you asked her out. I suppose she's not good enough for you, is that why you haven't considered giving her a chance despite knowing she's grown into a remarkable person with diverse interests and accomplishments?\n\nB: It's not about that. Elaine Robinson and I do not get along.\n\nA: How do you know? You haven't seen her since high school. I guess your evenings, whatever you do with them, are just too valuable.\n\nB: That has nothing to do with it. . .\n\nA:Then what is it? I mean, if you absolutely refuse to take her out just because of some old high school memories, maybe you're missing out on getting to know the wonderful person she's become over these years.\n\nB: I do. But wait, you mentioned something about my evenings being too valuable—what exactly are you trying to imply?", + "total_duration": 40.46684807256236, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Elaine's back from school. I think it might be a nice gesture if you asked her out. I suppose she's not good enough for you, is that", + "original_text": "Elaine's back from school. I think it might be a nice gesture if you asked her out. I suppose she's not good enough for you, is that [interrupt] why you haven't considered giving her a chance despite knowing she's grown into a remarkable person with diverse interests and accomplishments?", + "start_time": 0, + "end_time": 15.568979591836735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "why you haven't considered giving her a chance despite knowing she's grown into a remarkable person with diverse interests and accomplishments?" + }, + { + "speaker": "B", + "text": "It's not about that. Elaine Robinson and I do not get along.", + "original_text": "It's not about that. Elaine Robinson and I do not get along.", + "start_time": 8.115374149659864, + "end_time": 11.331337868480727, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/temp/line_1_B.wav", + "silence_duration": 0.4319145210583605, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How do you know? You haven't seen her since high school. I guess your evenings, whatever you do with them, are just too valuable.", + "original_text": "How do you know? You haven't seen her since high school. I guess your evenings, whatever you do with them, are just too valuable.", + "start_time": 16.14527865013837, + "end_time": 23.796253706827713, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/temp/line_2_A.wav", + "silence_duration": 0.5762990583016345, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That has nothing to do with it. . .", + "original_text": "That has nothing to do with it. . .", + "start_time": 24.30185279203086, + "end_time": 25.63700018432111, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/temp/line_3_B.wav", + "silence_duration": 0.5055990852031462, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Then what is it? I mean, if you absolutely refuse to take her out", + "original_text": "Then what is it? I mean, if you absolutely refuse to take her out [interrupt] just because of some old high school memories, maybe you're missing out on getting to know the wonderful person she's become over these years.", + "start_time": 26.06902775762382, + "end_time": 39.327621861932215, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/temp/line_4_A.wav", + "silence_duration": 0.4320275733027102, + "is_interrupted": true, + "text_after_interrupt": "just because of some old high school memories, maybe you're missing out on getting to know the wonderful person she's become over these years." + }, + { + "speaker": "B", + "text": "I do. But wait, you mentioned something about my evenings being too valuable—what exactly are you trying to imply?", + "original_text": "I do. But wait, you mentioned something about my evenings being too valuable—what exactly are you trying to imply?", + "start_time": 34.3948327231851, + "end_time": 40.46685086377467, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--365/temp/line_5_B.wav", + "silence_duration": 0.5962884008396228, + "is_interrupted": false + } + ] + }, + "DialogSum--val--366": { + "original_text": "A: Helen, you must be excited at going to America to study. \nB: Yeah, I've been looking forward to it for [interrupt] a long time. It's been my dream since high school when I first read about American universities and their world-class research facilities. \nA: Sorry to interrupt, but have you already sorted out your visa and accommodation? \nB: Yes, I have. But I haven't mentioned what my classmates think yet—they've been really supportive and gave me a lot of congratulations. \nA: That's great to hear! So, how long will you study there? \nB: Oh, maybe three years. I will study and get the master degree first. Then I will decide whether I will stay there or pursue a PhD, depending on how things go. \nA: Stay there or come back? That's a tough decision. Which university will you be attending? \nB: Chicago University. My major is Economics. \nA: Good luck! \nB: Thank you!", + "cleaned_text": "A: Helen, you must be excited at going to America to study. \nB:Yeah, I've been looking forward to it for a long time. It's been my dream since high school when I first read about American universities and their world-class research facilities.\nA: Sorry to interrupt, but have you already sorted out your visa and accommodation? \nB: Yes, I have. But I haven't mentioned what my classmates think yet—they've been really supportive and gave me a lot of congratulations. \nA: That's great to hear! So, how long will you study there? \nB: Oh, maybe three years. I will study and get the master degree first. Then I will decide whether I will stay there or pursue a PhD, depending on how things go. \nA: Stay there or come back? That's a tough decision. Which university will you be attending? \nB: Chicago University. My major is Economics. \nA: Good luck! \nB: Thank you!", + "total_duration": 46.12439909297052, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Helen, you must be excited at going to America to study.", + "original_text": "Helen, you must be excited at going to America to study.", + "start_time": 0, + "end_time": 3.308843537414966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I've been looking forward to it for", + "original_text": "Yeah, I've been looking forward to it for [interrupt] a long time. It's been my dream since high school when I first read about American universities and their world-class research facilities.", + "start_time": 3.8310713874411073, + "end_time": 13.328032838688273, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_1_B.wav", + "silence_duration": 0.5222278500261412, + "is_interrupted": true, + "text_after_interrupt": "a long time. It's been my dream since high school when I first read about American universities and their world-class research facilities." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but have you already sorted out your visa and accommodation?", + "original_text": "Sorry to interrupt, but have you already sorted out your visa and accommodation?", + "start_time": 6.350436466806187, + "end_time": 11.09891719242977, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_2_A.wav", + "silence_duration": 0.5137054255506397, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I have. But I haven't mentioned what my classmates think yet—they've been really supportive and gave me a lot of congratulations.", + "original_text": "Yes, I have. But I haven't mentioned what my classmates think yet—they've been really supportive and gave me a lot of congratulations.", + "start_time": 13.87791376272168, + "end_time": 20.890340066576556, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_3_B.wav", + "silence_duration": 0.5498809240334087, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's great to hear! So, how long will you study there?", + "original_text": "That's great to hear! So, how long will you study there?", + "start_time": 21.281027823811726, + "end_time": 25.298079978006736, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_4_A.wav", + "silence_duration": 0.39068775723517024, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, maybe three years. I will study and get the master degree first. Then I will decide whether I will stay there or pursue a PhD, depending on how things go.", + "original_text": "Oh, maybe three years. I will study and get the master degree first. Then I will decide whether I will stay there or pursue a PhD, depending on how things go.", + "start_time": 25.833946516402122, + "end_time": 35.11031839848829, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_5_B.wav", + "silence_duration": 0.5358665383953856, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Stay there or come back? That's a tough decision. Which university will you be attending?", + "original_text": "Stay there or come back? That's a tough decision. Which university will you be attending?", + "start_time": 35.48843305484789, + "end_time": 41.02639223852136, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_6_A.wav", + "silence_duration": 0.37811465635959746, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Chicago University. My major is Economics.", + "original_text": "Chicago University. My major is Economics.", + "start_time": 41.56444816706489, + "end_time": 44.15347311037554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_7_B.wav", + "silence_duration": 0.538055928543531, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good luck!", + "original_text": "Good luck!", + "start_time": 44.49044877380938, + "end_time": 45.30314718650779, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_8_A.wav", + "silence_duration": 0.3369756634338368, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you!", + "original_text": "Thank you!", + "start_time": 45.694860034607366, + "end_time": 46.124429195605096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--366/temp/line_9_B.wav", + "silence_duration": 0.3917128480995742, + "is_interrupted": false + } + ] + }, + "DialogSum--val--367": { + "original_text": "A: Hi Charles, I want you to know that I finally found an apartment in Haitian.\nB: You did? That is great!\nA: Yeah, I am having a party this Saturday night, a sort of housewarming, and I want to invite you. Are you [interrupt] free that evening? I'd love for you to come and meet some of my new neighbors who are really interesting people from different cultural backgrounds.\nB: Oh, that sounds awesome! Quick question though—what time should I be there?\nA: Around seven.\nB: Ok, great, should I bring anything?\nA: No, but thanks for offering. Actually, could you bring some fold-up chairs for people if you have any? I'm afraid not everyone's going to have a seat, do you [interrupt] think you could bring a few extra just in case we have more guests than expected? I'd really appreciate the help.\nB: Oh sure, I'll be happy to bring a few. By the way, what's the address?\nA: Oh, I was just about to mention that—don't worry, I'll come to pick you up at about 6:30.\nB: Got it. Looking forward to it!", + "cleaned_text": "A: Hi Charles, I want you to know that I finally found an apartment in Haitian.\nB: You did? That is great!\nA:Yeah, I am having a party this Saturday night, a sort of housewarming, and I want to invite you. Are you free that evening? I'd love for you to come and meet some of my new neighbors who are really interesting people from different cultural backgrounds.\nB: Oh, that sounds awesome! Quick question though—what time should I be there?\nA: Around seven.\nB: Ok, great, should I bring anything?\nA:No, but thanks for offering. Actually, could you bring some fold-up chairs for people if you have any? I'm afraid not everyone's going to have a seat, do you think you could bring a few extra just in case we have more guests than expected? I'd really appreciate the help.\nB: Oh sure, I'll be happy to bring a few. By the way, what's the address?\nA: Oh, I was just about to mention that—don't worry, I'll come to pick you up at about 6:30.\nB: Got it. Looking forward to it!", + "total_duration": 50.98607709750567, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi Charles, I want you to know that I finally found an apartment in Haitian.", + "original_text": "Hi Charles, I want you to know that I finally found an apartment in Haitian.", + "start_time": 0, + "end_time": 4.818140589569161, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You did? That is great!", + "original_text": "You did? That is great!", + "start_time": 5.294558135234601, + "end_time": 6.803855187388796, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_1_B.wav", + "silence_duration": 0.4764175456654396, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, I am having a party this Saturday night, a sort of housewarming, and I want to invite you. Are you", + "original_text": "Yeah, I am having a party this Saturday night, a sort of housewarming, and I want to invite you. Are you [interrupt] free that evening? I'd love for you to come and meet some of my new neighbors who are really interesting people from different cultural backgrounds.", + "start_time": 7.199007693307427, + "end_time": 21.6882593939877, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_2_A.wav", + "silence_duration": 0.39515250591863205, + "is_interrupted": true, + "text_after_interrupt": "free that evening? I'd love for you to come and meet some of my new neighbors who are really interesting people from different cultural backgrounds." + }, + { + "speaker": "B", + "text": "Oh, that sounds awesome! Quick question though—what time should I be there?", + "original_text": "Oh, that sounds awesome! Quick question though—what time should I be there?", + "start_time": 14.710663022105614, + "end_time": 18.379415856572734, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_3_B.wav", + "silence_duration": 0.46535821426090357, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Around seven.", + "original_text": "Around seven.", + "start_time": 22.249857462849015, + "end_time": 23.283145444708424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_4_A.wav", + "silence_duration": 0.5615980688613138, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ok, great, should I bring anything?", + "original_text": "Ok, great, should I bring anything?", + "start_time": 23.70796966738832, + "end_time": 25.716495744485826, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_5_B.wav", + "silence_duration": 0.42482422267989683, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, but thanks for offering. Actually, could you bring some fold-up chairs for people if you have any? I'm afraid not everyone's going to have a seat, do you", + "original_text": "No, but thanks for offering. Actually, could you bring some fold-up chairs for people if you have any? I'm afraid not everyone's going to have a seat, do you [interrupt] think you could bring a few extra just in case we have more guests than expected? I'd really appreciate the help.", + "start_time": 26.29031444910706, + "end_time": 42.43979290715695, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_6_A.wav", + "silence_duration": 0.5738187046212352, + "is_interrupted": true, + "text_after_interrupt": "think you could bring a few extra just in case we have more guests than expected? I'd really appreciate the help." + }, + { + "speaker": "B", + "text": "Oh sure, I'll be happy to bring a few. By the way, what's the address?", + "original_text": "Oh sure, I'll be happy to bring a few. By the way, what's the address?", + "start_time": 39.67715141603125, + "end_time": 43.22980447725574, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_7_B.wav", + "silence_duration": 0.33706193882836144, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was just about to mention that—don't worry, I'll come to pick you up at about 6:30.", + "original_text": "Oh, I was just about to mention that—don't worry, I'll come to pick you up at about 6:30.", + "start_time": 43.71052957842994, + "end_time": 49.10916903421226, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_8_A.wav", + "silence_duration": 0.4807251011742012, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. Looking forward to it!", + "original_text": "Got it. Looking forward to it!", + "start_time": 49.511624213130325, + "end_time": 50.986091333311734, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--367/temp/line_9_B.wav", + "silence_duration": 0.40245517891806837, + "is_interrupted": false + } + ] + }, + "DialogSum--val--369": { + "original_text": "A: How do I use the powder? \nB: Please dissolve the powder in hot water. Soak your hand or foot in it for 20 minutes twice a day. \nA: How do I use the eye-drop and [interrupt] should I store it in the refrigerator after opening it or is room temperature sufficient for maintaining its effectiveness over the recommended usage period? \nB: Sorry to interrupt, but just to clarify, when you say \"twice a day,\" does it matter what time of day I do it? \nA: No, it doesn't matter, as long as you have a gap of several hours between the two sessions. Now, about the eye-drop, you should put it into your right eye 4 - 6 times a day, 1 - 2 drops each time. \nB: Got it. And the ointment? \nA: Squeeze a bit of the ointment on your eyelid every night. \nB: Well, I see. Thanks. \nA: You're welcome.", + "cleaned_text": "A: How do I use the powder? \nB: Please dissolve the powder in hot water. Soak your hand or foot in it for 20 minutes twice a day. \nA:How do I use the eye-drop and should I store it in the refrigerator after opening it or is room temperature sufficient for maintaining its effectiveness over the recommended usage period?\nB: Sorry to interrupt, but just to clarify, when you say \"twice a day,\" does it matter what time of day I do it? \nA: No, it doesn't matter, as long as you have a gap of several hours between the two sessions. Now, about the eye-drop, you should put it into your right eye 4 - 6 times a day, 1 - 2 drops each time. \nB: Got it. And the ointment? \nA: Squeeze a bit of the ointment on your eyelid every night. \nB: Well, I see. Thanks. \nA: You're welcome.", + "total_duration": 40.70825396825397, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How do I use the powder?", + "original_text": "How do I use the powder?", + "start_time": 0, + "end_time": 1.4396371882086167, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Please dissolve the powder in hot water. Soak your hand or foot in it for 20 minutes twice a day.", + "original_text": "Please dissolve the powder in hot water. Soak your hand or foot in it for 20 minutes twice a day.", + "start_time": 1.9617775297165116, + "end_time": 6.954067779149618, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_1_B.wav", + "silence_duration": 0.522140341507895, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How do I use the eye-drop and", + "original_text": "How do I use the eye-drop and [interrupt] should I store it in the refrigerator after opening it or is room temperature sufficient for maintaining its effectiveness over the recommended usage period?", + "start_time": 7.504663578507743, + "end_time": 18.174232739505474, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_2_A.wav", + "silence_duration": 0.5505957993581246, + "is_interrupted": true, + "text_after_interrupt": "should I store it in the refrigerator after opening it or is room temperature sufficient for maintaining its effectiveness over the recommended usage period?" + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but just to clarify, when you say \"twice a day,\" does it matter what time of day I do it?", + "original_text": "Sorry to interrupt, but just to clarify, when you say \"twice a day,\" does it matter what time of day I do it?", + "start_time": 9.083620494607516, + "end_time": 14.87699917941477, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_3_B.wav", + "silence_duration": 0.5099186817914172, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, it doesn't matter, as long as you have a gap of several hours between the two sessions. Now, about the eye-drop, you should put it into your right eye 4 - 6 times a day, 1 - 2 drops each time.", + "original_text": "No, it doesn't matter, as long as you have a gap of several hours between the two sessions. Now, about the eye-drop, you should put it into your right eye 4 - 6 times a day, 1 - 2 drops each time.", + "start_time": 18.713189002466986, + "end_time": 31.64670374169601, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_4_A.wav", + "silence_duration": 0.5389562629615132, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. And the ointment?", + "original_text": "Got it. And the ointment?", + "start_time": 32.16640648764234, + "end_time": 33.664093562472274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_5_B.wav", + "silence_duration": 0.5197027459463304, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Squeeze a bit of the ointment on your eyelid every night.", + "original_text": "Squeeze a bit of the ointment on your eyelid every night.", + "start_time": 34.102134718861535, + "end_time": 37.01623902725156, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_6_A.wav", + "silence_duration": 0.4380411563892612, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I see. Thanks.", + "original_text": "Well, I see. Thanks.", + "start_time": 37.49826888364311, + "end_time": 39.27459541425535, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_7_B.wav", + "silence_duration": 0.48202985639155094, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're welcome.", + "original_text": "You're welcome.", + "start_time": 39.698214814145786, + "end_time": 40.70828284135667, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--369/temp/line_8_A.wav", + "silence_duration": 0.42361939989043274, + "is_interrupted": false + } + ] + }, + "DialogSum--val--370": { + "original_text": "A: I bought it. I got a watch, too. The company that sells this car has a car club where members can [interrupt] participate in exclusive events, get discounts on accessories, and even attend private track days to really push their vehicles to the limit.\nB: Where you can buy lots of paraphernalia?\nA: Yeah, and meet other drivers of the same car!\nB: Cool!\nA: I know girls love this kind of car. Look, it's got a sunroof! Imagine... a cool, starry night, driving down the coast with the top open.\nB: Sorry to cut in, but are you planning to take Sarah's car out tonight?\nA: Oh, no, I was just imagining the vibe. But speaking of that, I didn't finish telling you about the car club. It's not just about buying stuff; they also organize events and road trips.\nB: That sounds fun! But back to the car, are you seriously going to use Sarah's car to go cruising for chicks?", + "cleaned_text": "A:I bought it. I got a watch, too. The company that sells this car has a car club where members can participate in exclusive events, get discounts on accessories, and even attend private track days to really push their vehicles to the limit.\nB: Where you can buy lots of paraphernalia?\nA: Yeah, and meet other drivers of the same car!\nB: Cool!\nA: I know girls love this kind of car. Look, it's got a sunroof! Imagine... a cool, starry night, driving down the coast with the top open.\nB: Sorry to cut in, but are you planning to take Sarah's car out tonight?\nA: Oh, no, I was just imagining the vibe. But speaking of that, I didn't finish telling you about the car club. It's not just about buying stuff; they also organize events and road trips.\nB: That sounds fun! But back to the car, are you seriously going to use Sarah's car to go cruising for chicks?", + "total_duration": 49.830385487528346, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I bought it. I got a watch, too. The company that sells this car has a car club where members can", + "original_text": "I bought it. I got a watch, too. The company that sells this car has a car club where members can [interrupt] participate in exclusive events, get discounts on accessories, and even attend private track days to really push their vehicles to the limit.", + "start_time": 0, + "end_time": 15.069750566893424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "participate in exclusive events, get discounts on accessories, and even attend private track days to really push their vehicles to the limit." + }, + { + "speaker": "B", + "text": "Where you can buy lots of paraphernalia?", + "original_text": "Where you can buy lots of paraphernalia?", + "start_time": 6.617687074829932, + "end_time": 8.649433106575962, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_1_B.wav", + "silence_duration": 0.46598565639347045, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, and meet other drivers of the same car!", + "original_text": "Yeah, and meet other drivers of the same car!", + "start_time": 15.44754137481387, + "end_time": 18.442915524473733, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_2_A.wav", + "silence_duration": 0.37779080792044606, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Cool!", + "original_text": "Cool!", + "start_time": 18.779789762388226, + "end_time": 19.313848719304325, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_3_B.wav", + "silence_duration": 0.3368742379144917, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I know girls love this kind of car. Look, it's got a sunroof! Imagine... a cool, starry night, driving down the coast with the top open.", + "original_text": "I know girls love this kind of car. Look, it's got a sunroof! Imagine... a cool, starry night, driving down the coast with the top open.", + "start_time": 19.821908099361874, + "end_time": 28.29719154607389, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_4_A.wav", + "silence_duration": 0.5080593800575502, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry to cut in, but are you planning to take Sarah's car out tonight?", + "original_text": "Sorry to cut in, but are you planning to take Sarah's car out tonight?", + "start_time": 28.88615511891428, + "end_time": 32.5549079533814, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_5_B.wav", + "silence_duration": 0.5889635728403921, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, no, I was just imagining the vibe. But speaking of that, I didn't finish telling you about the car club. It's not just about buying stuff; they also organize events and road trips.", + "original_text": "Oh, no, I was just imagining the vibe. But speaking of that, I didn't finish telling you about the car club. It's not just about buying stuff; they also organize events and road trips.", + "start_time": 32.97328156824657, + "end_time": 44.18851966348467, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_6_A.wav", + "silence_duration": 0.41837361486516567, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds fun! But back to the car, are you seriously going to use Sarah's car to go cruising for chicks?", + "original_text": "That sounds fun! But back to the car, are you seriously going to use Sarah's car to go cruising for chicks?", + "start_time": 44.50142287192545, + "end_time": 49.830402463762184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--370/temp/line_7_B.wav", + "silence_duration": 0.3129032084407827, + "is_interrupted": false + } + ] + }, + "DialogSum--val--371": { + "original_text": "A: Excuse me, could I have a menu please? \nB: Here you are. \nA: I want to try the local specialty. Can you recommend me [interrupt] something that's authentic and really showcases the local flavors with a rich history behind it, perhaps a dish that's been passed down through generations of local chefs? \nB: Sorry to jump in, but are you looking for something more traditional or with a modern twist? \nA: Hmm, something traditional would be nice. But you were about to recommend something? \nB: Sure. I think filet steak will be a good choice. It's the best local food.", + "cleaned_text": "A: Excuse me, could I have a menu please? \nB: Here you are. \nA:I want to try the local specialty. Can you recommend me something that's authentic and really showcases the local flavors with a rich history behind it, perhaps a dish that's been passed down through generations of local chefs?\nB: Sorry to jump in, but are you looking for something more traditional or with a modern twist? \nA: Hmm, something traditional would be nice. But you were about to recommend something? \nB: Sure. I think filet steak will be a good choice. It's the best local food.", + "total_duration": 27.013650793650793, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, could I have a menu please?", + "original_text": "Excuse me, could I have a menu please?", + "start_time": 0, + "end_time": 2.2523356009070294, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here you are.", + "original_text": "Here you are.", + "start_time": 2.688420825958651, + "end_time": 3.4082394200629595, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/temp/line_1_B.wav", + "silence_duration": 0.4360852250516216, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I want to try the local specialty. Can you recommend me", + "original_text": "I want to try the local specialty. Can you recommend me [interrupt] something that's authentic and really showcases the local flavors with a rich history behind it, perhaps a dish that's been passed down through generations of local chefs?", + "start_time": 3.901673873967942, + "end_time": 17.60144711659833, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/temp/line_2_A.wav", + "silence_duration": 0.49343445390498253, + "is_interrupted": true, + "text_after_interrupt": "something that's authentic and really showcases the local flavors with a rich history behind it, perhaps a dish that's been passed down through generations of local chefs?" + }, + { + "speaker": "B", + "text": "Sorry to jump in, but are you looking for something more traditional or with a modern twist?", + "original_text": "Sorry to jump in, but are you looking for something more traditional or with a modern twist?", + "start_time": 7.431106980543905, + "end_time": 11.761628522494018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/temp/line_3_B.wav", + "silence_duration": 0.42738644581359087, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hmm, something traditional would be nice. But you were about to recommend something?", + "original_text": "Hmm, something traditional would be nice. But you were about to recommend something?", + "start_time": 18.04439481691901, + "end_time": 22.29364651759928, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/temp/line_4_A.wav", + "silence_duration": 0.4429477003206781, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. I think filet steak will be a good choice. It's the best local food.", + "original_text": "Sure. I think filet steak will be a good choice. It's the best local food.", + "start_time": 22.857280990218605, + "end_time": 27.013652872304775, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--371/temp/line_5_B.wav", + "silence_duration": 0.5636344726193228, + "is_interrupted": false + } + ] + }, + "DialogSum--val--372": { + "original_text": "A: Front Desk, may I help you? \nB: Yes, I'd like to move to another room. \nA: Is there anything uncomfortable in your [interrupt] current room that we can assist with? Perhaps the lighting, temperature, or any other amenities that aren't meeting your expectations? \nB: Yes, the air-conditioner in this room doesn't work. \nA: May I have your room number, sir? \nB: Wang Wei. Room 1212. \nA: OK. Mr. Wang, may I send a room attendant to check it for you [interrupt] and see if it can be fixed quickly or if we should proceed with arranging an alternative room for your comfort immediately? \nB: Actually, if it's going to take too long, I'd rather just move to another room directly. \nA: Understood. We'll check how long it might take first. If it's too long, we'll arrange another room for you right away. \n A: Mr. Wang, we are deeply sorry for the inconvenience. The maintenance might last for a long time, may I offer you another room? \nB: Yes. No problem.", + "cleaned_text": "A: Front Desk, may I help you? \nB: Yes, I'd like to move to another room. \nA:Is there anything uncomfortable in your current room that we can assist with? Perhaps the lighting, temperature, or any other amenities that aren't meeting your expectations?\nB: Yes, the air-conditioner in this room doesn't work. \nA: May I have your room number, sir? \nB: Wang Wei. Room 1212. \nA:OK. Mr. Wang, may I send a room attendant to check it for you and see if it can be fixed quickly or if we should proceed with arranging an alternative room for your comfort immediately?\nB: Actually, if it's going to take too long, I'd rather just move to another room directly. \nA: Understood. We'll check how long it might take first. If it's too long, we'll arrange another room for you right away. \n A: Mr. Wang, we are deeply sorry for the inconvenience. The maintenance might last for a long time, may I offer you another room? \nB: Yes. No problem.", + "total_duration": 47.36925170068027, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Front Desk, may I help you?", + "original_text": "Front Desk, may I help you?", + "start_time": 0, + "end_time": 1.6370068027210884, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'd like to move to another room.", + "original_text": "Yes, I'd like to move to another room.", + "start_time": 2.0965511132122034, + "end_time": 3.9077075757972377, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_1_B.wav", + "silence_duration": 0.4595443104911149, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is there anything uncomfortable in your", + "original_text": "Is there anything uncomfortable in your [interrupt] current room that we can assist with? Perhaps the lighting, temperature, or any other amenities that aren't meeting your expectations?", + "start_time": 4.3015159889890295, + "end_time": 13.693987644317827, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_2_A.wav", + "silence_duration": 0.39380841319179144, + "is_interrupted": true, + "text_after_interrupt": "current room that we can assist with? Perhaps the lighting, temperature, or any other amenities that aren't meeting your expectations?" + }, + { + "speaker": "B", + "text": "Yes, the air-conditioner in this room doesn't work.", + "original_text": "Yes, the air-conditioner in this room doesn't work.", + "start_time": 6.170722338195379, + "end_time": 8.643647508263406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_3_B.wav", + "silence_duration": 0.4883132115311747, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "May I have your room number, sir?", + "original_text": "May I have your room number, sir?", + "start_time": 14.202802535323046, + "end_time": 15.851419315368398, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_4_A.wav", + "silence_duration": 0.5088148910052183, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wang Wei. Room 1212.", + "original_text": "Wang Wei. Room 1212.", + "start_time": 16.281915144277313, + "end_time": 18.360101085320398, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_5_B.wav", + "silence_duration": 0.43049582890891447, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. Mr. Wang, may I send a room attendant to check it for you", + "original_text": "OK. Mr. Wang, may I send a room attendant to check it for you [interrupt] and see if it can be fixed quickly or if we should proceed with arranging an alternative room for your comfort immediately?", + "start_time": 18.724411554099905, + "end_time": 29.77710996679832, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_6_A.wav", + "silence_duration": 0.364310468779509, + "is_interrupted": true, + "text_after_interrupt": "and see if it can be fixed quickly or if we should proceed with arranging an alternative room for your comfort immediately?" + }, + { + "speaker": "B", + "text": "Actually, if it's going to take too long, I'd rather just move to another room directly.", + "original_text": "Actually, if it's going to take too long, I'd rather just move to another room directly.", + "start_time": 25.320520816473998, + "end_time": 29.430452789263114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_7_B.wav", + "silence_duration": 0.43614003143871705, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Understood. We'll check how long it might take first. If it's too long, we'll arrange another room for you right away.", + "original_text": "Understood. We'll check how long it might take first. If it's too long, we'll arrange another room for you right away.", + "start_time": 30.294212476806678, + "end_time": 37.42273855390418, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_8_A.wav", + "silence_duration": 0.5171025100083567, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Mr. Wang, we are deeply sorry for the inconvenience. The maintenance might last for a long time, may I offer you another room?", + "original_text": "Mr. Wang, we are deeply sorry for the inconvenience. The maintenance might last for a long time, may I offer you another room?", + "start_time": 37.82574630470897, + "end_time": 45.825020681126205, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_9_A.wav", + "silence_duration": 0.40300775080479007, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. No problem.", + "original_text": "Yes. No problem.", + "start_time": 46.25473197890739, + "end_time": 47.36928980203664, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--372/temp/line_10_B.wav", + "silence_duration": 0.4297112977811855, + "is_interrupted": false + } + ] + }, + "DialogSum--val--373": { + "original_text": "A: How many foreign languages can you speak? \nB: Only English. \nA: What do you think of your English? \nB: I have passed CET - 6 and I am proficient in reading and translating foreign materials. I have rich translating experience because I used to be an English [interrupt] translator for a multinational company where I handled complex technical documents and business contracts on a daily basis. \nA: Sorry to cut in, but when you say translating experience, did you work with any specific industries or types of documents? \nB: Yes, I mainly worked with technical manuals and business contracts. But I haven't mentioned that I used to be an English translator for a multinational company, which gave me exposure to a variety of document types. \nA: Oh, I see. So, you were an English translator. Can you speak English fluently? \nB: I have received oral English training and I can communicate with others fluently. \nA: Did you take TOEFL or GRE? \nB: Yes, I did. I got 600 in TOEFL and 2,300 in GRE. \nA: When did you begin to learn English? \nB: I started to learn English when I was in primary school. \nA: Do you think your English is good enough to do office work? \nB: The amount of English I know enables me to do general desk work. I believe the amount of English I know is sufficient to work in a South Korean firm, especially since I'm willing to improve my language skills further through additional training and practice.", + "cleaned_text": "A: How many foreign languages can you speak? \nB: Only English. \nA: What do you think of your English? \nB:I have passed CET - 6 and I am proficient in reading and translating foreign materials. I have rich translating experience because I used to be an English translator for a multinational company where I handled complex technical documents and business contracts on a daily basis.\nA: Sorry to cut in, but when you say translating experience, did you work with any specific industries or types of documents? \nB: Yes, I mainly worked with technical manuals and business contracts. But I haven't mentioned that I used to be an English translator for a multinational company, which gave me exposure to a variety of document types. \nA: Oh, I see. So, you were an English translator. Can you speak English fluently? \nB: I have received oral English training and I can communicate with others fluently. \nA: Did you take TOEFL or GRE? \nB: Yes, I did. I got 600 in TOEFL and 2,300 in GRE. \nA: When did you begin to learn English? \nB: I started to learn English when I was in primary school. \nA: Do you think your English is good enough to do office work? \nB: The amount of English I know enables me to do general desk work. I believe the amount of English I know is sufficient to work in a South Korean firm, especially since I'm willing to improve my language skills further through additional training and practice.", + "total_duration": 73.77573696145124, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How many foreign languages can you speak?", + "original_text": "How many foreign languages can you speak?", + "start_time": 0, + "end_time": 2.2291156462585033, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Only English.", + "original_text": "Only English.", + "start_time": 2.8065555851307225, + "end_time": 3.6192539978291354, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_1_B.wav", + "silence_duration": 0.5774399388722192, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What do you think of your English?", + "original_text": "What do you think of your English?", + "start_time": 4.020646571688341, + "end_time": 5.7737531476520605, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_2_A.wav", + "silence_duration": 0.4013925738592055, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have passed CET - 6 and I am proficient in reading and translating foreign materials. I have rich translating experience because I used to be an English", + "original_text": "I have passed CET - 6 and I am proficient in reading and translating foreign materials. I have rich translating experience because I used to be an English [interrupt] translator for a multinational company where I handled complex technical documents and business contracts on a daily basis.", + "start_time": 6.285374477362946, + "end_time": 21.958843865118048, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_3_B.wav", + "silence_duration": 0.5116213297108855, + "is_interrupted": true, + "text_after_interrupt": "translator for a multinational company where I handled complex technical documents and business contracts on a daily basis." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but when you say translating experience, did you work with any specific industries or types of documents?", + "original_text": "Sorry to cut in, but when you say translating experience, did you work with any specific industries or types of documents?", + "start_time": 14.714218014777913, + "end_time": 23.14306155219288, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_4_A.wav", + "silence_duration": 0.3996638474843849, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I mainly worked with technical manuals and business contracts. But I haven't mentioned that I used to be an English translator for a multinational company, which gave me exposure to a variety of document types.", + "original_text": "Yes, I mainly worked with technical manuals and business contracts. But I haven't mentioned that I used to be an English translator for a multinational company, which gave me exposure to a variety of document types.", + "start_time": 23.54878760008222, + "end_time": 34.183526829107166, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_5_B.wav", + "silence_duration": 0.40572604788934086, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. So, you were an English translator. Can you speak English fluently?", + "original_text": "Oh, I see. So, you were an English translator. Can you speak English fluently?", + "start_time": 34.72057614991919, + "end_time": 40.45590494810513, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_6_A.wav", + "silence_duration": 0.5370493208120237, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have received oral English training and I can communicate with others fluently.", + "original_text": "I have received oral English training and I can communicate with others fluently.", + "start_time": 40.81861526432963, + "end_time": 44.87049735049743, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_7_B.wav", + "silence_duration": 0.36271031622450217, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Did you take TOEFL or GRE?", + "original_text": "Did you take TOEFL or GRE?", + "start_time": 45.26837640027541, + "end_time": 47.04470293088765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_8_A.wav", + "silence_duration": 0.3978790497779742, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I did. I got 600 in TOEFL and 2,300 in GRE.", + "original_text": "Yes, I did. I got 600 in TOEFL and 2,300 in GRE.", + "start_time": 47.627856086594164, + "end_time": 52.03964746981412, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_9_B.wav", + "silence_duration": 0.583153155706514, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "When did you begin to learn English?", + "original_text": "When did you begin to learn English?", + "start_time": 52.55532461299357, + "end_time": 54.56385069009108, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_10_A.wav", + "silence_duration": 0.5156771431794512, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I started to learn English when I was in primary school.", + "original_text": "I started to learn English when I was in primary school.", + "start_time": 55.00942374344713, + "end_time": 57.80742827859452, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_11_B.wav", + "silence_duration": 0.44557305335605124, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you think your English is good enough to do office work?", + "original_text": "Do you think your English is good enough to do office work?", + "start_time": 58.180396164299815, + "end_time": 61.05967054071705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_12_A.wav", + "silence_duration": 0.3729678857052917, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The amount of English I know enables me to do general desk work. I believe the amount of English I know is sufficient to work in a South Korean firm, especially since I'm willing to improve my language skills further through additional training and practice.", + "original_text": "The amount of English I know enables me to do general desk work. I believe the amount of English I know is sufficient to work in a South Korean firm, especially since I'm willing to improve my language skills further through additional training and practice.", + "start_time": 61.42272434774055, + "end_time": 73.77574022075642, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--373/temp/line_13_B.wav", + "silence_duration": 0.3630538070234979, + "is_interrupted": false + } + ] + }, + "DialogSum--val--374": { + "original_text": "A: How much will our order from your factory be?\nB: I'll be happy to get back to you with an estimate in the next few days.\nA: I'm afraid I can't wait that long. Can your office at least provide me with a ballpark figure?\nB: Well, I would need an idea of how large your order would be. About how many units would you [interrupt] be looking to purchase in total, and would you be interested in any additional services like customization or expedited shipping that might affect the final pricing?\nA: Just give me an estimated figure for an order of 100 units.\nB: Please give me a few minutes to calculate... Our asking price should be about $100 per unit with an order of 100. Is that price acceptable to you?\nA: Your estimate seems a little high to me; we're willing to pay $80 per unit.\nB: With an order of only 100 units, it'll be difficult to work within that kind of budget. Maybe if you were ordering 500 units or more [interrupt] we could offer a more competitive price that would include bulk discounts and potentially free shipping depending on your location and specific requirements.\nA: I understand that larger orders might get a better rate, but what if we consider a long-term partnership? Could that help us negotiate the price for 100 units?", + "cleaned_text": "A: How much will our order from your factory be?\nB: I'll be happy to get back to you with an estimate in the next few days.\nA: I'm afraid I can't wait that long. Can your office at least provide me with a ballpark figure?\nB:Well, I would need an idea of how large your order would be. About how many units would you be looking to purchase in total, and would you be interested in any additional services like customization or expedited shipping that might affect the final pricing?\nA: Just give me an estimated figure for an order of 100 units.\nB: Please give me a few minutes to calculate... Our asking price should be about $100 per unit with an order of 100. Is that price acceptable to you?\nA: Your estimate seems a little high to me; we're willing to pay $80 per unit.\nB:With an order of only 100 units, it'll be difficult to work within that kind of budget. Maybe if you were ordering 500 units or more we could offer a more competitive price that would include bulk discounts and potentially free shipping depending on your location and specific requirements.\nA: I understand that larger orders might get a better rate, but what if we consider a long-term partnership? Could that help us negotiate the price for 100 units?", + "total_duration": 60.71333333333333, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How much will our order from your factory be?", + "original_text": "How much will our order from your factory be?", + "start_time": 0, + "end_time": 2.5774149659863945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll be happy to get back to you with an estimate in the next few days.", + "original_text": "I'll be happy to get back to you with an estimate in the next few days.", + "start_time": 3.0530477950007873, + "end_time": 6.071641899309178, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_1_B.wav", + "silence_duration": 0.47563282901439285, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm afraid I can't wait that long. Can your office at least provide me with a ballpark figure?", + "original_text": "I'm afraid I can't wait that long. Can your office at least provide me with a ballpark figure?", + "start_time": 6.450442032623848, + "end_time": 11.930351329676004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_2_A.wav", + "silence_duration": 0.3788001333146704, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I would need an idea of how large your order would be. About how many units would you", + "original_text": "Well, I would need an idea of how large your order would be. About how many units would you [interrupt] be looking to purchase in total, and would you be interested in any additional services like customization or expedited shipping that might affect the final pricing?", + "start_time": 12.341747486375159, + "end_time": 25.03145270179466, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_3_B.wav", + "silence_duration": 0.4113961566991552, + "is_interrupted": true, + "text_after_interrupt": "be looking to purchase in total, and would you be interested in any additional services like customization or expedited shipping that might affect the final pricing?" + }, + { + "speaker": "A", + "text": "Just give me an estimated figure for an order of 100 units.", + "original_text": "Just give me an estimated figure for an order of 100 units.", + "start_time": 17.473357463699422, + "end_time": 21.432359731273117, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_4_A.wav", + "silence_duration": 0.3103503484747993, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Please give me a few minutes to calculate... Our asking price should be about $100 per unit with an order of 100. Is that price acceptable to you?", + "original_text": "Please give me a few minutes to calculate... Our asking price should be about $100 per unit with an order of 100. Is that price acceptable to you?", + "start_time": 25.393681680945576, + "end_time": 33.485835875956916, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_5_B.wav", + "silence_duration": 0.3622289791509165, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Your estimate seems a little high to me; we're willing to pay $80 per unit.", + "original_text": "Your estimate seems a little high to me; we're willing to pay $80 per unit.", + "start_time": 33.86541770676098, + "end_time": 38.880927910842615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_6_A.wav", + "silence_duration": 0.3795818308040647, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "With an order of only 100 units, it'll be difficult to work within that kind of budget. Maybe if you were ordering 500 units or more", + "original_text": "With an order of only 100 units, it'll be difficult to work within that kind of budget. Maybe if you were ordering 500 units or more [interrupt] we could offer a more competitive price that would include bulk discounts and potentially free shipping depending on your location and specific requirements.", + "start_time": 39.22761153583533, + "end_time": 54.73854124105075, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_7_B.wav", + "silence_duration": 0.3466836249927133, + "is_interrupted": true, + "text_after_interrupt": "we could offer a more competitive price that would include bulk discounts and potentially free shipping depending on your location and specific requirements." + }, + { + "speaker": "A", + "text": "I understand that larger orders might get a better rate, but what if we consider a long-term partnership? Could that help us negotiate the price for 100 units?", + "original_text": "I understand that larger orders might get a better rate, but what if we consider a long-term partnership? Could that help us negotiate the price for 100 units?", + "start_time": 51.344102159223596, + "end_time": 60.71335385990387, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--374/temp/line_8_A.wav", + "silence_duration": 0.5996414806183261, + "is_interrupted": false + } + ] + }, + "DialogSum--val--375": { + "original_text": "A: Hello, is this house keeper? \nB: Yes, Madam, may I help you? \nA: This is room 117, and we have just checked in. \nB: Yes? \nA: Our room hasn't been cleaned up yet. So would you send one of your house keepers to clean up our [interrupt] room as soon as possible? We have some luggage to unpack and would prefer to do so in a clean environment, especially since we're traveling with young children who need a hygienic space. \nB: Oh, I'm really sorry about that! We'll come right away. Could I confirm your room number and your name, please? \nA: Our room number is 117 and my name is Terry Chen. \nB: Thank you, Ms. Chen. By the way, you mentioned your room hasn't been cleaned up yet—was there any specific issue you noticed, like the bathroom or the [interrupt] bed sheets that need to be changed? I want to make sure our team addresses all your concerns properly and leaves your room in perfect condition for your stay. \nA: Mainly the bathroom, yes. The rest of the room seems fine, but the bathroom definitely needs attention. \nB: Understood. We'll make sure to take care of it. Could you please hang up and wait?", + "cleaned_text": "A: Hello, is this house keeper? \nB: Yes, Madam, may I help you? \nA: This is room 117, and we have just checked in. \nB: Yes? \nA:Our room hasn't been cleaned up yet. So would you send one of your house keepers to clean up our room as soon as possible? We have some luggage to unpack and would prefer to do so in a clean environment, especially since we're traveling with young children who need a hygienic space.\nB: Oh, I'm really sorry about that! We'll come right away. Could I confirm your room number and your name, please? \nA: Our room number is 117 and my name is Terry Chen. \nB:Thank you, Ms. Chen. By the way, you mentioned your room hasn't been cleaned up yet—was there any specific issue you noticed, like the bathroom or the bed sheets that need to be changed? I want to make sure our team addresses all your concerns properly and leaves your room in perfect condition for your stay.\nA: Mainly the bathroom, yes. The rest of the room seems fine, but the bathroom definitely needs attention. \nB: Understood. We'll make sure to take care of it. Could you please hang up and wait?", + "total_duration": 56.745170068027214, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, is this house keeper?", + "original_text": "Hello, is this house keeper?", + "start_time": 0, + "end_time": 2.089795918367347, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, Madam, may I help you?", + "original_text": "Yes, Madam, may I help you?", + "start_time": 2.563983026319238, + "end_time": 4.235819761013115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_1_B.wav", + "silence_duration": 0.47418710795189045, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "This is room 117, and we have just checked in.", + "original_text": "This is room 117, and we have just checked in.", + "start_time": 4.750369405323792, + "end_time": 8.767421559518803, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_2_A.wav", + "silence_duration": 0.5145496443106776, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes?", + "original_text": "Yes?", + "start_time": 9.366749762557319, + "end_time": 9.98207856074326, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_3_B.wav", + "silence_duration": 0.5993282030385165, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Our room hasn't been cleaned up yet. So would you send one of your house keepers to clean up our", + "original_text": "Our room hasn't been cleaned up yet. So would you send one of your house keepers to clean up our [interrupt] room as soon as possible? We have some luggage to unpack and would prefer to do so in a clean environment, especially since we're traveling with young children who need a hygienic space.", + "start_time": 10.29508213017415, + "end_time": 26.131091200468934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_4_A.wav", + "silence_duration": 0.31300356943089014, + "is_interrupted": true, + "text_after_interrupt": "room as soon as possible? We have some luggage to unpack and would prefer to do so in a clean environment, especially since we're traveling with young children who need a hygienic space." + }, + { + "speaker": "B", + "text": "Oh, I'm really sorry about that! We'll come right away. Could I confirm your room number and your name, please?", + "original_text": "Oh, I'm really sorry about that! We'll come right away. Could I confirm your room number and your name, please?", + "start_time": 15.624061722010884, + "end_time": 21.312950610899772, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_5_B.wav", + "silence_duration": 0.4676961631917469, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Our room number is 117 and my name is Terry Chen.", + "original_text": "Our room number is 117 and my name is Terry Chen.", + "start_time": 26.595066244404997, + "end_time": 31.19261726481316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_6_A.wav", + "silence_duration": 0.4639750439360639, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you, Ms. Chen. By the way, you mentioned your room hasn't been cleaned up yet—was there any specific issue you noticed, like the bathroom or the", + "original_text": "Thank you, Ms. Chen. By the way, you mentioned your room hasn't been cleaned up yet—was there any specific issue you noticed, like the bathroom or the [interrupt] bed sheets that need to be changed? I want to make sure our team addresses all your concerns properly and leaves your room in perfect condition for your stay.", + "start_time": 31.713934026757222, + "end_time": 46.86495443492049, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_7_B.wav", + "silence_duration": 0.5213167619440627, + "is_interrupted": true, + "text_after_interrupt": "bed sheets that need to be changed? I want to make sure our team addresses all your concerns properly and leaves your room in perfect condition for your stay." + }, + { + "speaker": "A", + "text": "Mainly the bathroom, yes. The rest of the room seems fine, but the bathroom definitely needs attention.", + "original_text": "Mainly the bathroom, yes. The rest of the room seems fine, but the bathroom definitely needs attention.", + "start_time": 45.14705004964708, + "end_time": 52.21752624012327, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_8_A.wav", + "silence_duration": 0.4675241202946255, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Understood. We'll make sure to take care of it. Could you please hang up and wait?", + "original_text": "Understood. We'll make sure to take care of it. Could you please hang up and wait?", + "start_time": 52.72816285745415, + "end_time": 56.745215011649165, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--375/temp/line_9_B.wav", + "silence_duration": 0.510636617330885, + "is_interrupted": false + } + ] + }, + "DialogSum--val--377": { + "original_text": "A: Do you have any shoes like these? \nB: What size? \nA: Size five. \nB: What colour? \nA: Black. \nB: I'm sorry. We don't have any. \nA: But my sister bought this pair last month. \nB: Did she buy them [interrupt] here at our downtown location, or perhaps at one of our branch stores in the neighboring cities? I could check our inventory system if you'd like. \nA: Oh, no, she bought them in the U.S. But if you had them before, maybe you can get a pair for me? \nB: We had some shoes like those a month ago, but we don't have any now. \nA: Can you get a pair for me please? \nB: I'm afraid that I can't. They were in fashion last year and the year before last. But they're not in fashion this year. These shoes are in fashion now. \nA: Wait, you were asking if my sister bought them here, right? No, she didn't. But are there any other stores that might still have them?", + "cleaned_text": "A: Do you have any shoes like these? \nB: What size? \nA: Size five. \nB: What colour? \nA: Black. \nB: I'm sorry. We don't have any. \nA: But my sister bought this pair last month. \nB:Did she buy them here at our downtown location, or perhaps at one of our branch stores in the neighboring cities? I could check our inventory system if you'd like.\nA: Oh, no, she bought them in the U.S. But if you had them before, maybe you can get a pair for me? \nB: We had some shoes like those a month ago, but we don't have any now. \nA: Can you get a pair for me please? \nB: I'm afraid that I can't. They were in fashion last year and the year before last. But they're not in fashion this year. These shoes are in fashion now. \nA: Wait, you were asking if my sister bought them here, right? No, she didn't. But are there any other stores that might still have them?", + "total_duration": 42.636916099773245, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you have any shoes like these?", + "original_text": "Do you have any shoes like these?", + "start_time": 0, + "end_time": 1.8924263038548752, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What size?", + "original_text": "What size?", + "start_time": 2.391574329507805, + "end_time": 3.262322628827533, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_1_B.wav", + "silence_duration": 0.4991480256529297, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Size five.", + "original_text": "Size five.", + "start_time": 3.67475530825207, + "end_time": 4.789313131381322, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_2_A.wav", + "silence_duration": 0.41243267942453704, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What colour?", + "original_text": "What colour?", + "start_time": 5.14229887426815, + "end_time": 5.920167354993773, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_3_B.wav", + "silence_duration": 0.35298574288682816, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Black.", + "original_text": "Black.", + "start_time": 6.3189809357281685, + "end_time": 7.015579575183951, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_4_A.wav", + "silence_duration": 0.39881358073439516, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm sorry. We don't have any.", + "original_text": "I'm sorry. We don't have any.", + "start_time": 7.430515509793465, + "end_time": 8.963032516596186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_5_B.wav", + "silence_duration": 0.41493593460951417, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But my sister bought this pair last month.", + "original_text": "But my sister bought this pair last month.", + "start_time": 9.420270792515906, + "end_time": 11.73065628004425, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_6_A.wav", + "silence_duration": 0.45723827591971855, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Did she buy them", + "original_text": "Did she buy them [interrupt] here at our downtown location, or perhaps at one of our branch stores in the neighboring cities? I could check our inventory system if you'd like.", + "start_time": 12.180062538891702, + "end_time": 20.109677051363356, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_7_B.wav", + "silence_duration": 0.44940625884745145, + "is_interrupted": true, + "text_after_interrupt": "here at our downtown location, or perhaps at one of our branch stores in the neighboring cities? I could check our inventory system if you'd like." + }, + { + "speaker": "A", + "text": "Oh, no, she bought them in the U.S. But if you had them before, maybe you can get a pair for me?", + "original_text": "Oh, no, she bought them in the U.S. But if you had them before, maybe you can get a pair for me?", + "start_time": 12.96954099694159, + "end_time": 18.461060271318004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_8_A.wav", + "silence_duration": 0.5855936325484323, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We had some shoes like those a month ago, but we don't have any now.", + "original_text": "We had some shoes like those a month ago, but we don't have any now.", + "start_time": 20.643293471427064, + "end_time": 23.719937462356768, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_9_B.wav", + "silence_duration": 0.533616420063707, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Can you get a pair for me please?", + "original_text": "Can you get a pair for me please?", + "start_time": 24.083428462119866, + "end_time": 25.8945849247049, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_10_A.wav", + "silence_duration": 0.36349099976309684, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm afraid that I can't. They were in fashion last year and the year before last. But they're not in fashion this year. These shoes are in fashion now.", + "original_text": "I'm afraid that I can't. They were in fashion last year and the year before last. But they're not in fashion this year. These shoes are in fashion now.", + "start_time": 26.326839210230084, + "end_time": 34.38416347326863, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_11_B.wav", + "silence_duration": 0.43225428552518286, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, you were asking if my sister bought them here, right? No, she didn't. But are there any other stores that might still have them?", + "original_text": "Wait, you were asking if my sister bought them here, right? No, she didn't. But are there any other stores that might still have them?", + "start_time": 34.939509448433235, + "end_time": 42.63692441441963, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--377/temp/line_12_A.wav", + "silence_duration": 0.555345975164607, + "is_interrupted": false + } + ] + }, + "DialogSum--val--378": { + "original_text": "A: That is the most boring, typical gift in the world! \nB: I know. But this year I want to get him an interesting tie. Like this one. \nA: That's not exactly a conversation piece. It's so plain. \nB: It's perfect! It's a Dilbert [interrupt] tie, which is based on the comic strip character and actually has several hidden features that make it truly unique and interactive, just like the comics themselves. \nA: Wait, did you say Dilbert? You mean the comic strip character? \nB: Yes! And there's more. The diagonal black and red stripes are really conservative though. . . \nA: But you still think it's interesting just because it's Dilbert? \nB: But watch this. . . it bends upwards, just like Dilbert's tie. There's a wire inside. \nA: Oh, I see! So, what were you saying about the stripes earlier?", + "cleaned_text": "A: That is the most boring, typical gift in the world! \nB: I know. But this year I want to get him an interesting tie. Like this one. \nA: That's not exactly a conversation piece. It's so plain. \nB:It's perfect! It's a Dilbert tie, which is based on the comic strip character and actually has several hidden features that make it truly unique and interactive, just like the comics themselves.\nA: Wait, did you say Dilbert? You mean the comic strip character? \nB: Yes! And there's more. The diagonal black and red stripes are really conservative though. . . \nA: But you still think it's interesting just because it's Dilbert? \nB: But watch this. . . it bends upwards, just like Dilbert's tie. There's a wire inside. \nA: Oh, I see! So, what were you saying about the stripes earlier?", + "total_duration": 40.037732426303855, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "That is the most boring, typical gift in the world!", + "original_text": "That is the most boring, typical gift in the world!", + "start_time": 0, + "end_time": 2.809614512471655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know. But this year I want to get him an interesting tie. Like this one.", + "original_text": "I know. But this year I want to get him an interesting tie. Like this one.", + "start_time": 3.2535650526318234, + "end_time": 6.887487955126154, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_1_B.wav", + "silence_duration": 0.44395054016016844, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's not exactly a conversation piece. It's so plain.", + "original_text": "That's not exactly a conversation piece. It's so plain.", + "start_time": 7.213247737875013, + "end_time": 10.905220526990659, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_2_A.wav", + "silence_duration": 0.32575978274885864, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's perfect! It's a Dilbert", + "original_text": "It's perfect! It's a Dilbert [interrupt] tie, which is based on the comic strip character and actually has several hidden features that make it truly unique and interactive, just like the comics themselves.", + "start_time": 11.308572286021484, + "end_time": 21.33959269418475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_3_B.wav", + "silence_duration": 0.4033517590308241, + "is_interrupted": true, + "text_after_interrupt": "tie, which is based on the comic strip character and actually has several hidden features that make it truly unique and interactive, just like the comics themselves." + }, + { + "speaker": "A", + "text": "Wait, did you say Dilbert? You mean the comic strip character?", + "original_text": "Wait, did you say Dilbert? You mean the comic strip character?", + "start_time": 12.922359134094046, + "end_time": 16.521452104615587, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_4_A.wav", + "silence_duration": 0.5847770090092357, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes! And there's more. The diagonal black and red stripes are really conservative though. . .", + "original_text": "Yes! And there's more. The diagonal black and red stripes are really conservative though. . .", + "start_time": 21.702204734352826, + "end_time": 26.83381471167709, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_5_B.wav", + "silence_duration": 0.3626120401680768, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But you still think it's interesting just because it's Dilbert?", + "original_text": "But you still think it's interesting just because it's Dilbert?", + "start_time": 27.243348469013995, + "end_time": 30.27355255064665, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_6_A.wav", + "silence_duration": 0.40953375733690656, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But watch this. . . it bends upwards, just like Dilbert's tie. There's a wire inside.", + "original_text": "But watch this. . . it bends upwards, just like Dilbert's tie. There's a wire inside.", + "start_time": 30.573568954968938, + "end_time": 35.32204968059252, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_7_B.wav", + "silence_duration": 0.3000164043222883, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see! So, what were you saying about the stripes earlier?", + "original_text": "Oh, I see! So, what were you saying about the stripes earlier?", + "start_time": 35.8813840769313, + "end_time": 40.03775595901747, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--378/temp/line_8_A.wav", + "silence_duration": 0.5593343963387745, + "is_interrupted": false + } + ] + }, + "DialogSum--val--379": { + "original_text": "A: Passport, please! \nB: Here you are. \nA: Are you Chinese? \nB: Yes, I am. \nA: Where in China are you [interrupt] planning to go after you leave here? I'm particularly interested because we've been seeing many tourists from different regions of China recently. \nB: Sorry to interrupt, but do you need any other documents besides my passport? \nA: No, just your passport is fine. So, where in China are you from? \nB: Fujisan Province. \nA: There are a lot of people from China visiting right now. \nB: It's not surprising. Our school year just ended, and a lot of Chinese are on vacation. \nA: How long do you plan to stay? \nB: About half a month. \nA: All right. Here's your passport. Welcome to Australia. \nB: Thank you.", + "cleaned_text": "A: Passport, please! \nB: Here you are. \nA: Are you Chinese? \nB: Yes, I am. \nA:Where in China are you planning to go after you leave here? I'm particularly interested because we've been seeing many tourists from different regions of China recently.\nB: Sorry to interrupt, but do you need any other documents besides my passport? \nA: No, just your passport is fine. So, where in China are you from? \nB: Fujisan Province. \nA: There are a lot of people from China visiting right now. \nB: It's not surprising. Our school year just ended, and a lot of Chinese are on vacation. \nA: How long do you plan to stay? \nB: About half a month. \nA: All right. Here's your passport. Welcome to Australia. \nB: Thank you.", + "total_duration": 38.357233560090705, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Passport, please!", + "original_text": "Passport, please!", + "start_time": 0, + "end_time": 1.3699773242630386, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here you are.", + "original_text": "Here you are.", + "start_time": 1.7398414345742967, + "end_time": 2.4596600286786052, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_1_B.wav", + "silence_duration": 0.3698641103112581, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Are you Chinese?", + "original_text": "Are you Chinese?", + "start_time": 2.821143227301591, + "end_time": 4.051800823673473, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_2_A.wav", + "silence_duration": 0.3614831986229858, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I am.", + "original_text": "Yes, I am.", + "start_time": 4.418876224933751, + "end_time": 5.231574637632163, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_3_B.wav", + "silence_duration": 0.36707540126027816, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Where in China are you", + "original_text": "Where in China are you [interrupt] planning to go after you leave here? I'm particularly interested because we've been seeing many tourists from different regions of China recently.", + "start_time": 5.630537109303826, + "end_time": 14.802419195471625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_4_A.wav", + "silence_duration": 0.3989624716716629, + "is_interrupted": true, + "text_after_interrupt": "planning to go after you leave here? I'm particularly interested because we've been seeing many tourists from different regions of China recently." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but do you need any other documents besides my passport?", + "original_text": "Sorry to interrupt, but do you need any other documents besides my passport?", + "start_time": 6.861194705675707, + "end_time": 10.994346633113349, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_5_B.wav", + "silence_duration": 0.383055645703088, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, just your passport is fine. So, where in China are you from?", + "original_text": "No, just your passport is fine. So, where in China are you from?", + "start_time": 15.383864782815044, + "end_time": 19.818876120683527, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_6_A.wav", + "silence_duration": 0.581445587343419, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fujisan Province.", + "original_text": "Fujisan Province.", + "start_time": 20.159844898129485, + "end_time": 21.494992290419734, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_7_B.wav", + "silence_duration": 0.34096877744595955, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There are a lot of people from China visiting right now.", + "original_text": "There are a lot of people from China visiting right now.", + "start_time": 22.060578233016308, + "end_time": 25.05595238267617, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_8_A.wav", + "silence_duration": 0.5655859425965739, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's not surprising. Our school year just ended, and a lot of Chinese are on vacation.", + "original_text": "It's not surprising. Our school year just ended, and a lot of Chinese are on vacation.", + "start_time": 25.36806328971573, + "end_time": 29.55926510377469, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_9_B.wav", + "silence_duration": 0.31211090703956107, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How long do you plan to stay?", + "original_text": "How long do you plan to stay?", + "start_time": 30.12606834984644, + "end_time": 31.797905084540318, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_10_A.wav", + "silence_duration": 0.566803246071754, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "About half a month.", + "original_text": "About half a month.", + "start_time": 32.337561051256685, + "end_time": 33.47533882903446, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_11_B.wav", + "silence_duration": 0.5396559667163692, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "All right. Here's your passport. Welcome to Australia.", + "original_text": "All right. Here's your passport. Welcome to Australia.", + "start_time": 33.92078606855125, + "end_time": 37.19479967399343, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_12_A.wav", + "silence_duration": 0.44544723951678733, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you.", + "original_text": "Thank you.", + "start_time": 37.76514521126154, + "end_time": 38.35725405479896, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--379/temp/line_13_B.wav", + "silence_duration": 0.5703455372681092, + "is_interrupted": false + } + ] + }, + "DialogSum--val--380": { + "original_text": "A: Can I help you? \nB: Yes. How much are these T-shirts? \nA: They are 12 dollars 50 cents each. \nB: I like the green one, but it isn't big enough. Have you got a larger size? \nA: Just a minute. No. I'm sorry. We haven't. What about [interrupt] checking out our other styles or colors that might fit better? We have a new collection arriving next week with more size options and trendy designs if you'd like to come back then. \nB: Oh, before I forget, do you have any other colors besides these? Maybe something like yellow or pink? \nA: We do have a pink one. I was actually about to suggest the black one, but since you prefer lighter colors, how about the pink? \nB: Yes, that's nice. I'll take it. \nA: That's 12 dollars 50 cents then please. \nB: Here you are.", + "cleaned_text": "A: Can I help you? \nB: Yes. How much are these T-shirts? \nA: They are 12 dollars 50 cents each. \nB: I like the green one, but it isn't big enough. Have you got a larger size? \nA:Just a minute. No. I'm sorry. We haven't. What about checking out our other styles or colors that might fit better? We have a new collection arriving next week with more size options and trendy designs if you'd like to come back then.\nB: Oh, before I forget, do you have any other colors besides these? Maybe something like yellow or pink? \nA: We do have a pink one. I was actually about to suggest the black one, but since you prefer lighter colors, how about the pink? \nB: Yes, that's nice. I'll take it. \nA: That's 12 dollars 50 cents then please. \nB: Here you are.", + "total_duration": 39.97854875283447, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can I help you?", + "original_text": "Can I help you?", + "start_time": 0, + "end_time": 0.9287981859410431, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. How much are these T-shirts?", + "original_text": "Yes. How much are these T-shirts?", + "start_time": 1.3406804902958234, + "end_time": 3.929705433606481, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_1_B.wav", + "silence_duration": 0.4118823043547803, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They are 12 dollars 50 cents each.", + "original_text": "They are 12 dollars 50 cents each.", + "start_time": 4.378055202817903, + "end_time": 6.711660644994773, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_2_A.wav", + "silence_duration": 0.4483497692114216, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like the green one, but it isn't big enough. Have you got a larger size?", + "original_text": "I like the green one, but it isn't big enough. Have you got a larger size?", + "start_time": 7.299470190329892, + "end_time": 11.03788288874259, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_3_B.wav", + "silence_duration": 0.5878095453351185, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Just a minute. No. I'm sorry. We haven't. What about", + "original_text": "Just a minute. No. I'm sorry. We haven't. What about [interrupt] checking out our other styles or colors that might fit better? We have a new collection arriving next week with more size options and trendy designs if you'd like to come back then.", + "start_time": 11.361228652612365, + "end_time": 25.09583182721554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_4_A.wav", + "silence_duration": 0.3233457638697741, + "is_interrupted": true, + "text_after_interrupt": "checking out our other styles or colors that might fit better? We have a new collection arriving next week with more size options and trendy designs if you'd like to come back then." + }, + { + "speaker": "B", + "text": "Oh, before I forget, do you have any other colors besides these? Maybe something like yellow or pink?", + "original_text": "Oh, before I forget, do you have any other colors besides these? Maybe something like yellow or pink?", + "start_time": 15.134471282997852, + "end_time": 20.25447128299785, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_5_B.wav", + "silence_duration": 0.4912516192391776, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We do have a pink one. I was actually about to suggest the black one, but since you prefer lighter colors, how about the pink?", + "original_text": "We do have a pink one. I was actually about to suggest the black one, but since you prefer lighter colors, how about the pink?", + "start_time": 25.642955495335997, + "end_time": 33.351980438646656, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_6_A.wav", + "silence_duration": 0.5471236681204572, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, that's nice. I'll take it.", + "original_text": "Yes, that's nice. I'll take it.", + "start_time": 33.74868704776464, + "end_time": 35.38569385048573, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_7_B.wav", + "silence_duration": 0.3967066091179866, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's 12 dollars 50 cents then please.", + "original_text": "That's 12 dollars 50 cents then please.", + "start_time": 35.929663472005565, + "end_time": 38.68122809785591, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_8_A.wav", + "silence_duration": 0.5439696215198327, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here you are.", + "original_text": "Here you are.", + "start_time": 39.20072420396673, + "end_time": 39.97859268469235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--380/temp/line_9_B.wav", + "silence_duration": 0.5194961061108215, + "is_interrupted": false + } + ] + }, + "DialogSum--val--381": { + "original_text": "A: May I help you? \nB: Yes, I want to buy some shoes to replace the ones I am [interrupt] wearing, which are pretty worn out and starting to hurt my feet after long walks, so I really need something more comfortable and durable. \nA: Sorry to cut in, but do you have a specific style in mind, or are you open to suggestions? \nB: I'm open to suggestions, but mainly I need something because the ones I am wearing are too old and shabby. \nA: I can see they are simply worn out. Would you like the same color? \nB: Yes. \nA: How about this light brown pair? \nB: Yes, I'll try them on. \nA: They certainly look charming. \nB: The trouble is they feel uncomfortable. \nA: Then try on another pair of the similar [interrupt] style that might offer a better fit with more cushioning and arch support, especially since you mentioned comfort is a priority for you. \nB: Oh, before you finish, do you have them in red? \nA: I was about to suggest trying another style, but yes, we do have them in red. Would you like to see those?", + "cleaned_text": "A: May I help you? \nB:Yes, I want to buy some shoes to replace the ones I am wearing, which are pretty worn out and starting to hurt my feet after long walks, so I really need something more comfortable and durable.\nA: Sorry to cut in, but do you have a specific style in mind, or are you open to suggestions? \nB: I'm open to suggestions, but mainly I need something because the ones I am wearing are too old and shabby. \nA: I can see they are simply worn out. Would you like the same color? \nB: Yes. \nA: How about this light brown pair? \nB: Yes, I'll try them on. \nA: They certainly look charming. \nB: The trouble is they feel uncomfortable. \nA:Then try on another pair of the similar style that might offer a better fit with more cushioning and arch support, especially since you mentioned comfort is a priority for you.\nB: Oh, before you finish, do you have them in red? \nA: I was about to suggest trying another style, but yes, we do have them in red. Would you like to see those?", + "total_duration": 48.759909297052154, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I help you?", + "original_text": "May I help you?", + "start_time": 0, + "end_time": 0.9520181405895691, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I want to buy some shoes to replace the ones I am", + "original_text": "Yes, I want to buy some shoes to replace the ones I am [interrupt] wearing, which are pretty worn out and starting to hurt my feet after long walks, so I really need something more comfortable and durable.", + "start_time": 1.2983520441543466, + "end_time": 10.21481462918836, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_1_B.wav", + "silence_duration": 0.3463339035647775, + "is_interrupted": true, + "text_after_interrupt": "wearing, which are pretty worn out and starting to hurt my feet after long walks, so I really need something more comfortable and durable." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but do you have a specific style in mind, or are you open to suggestions?", + "original_text": "Sorry to cut in, but do you have a specific style in mind, or are you open to suggestions?", + "start_time": 4.17762642057158, + "end_time": 10.528284016943463, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_2_A.wav", + "silence_duration": 0.3759652891826042, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm open to suggestions, but mainly I need something because the ones I am wearing are too old and shabby.", + "original_text": "I'm open to suggestions, but mainly I need something because the ones I am wearing are too old and shabby.", + "start_time": 10.979862711760957, + "end_time": 16.599091736704267, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_3_B.wav", + "silence_duration": 0.4515786948174936, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I can see they are simply worn out. Would you like the same color?", + "original_text": "I can see they are simply worn out. Would you like the same color?", + "start_time": 17.122761553657565, + "end_time": 21.27913343574373, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_4_A.wav", + "silence_duration": 0.5236698169532988, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes.", + "original_text": "Yes.", + "start_time": 21.741404174108872, + "end_time": 22.31029306299776, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_5_B.wav", + "silence_duration": 0.46227073836514165, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about this light brown pair?", + "original_text": "How about this light brown pair?", + "start_time": 22.63844516774529, + "end_time": 24.58892135822148, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_6_A.wav", + "silence_duration": 0.32815210474752743, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'll try them on.", + "original_text": "Yes, I'll try them on.", + "start_time": 25.04556598548685, + "end_time": 26.264613604534468, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_7_B.wav", + "silence_duration": 0.45664462726536925, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They certainly look charming.", + "original_text": "They certainly look charming.", + "start_time": 26.767301337264477, + "end_time": 28.299818344067198, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_8_A.wav", + "silence_duration": 0.5026877327300082, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The trouble is they feel uncomfortable.", + "original_text": "The trouble is they feel uncomfortable.", + "start_time": 28.703470244613786, + "end_time": 30.56106661649587, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_9_B.wav", + "silence_duration": 0.4036519005465896, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Then try on another pair of the similar", + "original_text": "Then try on another pair of the similar [interrupt] style that might offer a better fit with more cushioning and arch support, especially since you mentioned comfort is a priority for you.", + "start_time": 31.017195685092652, + "end_time": 41.257195685092654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_10_A.wav", + "silence_duration": 0.45612906859678193, + "is_interrupted": true, + "text_after_interrupt": "style that might offer a better fit with more cushioning and arch support, especially since you mentioned comfort is a priority for you." + }, + { + "speaker": "B", + "text": "Oh, before you finish, do you have them in red?", + "original_text": "Oh, before you finish, do you have them in red?", + "start_time": 39.37850967798929, + "end_time": 41.77016500678748, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_11_B.wav", + "silence_duration": 0.5149963626392174, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was about to suggest trying another style, but yes, we do have them in red. Would you like to see those?", + "original_text": "I was about to suggest trying another style, but yes, we do have them in red. Would you like to see those?", + "start_time": 42.22349614418234, + "end_time": 48.759913377742436, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--381/temp/line_12_A.wav", + "silence_duration": 0.4533311373948644, + "is_interrupted": false + } + ] + }, + "DialogSum--val--382": { + "original_text": "A: What I should remind you is that your boy is sometimes 25 minutes late for the [interrupt] class, and it's becoming a bit of a concern because consistent tardiness can negatively impact both his learning progress and classroom dynamics. \nB: Really? That's surprising. Could it be that there's some misunderstanding? He always tells me he usually arrives ten minutes early. \nA: I understand your concern, but I've noticed this pattern a few times. Maybe you could check with him directly to clarify. Also, I was going to mention that he might get punished this time if it continues [interrupt] with a warning or even a detention, depending on the school's policy regarding repeated violations of attendance rules and their impact on academic performance. \nB: Oh no, I didn't realize it was that serious. I'll definitely talk to him about it. But can you tell me more about what kind of punishment he might face?", + "cleaned_text": "A:What I should remind you is that your boy is sometimes 25 minutes late for the class, and it's becoming a bit of a concern because consistent tardiness can negatively impact both his learning progress and classroom dynamics.\nB: Really? That's surprising. Could it be that there's some misunderstanding? He always tells me he usually arrives ten minutes early. \nA:I understand your concern, but I've noticed this pattern a few times. Maybe you could check with him directly to clarify. Also, I was going to mention that he might get punished this time if it continues with a warning or even a detention, depending on the school's policy regarding repeated violations of attendance rules and their impact on academic performance.\nB: Oh no, I didn't realize it was that serious. I'll definitely talk to him about it. But can you tell me more about what kind of punishment he might face?", + "total_duration": 40.74126984126984, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--382/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--382/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--382/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What I should remind you is that your boy is sometimes 25 minutes late for the", + "original_text": "What I should remind you is that your boy is sometimes 25 minutes late for the [interrupt] class, and it's becoming a bit of a concern because consistent tardiness can negatively impact both his learning progress and classroom dynamics.", + "start_time": 0, + "end_time": 13.455963718820861, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--382/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "class, and it's becoming a bit of a concern because consistent tardiness can negatively impact both his learning progress and classroom dynamics." + }, + { + "speaker": "B", + "text": "Really? That's surprising. Could it be that there's some misunderstanding? He always tells me he usually arrives ten minutes early.", + "original_text": "Really? That's surprising. Could it be that there's some misunderstanding? He always tells me he usually arrives ten minutes early.", + "start_time": 4.748480725623582, + "end_time": 11.80734693877551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--382/temp/line_1_B.wav", + "silence_duration": 0.5294002887140385, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I understand your concern, but I've noticed this pattern a few times. Maybe you could check with him directly to clarify. Also, I was going to mention that he might get punished this time if it continues", + "original_text": "I understand your concern, but I've noticed this pattern a few times. Maybe you could check with him directly to clarify. Also, I was going to mention that he might get punished this time if it continues [interrupt] with a warning or even a detention, depending on the school's policy regarding repeated violations of attendance rules and their impact on academic performance.", + "start_time": 13.925955082972793, + "end_time": 34.80069431199774, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--382/temp/line_2_A.wav", + "silence_duration": 0.46999136415193243, + "is_interrupted": true, + "text_after_interrupt": "with a warning or even a detention, depending on the school's policy regarding repeated violations of attendance rules and their impact on academic performance." + }, + { + "speaker": "B", + "text": "Oh no, I didn't realize it was that serious. I'll definitely talk to him about it. But can you tell me more about what kind of punishment he might face?", + "original_text": "Oh no, I didn't realize it was that serious. I'll definitely talk to him about it. But can you tell me more about what kind of punishment he might face?", + "start_time": 33.14836826301616, + "end_time": 40.74129343308419, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--382/temp/line_3_B.wav", + "silence_duration": 0.5129853347090108, + "is_interrupted": false + } + ] + }, + "DialogSum--val--383": { + "original_text": "A: Good morning. What seems to be the problem? \nB: Good morning, Mrs. Brown. I have a cough and a fever and I feel very tired all the [interrupt] time, especially in the evenings when my symptoms seem to worsen significantly and I struggle to get proper rest. \nA: Sorry to interrupt, but when did these symptoms start? \nB: Three days now. \nA: Let me have a look. Open your mouth please. Wider please. Now say AHH. \nB: AHHH. \nA: Now take your shirt off please. Breathe in-Breathe out-OK, you can put your shirt back on now. \nB: What seems to be the problem? Do I suffer from bird flu or is there something wrong with my [interrupt] lungs? I've been really worried about it because my cousin had similar symptoms last month and was diagnosed with pneumonia. \nA: Oh, no. Don't be so nervous. You just have a bad cold. Do you work in an air-conditioned office? \nB: Yes, I do. But doctor, you didn't finish—what about my lungs? \nA: Oh, right. Your lungs sound fine. It's the air conditioning, you see. It's really not very good for your health. \nB: So what would you suggest, doctor?", + "cleaned_text": "A: Good morning. What seems to be the problem? \nB:Good morning, Mrs. Brown. I have a cough and a fever and I feel very tired all the time, especially in the evenings when my symptoms seem to worsen significantly and I struggle to get proper rest.\nA: Sorry to interrupt, but when did these symptoms start? \nB: Three days now. \nA: Let me have a look. Open your mouth please. Wider please. Now say AHH. \nB: AHHH. \nA: Now take your shirt off please. Breathe in-Breathe out-OK, you can put your shirt back on now. \nB:What seems to be the problem? Do I suffer from bird flu or is there something wrong with my lungs? I've been really worried about it because my cousin had similar symptoms last month and was diagnosed with pneumonia.\nA: Oh, no. Don't be so nervous. You just have a bad cold. Do you work in an air-conditioned office? \nB: Yes, I do. But doctor, you didn't finish—what about my lungs? \nA: Oh, right. Your lungs sound fine. It's the air conditioning, you see. It's really not very good for your health. \nB: So what would you suggest, doctor?", + "total_duration": 55.83179138321996, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good morning. What seems to be the problem?", + "original_text": "Good morning. What seems to be the problem?", + "start_time": 0, + "end_time": 2.36843537414966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good morning, Mrs. Brown. I have a cough and a fever and I feel very tired all the", + "original_text": "Good morning, Mrs. Brown. I have a cough and a fever and I feel very tired all the [interrupt] time, especially in the evenings when my symptoms seem to worsen significantly and I struggle to get proper rest.", + "start_time": 2.844607648177329, + "end_time": 13.038167738880276, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_1_B.wav", + "silence_duration": 0.4761722740276692, + "is_interrupted": true, + "text_after_interrupt": "time, especially in the evenings when my symptoms seem to worsen significantly and I struggle to get proper rest." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but when did these symptoms start?", + "original_text": "Sorry to interrupt, but when did these symptoms start?", + "start_time": 7.302838940694336, + "end_time": 10.692952319379144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_2_A.wav", + "silence_duration": 0.3488819971833203, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Three days now.", + "original_text": "Three days now.", + "start_time": 13.41303322583796, + "end_time": 14.411491275724583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_3_B.wav", + "silence_duration": 0.3748654869576847, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let me have a look. Open your mouth please. Wider please. Now say AHH.", + "original_text": "Let me have a look. Open your mouth please. Wider please. Now say AHH.", + "start_time": 14.832076138965089, + "end_time": 19.986906070937877, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_4_A.wav", + "silence_duration": 0.4205848632405059, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "AHHH.", + "original_text": "AHHH.", + "start_time": 20.479740602416616, + "end_time": 21.153119287223873, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_5_B.wav", + "silence_duration": 0.49283453147873746, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Now take your shirt off please. Breathe in-Breathe out-OK, you can put your shirt back on now.", + "original_text": "Now take your shirt off please. Breathe in-Breathe out-OK, you can put your shirt back on now.", + "start_time": 21.60145738869595, + "end_time": 27.592205688015675, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_6_A.wav", + "silence_duration": 0.44833810147207565, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What seems to be the problem? Do I suffer from bird flu or is there something wrong with my", + "original_text": "What seems to be the problem? Do I suffer from bird flu or is there something wrong with my [interrupt] lungs? I've been really worried about it because my cousin had similar symptoms last month and was diagnosed with pneumonia.", + "start_time": 27.92754361329539, + "end_time": 38.84092229810265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_7_B.wav", + "silence_duration": 0.3353379252797151, + "is_interrupted": true, + "text_after_interrupt": "lungs? I've been really worried about it because my cousin had similar symptoms last month and was diagnosed with pneumonia." + }, + { + "speaker": "A", + "text": "Oh, no. Don't be so nervous. You just have a bad cold. Do you work in an air-conditioned office?", + "original_text": "Oh, no. Don't be so nervous. You just have a bad cold. Do you work in an air-conditioned office?", + "start_time": 36.208905795621064, + "end_time": 42.42024366410179, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_8_A.wav", + "silence_duration": 0.4202611887365291, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I do. But doctor, you didn't finish—what about my lungs?", + "original_text": "Yes, I do. But doctor, you didn't finish—what about my lungs?", + "start_time": 42.80032883029734, + "end_time": 46.2368821182792, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_9_B.wav", + "silence_duration": 0.38008516619555044, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right. Your lungs sound fine. It's the air conditioning, you see. It's really not very good for your health.", + "original_text": "Oh, right. Your lungs sound fine. It's the air conditioning, you see. It's really not very good for your health.", + "start_time": 46.799032915081625, + "end_time": 53.45154992188435, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_10_A.wav", + "silence_duration": 0.562150796802426, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "So what would you suggest, doctor?", + "original_text": "So what would you suggest, doctor?", + "start_time": 53.974199722474964, + "end_time": 55.83179609435705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--383/temp/line_11_B.wav", + "silence_duration": 0.5226498005906128, + "is_interrupted": false + } + ] + }, + "DialogSum--val--384": { + "original_text": "A: Hi, David. Haven't seen you for ages. How are you getting along with your work? \nB: Hi, Susan. Not so well as expected. I've left my position. I can't bear the rudeness of my boss any longer. \nA: What are you going to do then? \nB: No idea. Anyway, I've got to think about it seriously. And [interrupt] maybe explore some new opportunities that align with my passions and skills, perhaps even considering a complete career change to something more fulfilling and less stressful. \nA: Sorry to interrupt, but have you considered taking some time off to clear your mind before making any decisions? \nB: I have thought about it, but I also need to figure out my next steps soon. And you? \nA: I've been very successful as a dancer. I like this kind of life. It is so exciting. \nB: You can't do it for ever. \nA: No, but I've decided to open a dance school once I've moved to the top. A lot of young dancers need better training, don't you think? \nB: That's a wonderful idea. But what were you saying about young dancers? \nA: Oh, I was just saying they need better training, and I think I can help with that through my school by [interrupt] providing comprehensive programs that focus not just on technique but also on artistic expression and career development for aspiring professional dancers.", + "cleaned_text": "A: Hi, David. Haven't seen you for ages. How are you getting along with your work? \nB: Hi, Susan. Not so well as expected. I've left my position. I can't bear the rudeness of my boss any longer. \nA: What are you going to do then? \nB:No idea. Anyway, I've got to think about it seriously. And maybe explore some new opportunities that align with my passions and skills, perhaps even considering a complete career change to something more fulfilling and less stressful.\nA: Sorry to interrupt, but have you considered taking some time off to clear your mind before making any decisions? \nB: I have thought about it, but I also need to figure out my next steps soon. And you? \nA: I've been very successful as a dancer. I like this kind of life. It is so exciting. \nB: You can't do it for ever. \nA: No, but I've decided to open a dance school once I've moved to the top. A lot of young dancers need better training, don't you think? \nB: That's a wonderful idea. But what were you saying about young dancers? \nA:Oh, I was just saying they need better training, and I think I can help with that through my school by providing comprehensive programs that focus not just on technique but also on artistic expression and career development for aspiring professional dancers.", + "total_duration": 67.42897959183674, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, David. Haven't seen you for ages. How are you getting along with your work?", + "original_text": "Hi, David. Haven't seen you for ages. How are you getting along with your work?", + "start_time": 0, + "end_time": 5.12, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hi, Susan. Not so well as expected. I've left my position. I can't bear the rudeness of my boss any longer.", + "original_text": "Hi, Susan. Not so well as expected. I've left my position. I can't bear the rudeness of my boss any longer.", + "start_time": 5.573487759580862, + "end_time": 11.773215650737324, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_1_B.wav", + "silence_duration": 0.4534877595808618, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What are you going to do then?", + "original_text": "What are you going to do then?", + "start_time": 12.185960875166138, + "end_time": 13.68364794999607, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_2_A.wav", + "silence_duration": 0.41274522442881434, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No idea. Anyway, I've got to think about it seriously. And", + "original_text": "No idea. Anyway, I've got to think about it seriously. And [interrupt] maybe explore some new opportunities that align with my passions and skills, perhaps even considering a complete career change to something more fulfilling and less stressful.", + "start_time": 14.206498728716646, + "end_time": 26.664004397650885, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_3_B.wav", + "silence_duration": 0.522850778720576, + "is_interrupted": true, + "text_after_interrupt": "maybe explore some new opportunities that align with my passions and skills, perhaps even considering a complete career change to something more fulfilling and less stressful." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but have you considered taking some time off to clear your mind before making any decisions?", + "original_text": "Sorry to interrupt, but have you considered taking some time off to clear your mind before making any decisions?", + "start_time": 18.420920497424127, + "end_time": 24.980557685632746, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_4_A.wav", + "silence_duration": 0.33531471238076294, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have thought about it, but I also need to figure out my next steps soon. And you?", + "original_text": "I have thought about it, but I also need to figure out my next steps soon. And you?", + "start_time": 27.01724473263131, + "end_time": 31.092346773447634, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_5_B.wav", + "silence_duration": 0.3532403349804233, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I've been very successful as a dancer. I like this kind of life. It is so exciting.", + "original_text": "I've been very successful as a dancer. I like this kind of life. It is so exciting.", + "start_time": 31.55419260611034, + "end_time": 37.3475712909176, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_6_A.wav", + "silence_duration": 0.4618458326627068, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You can't do it for ever.", + "original_text": "You can't do it for ever.", + "start_time": 37.938253208302726, + "end_time": 39.33145048721429, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_7_B.wav", + "silence_duration": 0.5906819173851228, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, but I've decided to open a dance school once I've moved to the top. A lot of young dancers need better training, don't you think?", + "original_text": "No, but I've decided to open a dance school once I've moved to the top. A lot of young dancers need better training, don't you think?", + "start_time": 39.86986677405427, + "end_time": 47.323472216231146, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_8_A.wav", + "silence_duration": 0.5384162868399851, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a wonderful idea. But what were you saying about young dancers?", + "original_text": "That's a wonderful idea. But what were you saying about young dancers?", + "start_time": 47.79756079529419, + "end_time": 51.25733403792457, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_9_B.wav", + "silence_duration": 0.47408857906304125, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was just saying they need better training, and I think I can help with that through my school by", + "original_text": "Oh, I was just saying they need better training, and I think I can help with that through my school by [interrupt] providing comprehensive programs that focus not just on technique but also on artistic expression and career development for aspiring professional dancers.", + "start_time": 51.69748162501924, + "end_time": 67.42900089939566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--384/temp/line_10_A.wav", + "silence_duration": 0.4401475870946736, + "is_interrupted": true, + "text_after_interrupt": "providing comprehensive programs that focus not just on technique but also on artistic expression and career development for aspiring professional dancers." + } + ] + }, + "DialogSum--val--385": { + "original_text": "A: How are you doing today? \nB: I'm doing great. What about you? \nA: I'm absolutely lovely, thank you. \nB: Everything's been good with you? \nA: I haven't been better. How about your [interrupt] weekend? Did you do anything fun like going out with friends or trying new restaurants in town? \nB: Sorry to jump in, but you mentioned you were lovely—anything special going on that's got you in such a good mood? \nA: Oh, nothing in particular, just enjoying the day. But you were saying you started school recently? \nB: Yes, I started school recently. \nA: Where are you going to school? \nB: I'm going to PCC. \nA: How do you like it so far? \nB: I like it so far. My classes are pretty good right now. \nA: That's great to hear. I wish you luck. \nB: Thanks a lot.", + "cleaned_text": "A: How are you doing today? \nB: I'm doing great. What about you? \nA: I'm absolutely lovely, thank you. \nB: Everything's been good with you? \nA:I haven't been better. How about your weekend? Did you do anything fun like going out with friends or trying new restaurants in town?\nB: Sorry to jump in, but you mentioned you were lovely—anything special going on that's got you in such a good mood? \nA: Oh, nothing in particular, just enjoying the day. But you were saying you started school recently? \nB: Yes, I started school recently. \nA: Where are you going to school? \nB: I'm going to PCC. \nA: How do you like it so far? \nB: I like it so far. My classes are pretty good right now. \nA: That's great to hear. I wish you luck. \nB: Thanks a lot.", + "total_duration": 37.402403628117916, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How are you doing today?", + "original_text": "How are you doing today?", + "start_time": 0, + "end_time": 1.509297052154195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm doing great. What about you?", + "original_text": "I'm doing great. What about you?", + "start_time": 1.8928689105216208, + "end_time": 3.4834358039456568, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_1_B.wav", + "silence_duration": 0.38357185836742563, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm absolutely lovely, thank you.", + "original_text": "I'm absolutely lovely, thank you.", + "start_time": 3.9326854946716687, + "end_time": 6.243070982200013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_2_A.wav", + "silence_duration": 0.4492496907260118, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Everything's been good with you?", + "original_text": "Everything's been good with you?", + "start_time": 6.669969951296258, + "end_time": 8.039947275559296, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_3_B.wav", + "silence_duration": 0.4268989690962446, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I haven't been better. How about your", + "original_text": "I haven't been better. How about your [interrupt] weekend? Did you do anything fun like going out with friends or trying new restaurants in town?", + "start_time": 8.544098679567956, + "end_time": 16.032534053717615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_4_A.wav", + "silence_duration": 0.5041514040086601, + "is_interrupted": true, + "text_after_interrupt": "weekend? Did you do anything fun like going out with friends or trying new restaurants in town?" + }, + { + "speaker": "B", + "text": "Sorry to jump in, but you mentioned you were lovely—anything special going on that's got you in such a good mood?", + "original_text": "Sorry to jump in, but you mentioned you were lovely—anything special going on that's got you in such a good mood?", + "start_time": 11.017023849635983, + "end_time": 16.55498303330945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_5_B.wav", + "silence_duration": 0.3115457569514048, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, nothing in particular, just enjoying the day. But you were saying you started school recently?", + "original_text": "Oh, nothing in particular, just enjoying the day. But you were saying you started school recently?", + "start_time": 17.1508860794843, + "end_time": 22.630795376536454, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_6_A.wav", + "silence_duration": 0.5959030461748503, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I started school recently.", + "original_text": "Yes, I started school recently.", + "start_time": 22.970116412143216, + "end_time": 24.920592602619408, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_7_B.wav", + "silence_duration": 0.3393210356067617, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Where are you going to school?", + "original_text": "Where are you going to school?", + "start_time": 25.25879023732549, + "end_time": 26.849357130749524, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_8_A.wav", + "silence_duration": 0.33819763470608116, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm going to PCC.", + "original_text": "I'm going to PCC.", + "start_time": 27.253764794226214, + "end_time": 28.368322617355467, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_9_B.wav", + "silence_duration": 0.4044076634766879, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How do you like it so far?", + "original_text": "How do you like it so far?", + "start_time": 28.709184042373405, + "end_time": 30.206871117203338, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_10_A.wav", + "silence_duration": 0.3408614250179368, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like it so far. My classes are pretty good right now.", + "original_text": "I like it so far. My classes are pretty good right now.", + "start_time": 30.73903957639505, + "end_time": 33.68797381675786, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_11_B.wav", + "silence_duration": 0.5321684591917109, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's great to hear. I wish you luck.", + "original_text": "That's great to hear. I wish you luck.", + "start_time": 34.09599464902748, + "end_time": 36.39477015923156, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_12_A.wav", + "silence_duration": 0.4080208322696184, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks a lot.", + "original_text": "Thanks a lot.", + "start_time": 36.70582400609827, + "end_time": 37.40242264555405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--385/temp/line_13_B.wav", + "silence_duration": 0.3110538468667045, + "is_interrupted": false + } + ] + }, + "DialogSum--val--386": { + "original_text": "A: For you, I would recommend this one here. \nB: The compact? Why do you think that one is better than the others? \nA: This automobile is just right for your needs because not only is it compact for ease in city driving, but also, it has many safety features. I know that as a parent, you are concerned about safety in driving your kids to and from [interrupt] school or other activities, especially with its advanced lane-keeping assist system and automatic emergency braking that activates when potential collisions are detected. \nB: Sorry to jump in, but safety is definitely my top priority. What kind of safety features are we talking about? \nA: This model features anti-lock brakes, airbags on both driver and passenger sides, and impact collision design. But that's not all. This car isn't only safe but it's also very economical. \nB: You mean it has a cheaper price than similar models? \nA: Yes, this price is very affordable, but driving this car you'll also notice a significant annual saving in gas consumption. The main attraction for this model is the fuel economy. By the way, I didn't get to finish earlier—it's also great for getting your kids to school safely. \nB: With the cost of gasoline these days, that is a big plus. I think this model may be just what I'm looking for. \nA: Why don't you take it for a test drive, and think it over?", + "cleaned_text": "A: For you, I would recommend this one here. \nB: The compact? Why do you think that one is better than the others? \nA:This automobile is just right for your needs because not only is it compact for ease in city driving, but also, it has many safety features. I know that as a parent, you are concerned about safety in driving your kids to and from school or other activities, especially with its advanced lane-keeping assist system and automatic emergency braking that activates when potential collisions are detected.\nB: Sorry to jump in, but safety is definitely my top priority. What kind of safety features are we talking about? \nA: This model features anti-lock brakes, airbags on both driver and passenger sides, and impact collision design. But that's not all. This car isn't only safe but it's also very economical. \nB: You mean it has a cheaper price than similar models? \nA: Yes, this price is very affordable, but driving this car you'll also notice a significant annual saving in gas consumption. The main attraction for this model is the fuel economy. By the way, I didn't get to finish earlier—it's also great for getting your kids to school safely. \nB: With the cost of gasoline these days, that is a big plus. I think this model may be just what I'm looking for. \nA: Why don't you take it for a test drive, and think it over?", + "total_duration": 75.18467120181406, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "For you, I would recommend this one here.", + "original_text": "For you, I would recommend this one here.", + "start_time": 0, + "end_time": 2.5193650793650795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The compact? Why do you think that one is better than the others?", + "original_text": "The compact? Why do you think that one is better than the others?", + "start_time": 3.0999945817442853, + "end_time": 6.559767824374671, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_1_B.wav", + "silence_duration": 0.5806295023792056, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "This automobile is just right for your needs because not only is it compact for ease in city driving, but also, it has many safety features. I know that as a parent, you are concerned about safety in driving your kids to and from", + "original_text": "This automobile is just right for your needs because not only is it compact for ease in city driving, but also, it has many safety features. I know that as a parent, you are concerned about safety in driving your kids to and from [interrupt] school or other activities, especially with its advanced lane-keeping assist system and automatic emergency braking that activates when potential collisions are detected.", + "start_time": 7.108488560262535, + "end_time": 32.186039580670695, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_2_A.wav", + "silence_duration": 0.5487207358878647, + "is_interrupted": true, + "text_after_interrupt": "school or other activities, especially with its advanced lane-keeping assist system and automatic emergency braking that activates when potential collisions are detected." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but safety is definitely my top priority. What kind of safety features are we talking about?", + "original_text": "Sorry to jump in, but safety is definitely my top priority. What kind of safety features are we talking about?", + "start_time": 22.14340919518317, + "end_time": 28.122547517178635, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_3_B.wav", + "silence_duration": 0.5449458498418681, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "This model features anti-lock brakes, airbags on both driver and passenger sides, and impact collision design. But that's not all. This car isn't only safe but it's also very economical.", + "original_text": "This model features anti-lock brakes, airbags on both driver and passenger sides, and impact collision design. But that's not all. This car isn't only safe but it's also very economical.", + "start_time": 32.71239294892726, + "end_time": 45.03057888997034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_4_A.wav", + "silence_duration": 0.5263533682565646, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You mean it has a cheaper price than similar models?", + "original_text": "You mean it has a cheaper price than similar models?", + "start_time": 45.518307237253374, + "end_time": 47.96801245267287, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_5_B.wav", + "silence_duration": 0.48772834728303305, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, this price is very affordable, but driving this car you'll also notice a significant annual saving in gas consumption. The main attraction for this model is the fuel economy. By the way, I didn't get to finish earlier—it's also great for getting your kids to school safely.", + "original_text": "Yes, this price is very affordable, but driving this car you'll also notice a significant annual saving in gas consumption. The main attraction for this model is the fuel economy. By the way, I didn't get to finish earlier—it's also great for getting your kids to school safely.", + "start_time": 48.45359151903818, + "end_time": 65.17195886597696, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_6_A.wav", + "silence_duration": 0.48557906636530557, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "With the cost of gasoline these days, that is a big plus. I think this model may be just what I'm looking for.", + "original_text": "With the cost of gasoline these days, that is a big plus. I think this model may be just what I'm looking for.", + "start_time": 65.74394124498427, + "end_time": 71.79273943092531, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_7_B.wav", + "silence_duration": 0.5719823790073124, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why don't you take it for a test drive, and think it over?", + "original_text": "Why don't you take it for a test drive, and think it over?", + "start_time": 72.21252463259674, + "end_time": 75.18467882760808, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--386/temp/line_8_A.wav", + "silence_duration": 0.4197852016714261, + "is_interrupted": false + } + ] + }, + "DialogSum--val--387": { + "original_text": "A: Have you ever been involved in the auditing work? \nB: Yes, I have. I was employed by the financial section of the university ever since I graduated. I worked there for 3 years. Then I had worked in a bank for [interrupt] about two years before transitioning into a different role, where I gained extensive experience in financial analysis and risk assessment procedures that proved invaluable for my auditing career. \nA: Sorry to jump in, but when you say you worked at the bank, were you also doing auditing work there? \nB: Yes, I was. I mainly focused on internal audits at the bank. But I didn't mention that I worked there for 3 years before becoming an auditor. \nA: Oh, I see. So how long did it take you to become an auditor? \nB: Very short time. I became an auditor within three months.", + "cleaned_text": "A: Have you ever been involved in the auditing work? \nB:Yes, I have. I was employed by the financial section of the university ever since I graduated. I worked there for 3 years. Then I had worked in a bank for about two years before transitioning into a different role, where I gained extensive experience in financial analysis and risk assessment procedures that proved invaluable for my auditing career.\nA: Sorry to jump in, but when you say you worked at the bank, were you also doing auditing work there? \nB: Yes, I was. I mainly focused on internal audits at the bank. But I didn't mention that I worked there for 3 years before becoming an auditor. \nA: Oh, I see. So how long did it take you to become an auditor? \nB: Very short time. I became an auditor within three months.", + "total_duration": 38.48340136054422, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you ever been involved in the auditing work?", + "original_text": "Have you ever been involved in the auditing work?", + "start_time": 0, + "end_time": 2.5193650793650795, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I have. I was employed by the financial section of the university ever since I graduated. I worked there for 3 years. Then I had worked in a bank for", + "original_text": "Yes, I have. I was employed by the financial section of the university ever since I graduated. I worked there for 3 years. Then I had worked in a bank for [interrupt] about two years before transitioning into a different role, where I gained extensive experience in financial analysis and risk assessment procedures that proved invaluable for my auditing career.", + "start_time": 2.820088648555599, + "end_time": 21.709521755131565, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/temp/line_1_B.wav", + "silence_duration": 0.3007235691905196, + "is_interrupted": true, + "text_after_interrupt": "about two years before transitioning into a different role, where I gained extensive experience in financial analysis and risk assessment procedures that proved invaluable for my auditing career." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but when you say you worked at the bank, were you also doing auditing work there?", + "original_text": "Sorry to jump in, but when you say you worked at the bank, were you also doing auditing work there?", + "start_time": 11.736551233589612, + "end_time": 17.715689555585076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/temp/line_2_A.wav", + "silence_duration": 0.3642065018859728, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I was. I mainly focused on internal audits at the bank. But I didn't mention that I worked there for 3 years before becoming an auditor.", + "original_text": "Yes, I was. I mainly focused on internal audits at the bank. But I didn't mention that I worked there for 3 years before becoming an auditor.", + "start_time": 22.289422651931375, + "end_time": 29.63853829818988, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/temp/line_3_B.wav", + "silence_duration": 0.5799008967998083, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. So how long did it take you to become an auditor?", + "original_text": "Oh, I see. So how long did it take you to become an auditor?", + "start_time": 30.22383598190521, + "end_time": 35.18129629936553, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/temp/line_4_A.wav", + "silence_duration": 0.5852976837153334, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Very short time. I became an auditor within three months.", + "original_text": "Very short time. I became an auditor within three months.", + "start_time": 35.51126332039874, + "end_time": 38.483417515410075, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--387/temp/line_5_B.wav", + "silence_duration": 0.32996702103321224, + "is_interrupted": false + } + ] + }, + "DialogSum--val--388": { + "original_text": "A: Nice dress. How do I look? Be honest. \nB: Hmm... you look too dressed up. How about this purple top and these jeans? \nA: Well, that top is a little too tight, and those jeans aren't dressy enough. And I don't feel comfortable with that. What do you think, Vicky? You've been very [interrupt] thoughtful with your suggestions in the past, and I'd love to hear your opinion on whether we should keep looking for something more elegant yet comfortable. \nB: Sorry to interrupt, but I just wanted to say that comfort is key. If you don't feel comfortable, it might show. Maybe we should find something that balances both comfort and style? \nA: You're right, comfort is important. But I was going to ask Vicky because she's been very quiet up to now. \nB: Be confident. Wear styles you're going to be comfortable in.", + "cleaned_text": "A: Nice dress. How do I look? Be honest. \nB: Hmm... you look too dressed up. How about this purple top and these jeans? \nA:Well, that top is a little too tight, and those jeans aren't dressy enough. And I don't feel comfortable with that. What do you think, Vicky? You've been very thoughtful with your suggestions in the past, and I'd love to hear your opinion on whether we should keep looking for something more elegant yet comfortable.\nB: Sorry to interrupt, but I just wanted to say that comfort is key. If you don't feel comfortable, it might show. Maybe we should find something that balances both comfort and style? \nA: You're right, comfort is important. But I was going to ask Vicky because she's been very quiet up to now. \nB: Be confident. Wear styles you're going to be comfortable in.", + "total_duration": 38.493968253968255, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Nice dress. How do I look? Be honest.", + "original_text": "Nice dress. How do I look? Be honest.", + "start_time": 0, + "end_time": 3.1695238095238096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hmm... you look too dressed up. How about this purple top and these jeans?", + "original_text": "Hmm... you look too dressed up. How about this purple top and these jeans?", + "start_time": 3.7168927575825847, + "end_time": 8.407323596584853, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/temp/line_1_B.wav", + "silence_duration": 0.5473689480587753, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, that top is a little too tight, and those jeans aren't dressy enough. And I don't feel comfortable with that. What do you think, Vicky? You've been very", + "original_text": "Well, that top is a little too tight, and those jeans aren't dressy enough. And I don't feel comfortable with that. What do you think, Vicky? You've been very [interrupt] thoughtful with your suggestions in the past, and I'd love to hear your opinion on whether we should keep looking for something more elegant yet comfortable.", + "start_time": 8.743358515323308, + "end_time": 25.02054672394009, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/temp/line_2_A.wav", + "silence_duration": 0.33603491873845504, + "is_interrupted": true, + "text_after_interrupt": "thoughtful with your suggestions in the past, and I'd love to hear your opinion on whether we should keep looking for something more elegant yet comfortable." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I just wanted to say that comfort is key. If you don't feel comfortable, it might show. Maybe we should find something that balances both comfort and style?", + "original_text": "Sorry to interrupt, but I just wanted to say that comfort is key. If you don't feel comfortable, it might show. Maybe we should find something that balances both comfort and style?", + "start_time": 18.553789354325573, + "end_time": 28.271340374733736, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/temp/line_3_B.wav", + "silence_duration": 0.3994897541297133, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're right, comfort is important. But I was going to ask Vicky because she's been very quiet up to now.", + "original_text": "You're right, comfort is important. But I was going to ask Vicky because she's been very quiet up to now.", + "start_time": 28.736448111732752, + "end_time": 35.00583586683479, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/temp/line_4_A.wav", + "silence_duration": 0.46510773699901686, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Be confident. Wear styles you're going to be comfortable in.", + "original_text": "Be confident. Wear styles you're going to be comfortable in.", + "start_time": 35.57990202208599, + "end_time": 38.49400633047601, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--388/temp/line_5_B.wav", + "silence_duration": 0.5740661552511921, + "is_interrupted": false + } + ] + }, + "DialogSum--val--390": { + "original_text": "A: They got a divorce at last. \nB: It's inevitable. Their love was built on the sand, and this is why their marriage has landed on the [interrupt] path to ruin from the very beginning, with neither of them truly understanding each other's needs or making any real effort to build a strong emotional connection. \nA: Sorry to jump in, but do you think there was a specific moment when things started to fall apart? \nB: I believe it was a series of small issues that accumulated over time. But as I was saying, their marriage landed on the rocks because their foundation was weak. \nA: You said it. Love built on the sand will soon be on the rocks. \nB: That gives us a good lesson.", + "cleaned_text": "A: They got a divorce at last. \nB:It's inevitable. Their love was built on the sand, and this is why their marriage has landed on the path to ruin from the very beginning, with neither of them truly understanding each other's needs or making any real effort to build a strong emotional connection.\nA: Sorry to jump in, but do you think there was a specific moment when things started to fall apart? \nB: I believe it was a series of small issues that accumulated over time. But as I was saying, their marriage landed on the rocks because their foundation was weak. \nA: You said it. Love built on the sand will soon be on the rocks. \nB: That gives us a good lesson.", + "total_duration": 29.80013605442177, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "They got a divorce at last.", + "original_text": "They got a divorce at last.", + "start_time": 0, + "end_time": 1.7298866213151927, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's inevitable. Their love was built on the sand, and this is why their marriage has landed on the", + "original_text": "It's inevitable. Their love was built on the sand, and this is why their marriage has landed on the [interrupt] path to ruin from the very beginning, with neither of them truly understanding each other's needs or making any real effort to build a strong emotional connection.", + "start_time": 2.1284569889794134, + "end_time": 15.305781252017962, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/temp/line_1_B.wav", + "silence_duration": 0.3985703676642207, + "is_interrupted": true, + "text_after_interrupt": "path to ruin from the very beginning, with neither of them truly understanding each other's needs or making any real effort to build a strong emotional connection." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but do you think there was a specific moment when things started to fall apart?", + "original_text": "Sorry to jump in, but do you think there was a specific moment when things started to fall apart?", + "start_time": 7.608366286031568, + "end_time": 13.227595310974879, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/temp/line_2_A.wav", + "silence_duration": 0.4315369140633829, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I believe it was a series of small issues that accumulated over time. But as I was saying, their marriage landed on the rocks because their foundation was weak.", + "original_text": "I believe it was a series of small issues that accumulated over time. But as I was saying, their marriage landed on the rocks because their foundation was weak.", + "start_time": 15.61733811832094, + "end_time": 23.813982109250645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/temp/line_3_B.wav", + "silence_duration": 0.3115568663029791, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You said it. Love built on the sand will soon be on the rocks.", + "original_text": "You said it. Love built on the sand will soon be on the rocks.", + "start_time": 24.248130774742563, + "end_time": 27.94010356385821, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/temp/line_4_A.wav", + "silence_duration": 0.43414866549191855, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That gives us a good lesson.", + "original_text": "That gives us a good lesson.", + "start_time": 28.465013993210214, + "end_time": 29.800161385500463, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--390/temp/line_5_B.wav", + "silence_duration": 0.5249104293520035, + "is_interrupted": false + } + ] + }, + "DialogSum--val--392": { + "original_text": "A: Ah, where am I? \nB: Excuse me, do you need any help? \nA: I want to go to the Science Museum. But I've been lost for the past few hours, and I can't use these ticket [interrupt] machines properly because the interface is quite different from what I'm used to back home and the instructions aren't very clear for first-time users. \nB: Oh, don't worry, I can show you how to use the ticket machine. Where exactly are you trying to go? \nA: The Science Museum. But I also wanted to know how often the trains come around this time of day. \nB: Usually they come about every 6 minutes. Just press this button on the ticket machine, then, get on the train at platform number four. \nA: Ok, and where do I get off the train? \nB: Get off at State Street Station, 3 stops from here. \nA: Ok, I got it, thanks for your help. \nB: No problem. By the way, did you manage to get your ticket from the machine? \nA: Oh, right, I still need to do that. Thanks for reminding me! \nB: No worries. Good luck!", + "cleaned_text": "A: Ah, where am I? \nB: Excuse me, do you need any help? \nA:I want to go to the Science Museum. But I've been lost for the past few hours, and I can't use these ticket machines properly because the interface is quite different from what I'm used to back home and the instructions aren't very clear for first-time users.\nB: Oh, don't worry, I can show you how to use the ticket machine. Where exactly are you trying to go? \nA: The Science Museum. But I also wanted to know how often the trains come around this time of day. \nB: Usually they come about every 6 minutes. Just press this button on the ticket machine, then, get on the train at platform number four. \nA: Ok, and where do I get off the train? \nB: Get off at State Street Station, 3 stops from here. \nA: Ok, I got it, thanks for your help. \nB: No problem. By the way, did you manage to get your ticket from the machine? \nA: Oh, right, I still need to do that. Thanks for reminding me! \nB: No worries. Good luck!", + "total_duration": 52.07764172335601, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Ah, where am I?", + "original_text": "Ah, where am I?", + "start_time": 0, + "end_time": 1.195827664399093, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Excuse me, do you need any help?", + "original_text": "Excuse me, do you need any help?", + "start_time": 1.7819895306010896, + "end_time": 3.3725564240251256, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_1_B.wav", + "silence_duration": 0.5861618662019966, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I want to go to the Science Museum. But I've been lost for the past few hours, and I can't use these ticket", + "original_text": "I want to go to the Science Museum. But I've been lost for the past few hours, and I can't use these ticket [interrupt] machines properly because the interface is quite different from what I'm used to back home and the instructions aren't very clear for first-time users.", + "start_time": 3.960224404505729, + "end_time": 18.55396590110437, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_2_A.wav", + "silence_duration": 0.5876679804806035, + "is_interrupted": true, + "text_after_interrupt": "machines properly because the interface is quite different from what I'm used to back home and the instructions aren't very clear for first-time users." + }, + { + "speaker": "B", + "text": "Oh, don't worry, I can show you how to use the ticket machine. Where exactly are you trying to go?", + "original_text": "Oh, don't worry, I can show you how to use the ticket machine. Where exactly are you trying to go?", + "start_time": 11.053920549630446, + "end_time": 16.406120096115707, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_3_B.wav", + "silence_duration": 0.510610697345367, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The Science Museum. But I also wanted to know how often the trains come around this time of day.", + "original_text": "The Science Museum. But I also wanted to know how often the trains come around this time of day.", + "start_time": 19.067366430482828, + "end_time": 25.26709432163929, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_4_A.wav", + "silence_duration": 0.5134005293784599, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Usually they come about every 6 minutes. Just press this button on the ticket machine, then, get on the train at platform number four.", + "original_text": "Usually they come about every 6 minutes. Just press this button on the ticket machine, then, get on the train at platform number four.", + "start_time": 25.79337619439003, + "end_time": 32.411063269219966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_5_B.wav", + "silence_duration": 0.5262818727507399, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ok, and where do I get off the train?", + "original_text": "Ok, and where do I get off the train?", + "start_time": 32.809066340500195, + "end_time": 35.444531193107906, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_6_A.wav", + "silence_duration": 0.3980030712802297, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Get off at State Street Station, 3 stops from here.", + "original_text": "Get off at State Street Station, 3 stops from here.", + "start_time": 35.9273378217187, + "end_time": 38.678902447569044, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_7_B.wav", + "silence_duration": 0.4828066286107966, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ok, I got it, thanks for your help.", + "original_text": "Ok, I got it, thanks for your help.", + "start_time": 39.19047736931968, + "end_time": 42.36000117884349, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_8_A.wav", + "silence_duration": 0.5115749217506333, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem. By the way, did you manage to get your ticket from the machine?", + "original_text": "No problem. By the way, did you manage to get your ticket from the machine?", + "start_time": 42.66569034945975, + "end_time": 46.63630259435771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_9_B.wav", + "silence_duration": 0.3056891706162604, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, right, I still need to do that. Thanks for reminding me!", + "original_text": "Oh, right, I still need to do that. Thanks for reminding me!", + "start_time": 46.96907999006839, + "end_time": 50.27792352748335, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_10_A.wav", + "silence_duration": 0.332777395710677, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No worries. Good luck!", + "original_text": "No worries. Good luck!", + "start_time": 50.742496786580816, + "end_time": 52.07764417887107, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--392/temp/line_11_B.wav", + "silence_duration": 0.46457325909746344, + "is_interrupted": false + } + ] + }, + "DialogSum--val--393": { + "original_text": "A: Have you got the list of who is coming to the party? \nB: Yes, I do. And I've told them to keep the date secret. John hates that kind of thing. Do you remember when he found out that we bought him a birthday cake last year and that surprised [interrupt] look on his face was priceless, but he was so embarrassed after that and kept apologizing for not being prepared with a proper thank-you speech.\nA: Oh, that was a disaster! But speaking of surprises, do you think everyone will manage to keep this one a secret? \nB: I hope so, but this is different. Getting married is special and we've known him and Anna for years. Everyone's looking forward to it. I'll pick you up from the office and will go there together, shall we? \nA: That'll be fine, thanks. By the way, what were you saying about the Christmas party?", + "cleaned_text": "A: Have you got the list of who is coming to the party? \nB:Yes, I do. And I've told them to keep the date secret. John hates that kind of thing. Do you remember when he found out that we bought him a birthday cake last year and that surprised look on his face was priceless, but he was so embarrassed after that and kept apologizing for not being prepared with a proper thank-you speech.\nA: Oh, that was a disaster! But speaking of surprises, do you think everyone will manage to keep this one a secret? \nB: I hope so, but this is different. Getting married is special and we've known him and Anna for years. Everyone's looking forward to it. I'll pick you up from the office and will go there together, shall we? \nA: That'll be fine, thanks. By the way, what were you saying about the Christmas party?", + "total_duration": 35.214784580498865, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Have you got the list of who is coming to the party?", + "original_text": "Have you got the list of who is coming to the party?", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I do. And I've told them to keep the date secret. John hates that kind of thing. Do you remember when he found out that we bought him a birthday cake last year and that surprised", + "original_text": "Yes, I do. And I've told them to keep the date secret. John hates that kind of thing. Do you remember when he found out that we bought him a birthday cake last year and that surprised [interrupt] look on his face was priceless, but he was so embarrassed after that and kept apologizing for not being prepared with a proper thank-you speech.", + "start_time": 3.0293817324694263, + "end_time": 19.144030258546522, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/temp/line_1_B.wav", + "silence_duration": 0.4403567891587685, + "is_interrupted": true, + "text_after_interrupt": "look on his face was priceless, but he was so embarrassed after that and kept apologizing for not being prepared with a proper thank-you speech." + }, + { + "speaker": "A", + "text": "Oh, that was a disaster! But speaking of surprises, do you think everyone will manage to keep this one a secret?", + "original_text": "Oh, that was a disaster! But speaking of surprises, do you think everyone will manage to keep this one a secret?", + "start_time": 12.108384000043122, + "end_time": 18.923440689385526, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/temp/line_2_A.wav", + "silence_duration": 0.5984464452759819, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I hope so, but this is different. Getting married is special and we've known him and Anna for years. Everyone's looking forward to it. I'll pick you up from the office and will go there together, shall we?", + "original_text": "I hope so, but this is different. Getting married is special and we've known him and Anna for years. Everyone's looking forward to it. I'll pick you up from the office and will go there together, shall we?", + "start_time": 19.7161605565351, + "end_time": 29.88650069258952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/temp/line_3_B.wav", + "silence_duration": 0.5721302979885783, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That'll be fine, thanks. By the way, what were you saying about the Christmas party?", + "original_text": "That'll be fine, thanks. By the way, what were you saying about the Christmas party?", + "start_time": 30.30378970347088, + "end_time": 35.214810111634144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--393/temp/line_4_A.wav", + "silence_duration": 0.4172890108813595, + "is_interrupted": false + } + ] + }, + "DialogSum--val--394": { + "original_text": "A: Excuse me, could you tell me where the nearest post office is? \nB: Yes, walk down this road and then turn left when you get to the third crossing. You will see it [interrupt] on your right, just past the bakery which has a distinctive red awning and is famous for its freshly baked croissants every morning. \nA: Sorry to interrupt, but could you tell me if there are any landmarks I should look out for on the way? \nB: Ah, yes. When you turn left, you will see a five-star hotel with a tea shop on the left. The post office is just next to it. It's a three-storey building. \nA: How long will it take to get there if I walk? \nB: About 30 minutes? \nA: Oh, that's too long. \nB: Uh, well, you can take bus 232 or take the subway if you're in a hurry. \nA: Actually, I think getting a taxi might be better. But you mentioned something about a bus? \nB: Yes, bus 232 can also take you there, but a taxi would be quicker. \nA: Thanks a lot. \nB: You are welcome.", + "cleaned_text": "A: Excuse me, could you tell me where the nearest post office is? \nB:Yes, walk down this road and then turn left when you get to the third crossing. You will see it on your right, just past the bakery which has a distinctive red awning and is famous for its freshly baked croissants every morning.\nA: Sorry to interrupt, but could you tell me if there are any landmarks I should look out for on the way? \nB: Ah, yes. When you turn left, you will see a five-star hotel with a tea shop on the left. The post office is just next to it. It's a three-storey building. \nA: How long will it take to get there if I walk? \nB: About 30 minutes? \nA: Oh, that's too long. \nB: Uh, well, you can take bus 232 or take the subway if you're in a hurry. \nA: Actually, I think getting a taxi might be better. But you mentioned something about a bus? \nB: Yes, bus 232 can also take you there, but a taxi would be quicker. \nA: Thanks a lot. \nB: You are welcome.", + "total_duration": 49.77854875283447, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, could you tell me where the nearest post office is?", + "original_text": "Excuse me, could you tell me where the nearest post office is?", + "start_time": 0, + "end_time": 3.297233560090703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, walk down this road and then turn left when you get to the third crossing. You will see it", + "original_text": "Yes, walk down this road and then turn left when you get to the third crossing. You will see it [interrupt] on your right, just past the bakery which has a distinctive red awning and is famous for its freshly baked croissants every morning.", + "start_time": 3.799098325017103, + "end_time": 14.898236647012567, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_1_B.wav", + "silence_duration": 0.5018647649263999, + "is_interrupted": true, + "text_after_interrupt": "on your right, just past the bakery which has a distinctive red awning and is famous for its freshly baked croissants every morning." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but could you tell me if there are any landmarks I should look out for on the way?", + "original_text": "Sorry to interrupt, but could you tell me if there are any landmarks I should look out for on the way?", + "start_time": 8.152839821615743, + "end_time": 13.725628937262002, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_2_A.wav", + "silence_duration": 0.49722299970020467, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ah, yes. When you turn left, you will see a five-star hotel with a tea shop on the left. The post office is just next to it. It's a three-storey building.", + "original_text": "Ah, yes. When you turn left, you will see a five-star hotel with a tea shop on the left. The post office is just next to it. It's a three-storey building.", + "start_time": 15.458908039626268, + "end_time": 24.247660874093388, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_3_B.wav", + "silence_duration": 0.560671392613701, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How long will it take to get there if I walk?", + "original_text": "How long will it take to get there if I walk?", + "start_time": 24.693340018332314, + "end_time": 27.026945460509186, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_4_A.wav", + "silence_duration": 0.4456791442389272, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "About 30 minutes?", + "original_text": "About 30 minutes?", + "start_time": 27.42391739413056, + "end_time": 28.619745058529652, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_5_B.wav", + "silence_duration": 0.3969719336213726, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, that's too long.", + "original_text": "Oh, that's too long.", + "start_time": 29.084502544313708, + "end_time": 30.593799596467903, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_6_A.wav", + "silence_duration": 0.4647574857840546, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Uh, well, you can take bus 232 or take the subway if you're in a hurry.", + "original_text": "Uh, well, you can take bus 232 or take the subway if you're in a hurry.", + "start_time": 31.117810772702356, + "end_time": 36.249420750026616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_7_B.wav", + "silence_duration": 0.5240111762344519, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, I think getting a taxi might be better. But you mentioned something about a bus?", + "original_text": "Actually, I think getting a taxi might be better. But you mentioned something about a bus?", + "start_time": 36.845442360750766, + "end_time": 42.081542133993395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_8_A.wav", + "silence_duration": 0.5960216107241515, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, bus 232 can also take you there, but a taxi would be quicker.", + "original_text": "Yes, bus 232 can also take you there, but a taxi would be quicker.", + "start_time": 42.50401807087731, + "end_time": 47.18283893255531, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_9_B.wav", + "silence_duration": 0.4224759368839149, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks a lot.", + "original_text": "Thanks a lot.", + "start_time": 47.55259805406925, + "end_time": 48.562666081280135, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_10_A.wav", + "silence_duration": 0.36975912151393575, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You are welcome.", + "original_text": "You are welcome.", + "start_time": 48.91945214810091, + "end_time": 49.778590470096375, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--394/temp/line_11_B.wav", + "silence_duration": 0.3567860668207731, + "is_interrupted": false + } + ] + }, + "DialogSum--val--395": { + "original_text": "A: First, I'll spend a few days in Vancouver. Then I'll take a train through the Rocky [interrupt] Mountains, which should be a breathtaking experience with stunning views of glaciers, wildlife sightings, and some of the most dramatic landscapes in North America.\nB: Oh, you're riding through the Rocky Mountains? That's really exciting! Have you already booked the train tickets?\nA: Yes, I have. After that, I'll fly to Toronto and take a bus to Niagara Falls. I will take a boat under that huge waterfall.\nB: Wow, that's wonderful. You're so lucky! Have you thought about what to do after Niagara Falls?\nA: Well, I hope I don't get seasick. I'll finish my trip in Nova Scotia. I'd like to bike around some small fishing villages.\nB: That sounds amazing! By the way, you mentioned the Rocky Mountains earlier—what route is the train taking?\nA: It's the famous route that goes through Jasper and Banff. I'll make sure to take lots of pictures!", + "cleaned_text": "A:First, I'll spend a few days in Vancouver. Then I'll take a train through the Rocky Mountains, which should be a breathtaking experience with stunning views of glaciers, wildlife sightings, and some of the most dramatic landscapes in North America.\nB: Oh, you're riding through the Rocky Mountains? That's really exciting! Have you already booked the train tickets?\nA: Yes, I have. After that, I'll fly to Toronto and take a bus to Niagara Falls. I will take a boat under that huge waterfall.\nB: Wow, that's wonderful. You're so lucky! Have you thought about what to do after Niagara Falls?\nA: Well, I hope I don't get seasick. I'll finish my trip in Nova Scotia. I'd like to bike around some small fishing villages.\nB: That sounds amazing! By the way, you mentioned the Rocky Mountains earlier—what route is the train taking?\nA: It's the famous route that goes through Jasper and Banff. I'll make sure to take lots of pictures!", + "total_duration": 46.98249433106576, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "First, I'll spend a few days in Vancouver. Then I'll take a train through the Rocky", + "original_text": "First, I'll spend a few days in Vancouver. Then I'll take a train through the Rocky [interrupt] Mountains, which should be a breathtaking experience with stunning views of glaciers, wildlife sightings, and some of the most dramatic landscapes in North America.", + "start_time": 0, + "end_time": 13.676553287981859, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "Mountains, which should be a breathtaking experience with stunning views of glaciers, wildlife sightings, and some of the most dramatic landscapes in North America." + }, + { + "speaker": "B", + "text": "Oh, you're riding through the Rocky Mountains? That's really exciting! Have you already booked the train tickets?", + "original_text": "Oh, you're riding through the Rocky Mountains? That's really exciting! Have you already booked the train tickets?", + "start_time": 4.3769614512471655, + "end_time": 9.566621315192744, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/temp/line_1_B.wav", + "silence_duration": 0.3445235530904634, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I have. After that, I'll fly to Toronto and take a bus to Niagara Falls. I will take a boat under that huge waterfall.", + "original_text": "Yes, I have. After that, I'll fly to Toronto and take a bus to Niagara Falls. I will take a boat under that huge waterfall.", + "start_time": 13.997455698737525, + "end_time": 22.170879735018705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/temp/line_2_A.wav", + "silence_duration": 0.3209024107556665, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wow, that's wonderful. You're so lucky! Have you thought about what to do after Niagara Falls?", + "original_text": "Wow, that's wonderful. You're so lucky! Have you thought about what to do after Niagara Falls?", + "start_time": 22.525287115509602, + "end_time": 27.575627251564022, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/temp/line_3_B.wav", + "silence_duration": 0.35440738049089643, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I hope I don't get seasick. I'll finish my trip in Nova Scotia. I'd like to bike around some small fishing villages.", + "original_text": "Well, I hope I don't get seasick. I'll finish my trip in Nova Scotia. I'd like to bike around some small fishing villages.", + "start_time": 28.025327025259315, + "end_time": 35.11902317038403, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/temp/line_4_A.wav", + "silence_duration": 0.449699773695292, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds amazing! By the way, you mentioned the Rocky Mountains earlier—what route is the train taking?", + "original_text": "That sounds amazing! By the way, you mentioned the Rocky Mountains earlier—what route is the train taking?", + "start_time": 35.547490565879386, + "end_time": 40.64427061123086, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/temp/line_5_B.wav", + "silence_duration": 0.4284673954953513, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's the famous route that goes through Jasper and Banff. I'll make sure to take lots of pictures!", + "original_text": "It's the famous route that goes through Jasper and Banff. I'll make sure to take lots of pictures!", + "start_time": 41.18912275382509, + "end_time": 46.98250143863235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--395/temp/line_6_A.wav", + "silence_duration": 0.5448521425942283, + "is_interrupted": false + } + ] + }, + "DialogSum--val--396": { + "original_text": "A: You are not happy, are you? \nB: No. \nA: What makes you unhappy? \nB: My parents. \nA: Why? I guess they must love you very [interrupt] much and want the best for you, even if their methods sometimes feel overwhelming or restrictive to you as you're growing up and developing your own identity. \nB: They do, but they always want me to do what they wish, regardless of my feeling, just because I'm the only child in the family! \nA: Oh, I see. There is a generation gap between your parents and you. \nB: What is it? Generation gap? \nA: It refers to a lack of understanding between parents and [interrupt] children due to differences in age, experiences, and perspectives, which can lead to conflicts when expectations and values don't align between different generations in a family. \nB: That's true, I don't think they understand me. But wait, what were you saying about understanding between parents and...? \nA: Oh, I was saying it refers to a lack of understanding between parents and children. But have you ever tried to understand them? \nB: Maybe not much.", + "cleaned_text": "A: You are not happy, are you? \nB: No. \nA: What makes you unhappy? \nB: My parents. \nA:Why? I guess they must love you very much and want the best for you, even if their methods sometimes feel overwhelming or restrictive to you as you're growing up and developing your own identity.\nB: They do, but they always want me to do what they wish, regardless of my feeling, just because I'm the only child in the family! \nA: Oh, I see. There is a generation gap between your parents and you. \nB: What is it? Generation gap? \nA:It refers to a lack of understanding between parents and children due to differences in age, experiences, and perspectives, which can lead to conflicts when expectations and values don't align between different generations in a family.\nB: That's true, I don't think they understand me. But wait, what were you saying about understanding between parents and...? \nA: Oh, I was saying it refers to a lack of understanding between parents and children. But have you ever tried to understand them? \nB: Maybe not much.", + "total_duration": 49.98671201814059, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You are not happy, are you?", + "original_text": "You are not happy, are you?", + "start_time": 0, + "end_time": 1.5325170068027212, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No.", + "original_text": "No.", + "start_time": 2.0506161459615107, + "end_time": 2.6078950575261364, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_1_B.wav", + "silence_duration": 0.5180991391587896, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What makes you unhappy?", + "original_text": "What makes you unhappy?", + "start_time": 2.914881688966377, + "end_time": 4.308078967877941, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_2_A.wav", + "silence_duration": 0.3069866314402409, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My parents.", + "original_text": "My parents.", + "start_time": 4.702968158508745, + "end_time": 5.71303618571963, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_3_B.wav", + "silence_duration": 0.3948891906308033, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why? I guess they must love you very", + "original_text": "Why? I guess they must love you very [interrupt] much and want the best for you, even if their methods sometimes feel overwhelming or restrictive to you as you're growing up and developing your own identity.", + "start_time": 6.149283279673198, + "end_time": 17.677990762666397, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_4_A.wav", + "silence_duration": 0.43624709395356864, + "is_interrupted": true, + "text_after_interrupt": "much and want the best for you, even if their methods sometimes feel overwhelming or restrictive to you as you're growing up and developing your own identity." + }, + { + "speaker": "B", + "text": "They do, but they always want me to do what they wish, regardless of my feeling, just because I'm the only child in the family!", + "original_text": "They do, but they always want me to do what they wish, regardless of my feeling, just because I'm the only child in the family!", + "start_time": 8.958897792144853, + "end_time": 15.274725456543946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_5_B.wav", + "silence_duration": 0.38823964508394765, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I see. There is a generation gap between your parents and you.", + "original_text": "Oh, I see. There is a generation gap between your parents and you.", + "start_time": 18.046332779845343, + "end_time": 22.179484707282985, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_6_A.wav", + "silence_duration": 0.368342017178945, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What is it? Generation gap?", + "original_text": "What is it? Generation gap?", + "start_time": 22.530155702504853, + "end_time": 24.085892663956102, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_7_B.wav", + "silence_duration": 0.35067099522186856, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It refers to a lack of understanding between parents and", + "original_text": "It refers to a lack of understanding between parents and [interrupt] children due to differences in age, experiences, and perspectives, which can lead to conflicts when expectations and values don't align between different generations in a family.", + "start_time": 24.58264942104153, + "end_time": 38.47979227818439, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_8_A.wav", + "silence_duration": 0.4967567570854297, + "is_interrupted": true, + "text_after_interrupt": "children due to differences in age, experiences, and perspectives, which can lead to conflicts when expectations and values don't align between different generations in a family." + }, + { + "speaker": "B", + "text": "That's true, I don't think they understand me. But wait, what were you saying about understanding between parents and...?", + "original_text": "That's true, I don't think they understand me. But wait, what were you saying about understanding between parents and...?", + "start_time": 35.42387932614922, + "end_time": 41.10115823771385, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_9_B.wav", + "silence_duration": 0.473287447321059, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was saying it refers to a lack of understanding between parents and children. But have you ever tried to understand them?", + "original_text": "Oh, I was saying it refers to a lack of understanding between parents and children. But have you ever tried to understand them?", + "start_time": 41.54682283619744, + "end_time": 48.67534891329495, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_10_A.wav", + "silence_duration": 0.44566459848359263, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Maybe not much.", + "original_text": "Maybe not much.", + "start_time": 48.9882756567098, + "end_time": 49.986733706596425, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--396/temp/line_11_B.wav", + "silence_duration": 0.3129267434148571, + "is_interrupted": false + } + ] + }, + "DialogSum--val--398": { + "original_text": "A: Hello, reservation desk. How can I help you? \nB: I'd like to book a room. \nA: And what kind of room would you like ma'am? We got single rooms, double rooms, standard rooms, suites, and deluxe [interrupt] suites available, each with unique amenities to suit your needs including complimentary breakfast, high-speed internet, and access to our premium spa facilities for the ultimate relaxation experience. \nB: Sorry, could you tell me the rate for a standard room? \nA: Sure, it's $79 a night. \nB: I'd like a standard room. \nA: What date would you check in, ma'am? \nB: December twenty-third, please. \nA: How long do you plan to stay? \nB: Four days. \nA: Could you give me your name and phone number? \nB: Nancy Brown, my phone number is 7096785634. Oh, you mentioned deluxe suites earlier—what's the rate for those? \nA: The deluxe suites are $150 a night. Would you like to change your booking? \nB: No, I'll stick with the standard room. Thank you.", + "cleaned_text": "A: Hello, reservation desk. How can I help you? \nB: I'd like to book a room. \nA:And what kind of room would you like ma'am? We got single rooms, double rooms, standard rooms, suites, and deluxe suites available, each with unique amenities to suit your needs including complimentary breakfast, high-speed internet, and access to our premium spa facilities for the ultimate relaxation experience.\nB: Sorry, could you tell me the rate for a standard room? \nA: Sure, it's $79 a night. \nB: I'd like a standard room. \nA: What date would you check in, ma'am? \nB: December twenty-third, please. \nA: How long do you plan to stay? \nB: Four days. \nA: Could you give me your name and phone number? \nB: Nancy Brown, my phone number is 7096785634. Oh, you mentioned deluxe suites earlier—what's the rate for those? \nA: The deluxe suites are $150 a night. Would you like to change your booking? \nB: No, I'll stick with the standard room. Thank you.", + "total_duration": 60.22666666666667, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, reservation desk. How can I help you?", + "original_text": "Hello, reservation desk. How can I help you?", + "start_time": 0, + "end_time": 3.81968253968254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like to book a room.", + "original_text": "I'd like to book a room.", + "start_time": 4.402142907810606, + "end_time": 5.760510254749382, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_1_B.wav", + "silence_duration": 0.5824603681280658, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And what kind of room would you like ma'am? We got single rooms, double rooms, standard rooms, suites, and deluxe", + "original_text": "And what kind of room would you like ma'am? We got single rooms, double rooms, standard rooms, suites, and deluxe [interrupt] suites available, each with unique amenities to suit your needs including complimentary breakfast, high-speed internet, and access to our premium spa facilities for the ultimate relaxation experience.", + "start_time": 6.353746580566531, + "end_time": 25.730798734761542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_2_A.wav", + "silence_duration": 0.5932363258171489, + "is_interrupted": true, + "text_after_interrupt": "suites available, each with unique amenities to suit your needs including complimentary breakfast, high-speed internet, and access to our premium spa facilities for the ultimate relaxation experience." + }, + { + "speaker": "B", + "text": "Sorry, could you tell me the rate for a standard room?", + "original_text": "Sorry, could you tell me the rate for a standard room?", + "start_time": 13.586762453582404, + "end_time": 16.442816875351113, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_3_B.wav", + "silence_duration": 0.5994885373142633, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, it's $79 a night.", + "original_text": "Sure, it's $79 a night.", + "start_time": 26.184562510050263, + "end_time": 28.634267725469766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_4_A.wav", + "silence_duration": 0.45376377528872125, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like a standard room.", + "original_text": "I'd like a standard room.", + "start_time": 29.080282833322403, + "end_time": 30.438650180261178, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_5_B.wav", + "silence_duration": 0.44601510785263765, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What date would you check in, ma'am?", + "original_text": "What date would you check in, ma'am?", + "start_time": 30.873271043940182, + "end_time": 32.52188782398554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_6_A.wav", + "silence_duration": 0.4346208636790035, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "December twenty-third, please.", + "original_text": "December twenty-third, please.", + "start_time": 32.86298256700827, + "end_time": 34.453549460432306, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_7_B.wav", + "silence_duration": 0.34109474302273085, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How long do you plan to stay?", + "original_text": "How long do you plan to stay?", + "start_time": 34.848256106543914, + "end_time": 36.46204295461648, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_8_A.wav", + "silence_duration": 0.39470664611160544, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Four days.", + "original_text": "Four days.", + "start_time": 36.88273901355942, + "end_time": 37.77670726752768, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_9_B.wav", + "silence_duration": 0.4206960589429455, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Could you give me your name and phone number?", + "original_text": "Could you give me your name and phone number?", + "start_time": 38.37125508544639, + "end_time": 40.3797811625439, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_10_A.wav", + "silence_duration": 0.5945478179187165, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Nancy Brown, my phone number is 7096785634. Oh, you mentioned deluxe suites earlier—what's the rate for those?", + "original_text": "Nancy Brown, my phone number is 7096785634. Oh, you mentioned deluxe suites earlier—what's the rate for those?", + "start_time": 40.927647717162195, + "end_time": 51.864246356617976, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_11_B.wav", + "silence_duration": 0.5478665546182919, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The deluxe suites are $150 a night. Would you like to change your booking?", + "original_text": "The deluxe suites are $150 a night. Would you like to change your booking?", + "start_time": 52.43949660717044, + "end_time": 57.62915647111602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_12_A.wav", + "silence_duration": 0.5752502505524681, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, I'll stick with the standard room. Thank you.", + "original_text": "No, I'll stick with the standard room. Thank you.", + "start_time": 58.13689332988669, + "end_time": 60.22668924825403, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--398/temp/line_13_B.wav", + "silence_duration": 0.5077368587706688, + "is_interrupted": false + } + ] + }, + "DialogSum--val--399": { + "original_text": "A: Excuse me, do you think I can return these gloves? \nB: What's the problem with them? \nA: They're too small. \nB: Didn't you try them on before you [interrupt] left the store or decided to keep them? I'm asking because our return policy requires items to be in original condition with tags attached. \nA: Well, as a matter of fact, I received them as a gift. \nB: OK, I see. I'm afraid I can't give you a cash return, but you can change them. \nA: I believe you sell these gloves for $29.95. \nB: Yes, I'll take the gloves of the same price for you to [interrupt] exchange them right away or you can browse our new collection that just arrived this morning with many stylish options. \nA: Sorry, I just noticed that pair over there looks nice. May I have a try? \nB: It's for $35.25. If you like to take that pair, you'll pay some extra money.", + "cleaned_text": "A: Excuse me, do you think I can return these gloves? \nB: What's the problem with them? \nA: They're too small. \nB:Didn't you try them on before you left the store or decided to keep them? I'm asking because our return policy requires items to be in original condition with tags attached.\nA: Well, as a matter of fact, I received them as a gift. \nB: OK, I see. I'm afraid I can't give you a cash return, but you can change them. \nA: I believe you sell these gloves for $29.95. \nB:Yes, I'll take the gloves of the same price for you to exchange them right away or you can browse our new collection that just arrived this morning with many stylish options.\nA: Sorry, I just noticed that pair over there looks nice. May I have a try? \nB: It's for $35.25. If you like to take that pair, you'll pay some extra money.", + "total_duration": 42.43818594104308, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, do you think I can return these gloves?", + "original_text": "Excuse me, do you think I can return these gloves?", + "start_time": 0, + "end_time": 3.053424036281179, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What's the problem with them?", + "original_text": "What's the problem with them?", + "start_time": 3.5010931133806458, + "end_time": 4.859460460319421, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_1_B.wav", + "silence_duration": 0.4476690770994668, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They're too small.", + "original_text": "They're too small.", + "start_time": 5.272216931272317, + "end_time": 6.363554799753043, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_2_A.wav", + "silence_duration": 0.4127564709528958, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Didn't you try them on before you", + "original_text": "Didn't you try them on before you [interrupt] left the store or decided to keep them? I'm asking because our return policy requires items to be in original condition with tags attached.", + "start_time": 6.718481231261396, + "end_time": 15.507234065728516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_3_B.wav", + "silence_duration": 0.35492643150835373, + "is_interrupted": true, + "text_after_interrupt": "left the store or decided to keep them? I'm asking because our return policy requires items to be in original condition with tags attached." + }, + { + "speaker": "A", + "text": "Well, as a matter of fact, I received them as a gift.", + "original_text": "Well, as a matter of fact, I received them as a gift.", + "start_time": 8.29743814736117, + "end_time": 11.234762410399718, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_4_A.wav", + "silence_duration": 0.49332200267841986, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK, I see. I'm afraid I can't give you a cash return, but you can change them.", + "original_text": "OK, I see. I'm afraid I can't give you a cash return, but you can change them.", + "start_time": 16.032368288292645, + "end_time": 20.629919308700806, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_5_B.wav", + "silence_duration": 0.5251342225641279, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I believe you sell these gloves for $29.95.", + "original_text": "I believe you sell these gloves for $29.95.", + "start_time": 20.987184862634994, + "end_time": 24.539837923859483, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_6_A.wav", + "silence_duration": 0.3572655539341883, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'll take the gloves of the same price for you to", + "original_text": "Yes, I'll take the gloves of the same price for you to [interrupt] exchange them right away or you can browse our new collection that just arrived this morning with many stylish options.", + "start_time": 25.036666292708414, + "end_time": 33.12882048771975, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_7_B.wav", + "silence_duration": 0.4968283688489298, + "is_interrupted": true, + "text_after_interrupt": "exchange them right away or you can browse our new collection that just arrived this morning with many stylish options." + }, + { + "speaker": "A", + "text": "Sorry, I just noticed that pair over there looks nice. May I have a try?", + "original_text": "Sorry, I just noticed that pair over there looks nice. May I have a try?", + "start_time": 31.75813216355207, + "end_time": 37.05228182341602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_8_A.wav", + "silence_duration": 0.3196890819600615, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's for $35.25. If you like to take that pair, you'll pay some extra money.", + "original_text": "It's for $35.25. If you like to take that pair, you'll pay some extra money.", + "start_time": 37.5620384079126, + "end_time": 42.43822888410308, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--399/temp/line_9_B.wav", + "silence_duration": 0.5097565844965886, + "is_interrupted": false + } + ] + }, + "DialogSum--val--402": { + "original_text": "A: Excuse me. I need to refill this prescription. \nB: It says on the bottle here that you can have two refills. \nA: Yes, I need to refill it today. \nB: Alright. I'm sorry, Miss. According to our file, this prescription has already been refilled [interrupt] twice within the past month, which means we cannot process another refill until you obtain a new prescription from your doctor. \nA: Oh, wait—are you sure? I was worried about that. I couldn't remember if I had it refilled twice yet or not. \nB: It looks like you have. You will need to see your doctor to get a new prescription. \nA: Listen. This is an emergency. I tried to call my doctor, but he is out of town. So I can't see him in time. I need this medicine. It is for a skin condition. I've run out. Can you just refill it once [interrupt] more as a special exception while I arrange an appointment with another healthcare provider who can assess my condition properly? \nB: I completely understand your urgency, but we really can't do it. We must follow the prescription, and this one has run out. \nA: But I need it. Please. Refill it for me just this once. I can go to the doctor around ten days from now. Then I'll have another prescription. \nB: Miss, I understand your problem. But it is against the law for us to sell certain medicines without a valid prescription. It's the law. I can't do anything about it. We never sell medicine unless we have a proper prescription. Never. \nA: But I have a prescription. I just need more of it. \nB: A prescription must be valid. It cannot be an expired prescription. I'm sorry, Miss. You'll have to find another doctor who will prescribe this for you.", + "cleaned_text": "A: Excuse me. I need to refill this prescription. \nB: It says on the bottle here that you can have two refills. \nA: Yes, I need to refill it today. \nB:Alright. I'm sorry, Miss. According to our file, this prescription has already been refilled twice within the past month, which means we cannot process another refill until you obtain a new prescription from your doctor.\nA: Oh, wait—are you sure? I was worried about that. I couldn't remember if I had it refilled twice yet or not. \nB: It looks like you have. You will need to see your doctor to get a new prescription. \nA:Listen. This is an emergency. I tried to call my doctor, but he is out of town. So I can't see him in time. I need this medicine. It is for a skin condition. I've run out. Can you just refill it once more as a special exception while I arrange an appointment with another healthcare provider who can assess my condition properly?\nB: I completely understand your urgency, but we really can't do it. We must follow the prescription, and this one has run out. \nA: But I need it. Please. Refill it for me just this once. I can go to the doctor around ten days from now. Then I'll have another prescription. \nB: Miss, I understand your problem. But it is against the law for us to sell certain medicines without a valid prescription. It's the law. I can't do anything about it. We never sell medicine unless we have a proper prescription. Never. \nA: But I have a prescription. I just need more of it. \nB: A prescription must be valid. It cannot be an expired prescription. I'm sorry, Miss. You'll have to find another doctor who will prescribe this for you.", + "total_duration": 86.67709750566894, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. I need to refill this prescription.", + "original_text": "Excuse me. I need to refill this prescription.", + "start_time": 0, + "end_time": 3.355283446712018, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It says on the bottle here that you can have two refills.", + "original_text": "It says on the bottle here that you can have two refills.", + "start_time": 3.930655488871182, + "end_time": 6.600950273451681, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_1_B.wav", + "silence_duration": 0.5753720421591639, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I need to refill it today.", + "original_text": "Yes, I need to refill it today.", + "start_time": 6.981073596458716, + "end_time": 9.14052937877164, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_2_A.wav", + "silence_duration": 0.38012332300703466, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Alright. I'm sorry, Miss. According to our file, this prescription has already been refilled", + "original_text": "Alright. I'm sorry, Miss. According to our file, this prescription has already been refilled [interrupt] twice within the past month, which means we cannot process another refill until you obtain a new prescription from your doctor.", + "start_time": 9.504392395160181, + "end_time": 20.66158060377696, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_3_B.wav", + "silence_duration": 0.36386301638854135, + "is_interrupted": true, + "text_after_interrupt": "twice within the past month, which means we cannot process another refill until you obtain a new prescription from your doctor." + }, + { + "speaker": "A", + "text": "Oh, wait—are you sure? I was worried about that. I couldn't remember if I had it refilled twice yet or not.", + "original_text": "Oh, wait—are you sure? I was worried about that. I couldn't remember if I had it refilled twice yet or not.", + "start_time": 15.100401465454965, + "end_time": 21.79935838155474, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_4_A.wav", + "silence_duration": 0.5987125470464179, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It looks like you have. You will need to see your doctor to get a new prescription.", + "original_text": "It looks like you have. You will need to see your doctor to get a new prescription.", + "start_time": 22.395864204622182, + "end_time": 26.424526336141454, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_5_B.wav", + "silence_duration": 0.596505823067441, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Listen. This is an emergency. I tried to call my doctor, but he is out of town. So I can't see him in time. I need this medicine. It is for a skin condition. I've run out. Can you just refill it once", + "original_text": "Listen. This is an emergency. I tried to call my doctor, but he is out of town. So I can't see him in time. I need this medicine. It is for a skin condition. I've run out. Can you just refill it once [interrupt] more as a special exception while I arrange an appointment with another healthcare provider who can assess my condition properly?", + "start_time": 26.775580736218167, + "end_time": 46.79118164324765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_6_A.wav", + "silence_duration": 0.351054400076713, + "is_interrupted": true, + "text_after_interrupt": "more as a special exception while I arrange an appointment with another healthcare provider who can assess my condition properly?" + }, + { + "speaker": "B", + "text": "I completely understand your urgency, but we really can't do it. We must follow the prescription, and this one has run out.", + "original_text": "I completely understand your urgency, but we really can't do it. We must follow the prescription, and this one has run out.", + "start_time": 46.202040592239726, + "end_time": 52.81972766706966, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_7_B.wav", + "silence_duration": 0.45195281649848484, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But I need it. Please. Refill it for me just this once. I can go to the doctor around ten days from now. Then I'll have another prescription.", + "original_text": "But I need it. Please. Refill it for me just this once. I can go to the doctor around ten days from now. Then I'll have another prescription.", + "start_time": 53.38415060313244, + "end_time": 61.89426398181725, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_8_A.wav", + "silence_duration": 0.5644229360627855, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Miss, I understand your problem. But it is against the law for us to sell certain medicines without a valid prescription. It's the law. I can't do anything about it. We never sell medicine unless we have a proper prescription. Never.", + "original_text": "Miss, I understand your problem. But it is against the law for us to sell certain medicines without a valid prescription. It's the law. I can't do anything about it. We never sell medicine unless we have a proper prescription. Never.", + "start_time": 62.20954849301133, + "end_time": 74.00528545446258, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_9_B.wav", + "silence_duration": 0.315284511194088, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "But I have a prescription. I just need more of it.", + "original_text": "But I have a prescription. I just need more of it.", + "start_time": 74.58516944496603, + "end_time": 77.91723293702952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_10_A.wav", + "silence_duration": 0.5798839905034536, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "A prescription must be valid. It cannot be an expired prescription. I'm sorry, Miss. You'll have to find another doctor who will prescribe this for you.", + "original_text": "A prescription must be valid. It cannot be an expired prescription. I'm sorry, Miss. You'll have to find another doctor who will prescribe this for you.", + "start_time": 78.50370641016806, + "end_time": 86.67713044644924, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--402/temp/line_11_B.wav", + "silence_duration": 0.5864734731385404, + "is_interrupted": false + } + ] + }, + "DialogSum--val--403": { + "original_text": "A: Do you consider yourself a good mother? \nB: Yes, I'm a very good mother and successful career woman. \nA: How can you manage to do both? I mean, it is so hard to be a working mother. \nB: I think the most important thing is that you should be nice to yourself, like keeping housework simple, spending money on things that make life easier, buying yourself things you like, and so [interrupt] you don't feel overwhelmed by the pressure of doing everything perfectly while still maintaining a healthy work-life balance and setting realistic expectations for yourself and your family. \nA: Sorry to jump in, but I'm curious—what specific things do you spend money on to make life easier? \nB: Oh, small things really, like hiring a cleaner once a week or buying pre-prepared meals. But as I was saying, you can only be nice to others when you can be nice to yourself. \nA: That makes sense. Does your husband feel the same? \nB: Yes. He is very understanding and supportive.", + "cleaned_text": "A: Do you consider yourself a good mother? \nB: Yes, I'm a very good mother and successful career woman. \nA: How can you manage to do both? I mean, it is so hard to be a working mother. \nB:I think the most important thing is that you should be nice to yourself, like keeping housework simple, spending money on things that make life easier, buying yourself things you like, and so you don't feel overwhelmed by the pressure of doing everything perfectly while still maintaining a healthy work-life balance and setting realistic expectations for yourself and your family.\nA: Sorry to jump in, but I'm curious—what specific things do you spend money on to make life easier? \nB: Oh, small things really, like hiring a cleaner once a week or buying pre-prepared meals. But as I was saying, you can only be nice to others when you can be nice to yourself. \nA: That makes sense. Does your husband feel the same? \nB: Yes. He is very understanding and supportive.", + "total_duration": 45.681224489795916, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you consider yourself a good mother?", + "original_text": "Do you consider yourself a good mother?", + "start_time": 0, + "end_time": 2.0317460317460316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I'm a very good mother and successful career woman.", + "original_text": "Yes, I'm a very good mother and successful career woman.", + "start_time": 2.4758903062433655, + "end_time": 5.494484410551756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_1_B.wav", + "silence_duration": 0.4441442744973336, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How can you manage to do both? I mean, it is so hard to be a working mother.", + "original_text": "How can you manage to do both? I mean, it is so hard to be a working mother.", + "start_time": 6.042191439635406, + "end_time": 11.080921598365565, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_2_A.wav", + "silence_duration": 0.5477070290836499, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I think the most important thing is that you should be nice to yourself, like keeping housework simple, spending money on things that make life easier, buying yourself things you like, and so", + "original_text": "I think the most important thing is that you should be nice to yourself, like keeping housework simple, spending money on things that make life easier, buying yourself things you like, and so [interrupt] you don't feel overwhelmed by the pressure of doing everything perfectly while still maintaining a healthy work-life balance and setting realistic expectations for yourself and your family.", + "start_time": 11.674465584779488, + "end_time": 29.228751299065202, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_3_B.wav", + "silence_duration": 0.5935439864139236, + "is_interrupted": true, + "text_after_interrupt": "you don't feel overwhelmed by the pressure of doing everything perfectly while still maintaining a healthy work-life balance and setting realistic expectations for yourself and your family." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I'm curious—what specific things do you spend money on to make life easier?", + "original_text": "Sorry to jump in, but I'm curious—what specific things do you spend money on to make life easier?", + "start_time": 20.683807988407608, + "end_time": 27.33632499521033, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_4_A.wav", + "silence_duration": 0.4098866553995528, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, small things really, like hiring a cleaner once a week or buying pre-prepared meals. But as I was saying, you can only be nice to others when you can be nice to yourself.", + "original_text": "Oh, small things really, like hiring a cleaner once a week or buying pre-prepared meals. But as I was saying, you can only be nice to others when you can be nice to yourself.", + "start_time": 29.769262067606466, + "end_time": 38.99919404039558, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_5_B.wav", + "silence_duration": 0.5405107685412652, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That makes sense. Does your husband feel the same?", + "original_text": "That makes sense. Does your husband feel the same?", + "start_time": 39.51324470024473, + "end_time": 42.682768509768536, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_6_A.wav", + "silence_duration": 0.5140506598491484, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. He is very understanding and supportive.", + "original_text": "Yes. He is very understanding and supportive.", + "start_time": 43.15027911110542, + "end_time": 45.68125416779476, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--403/temp/line_7_B.wav", + "silence_duration": 0.4675106013368866, + "is_interrupted": false + } + ] + }, + "DialogSum--val--405": { + "original_text": "A: Taxi! Taxi!\nB: Where to, sir?\nA: I'd like to go to the railway station [interrupt] and I hope we can get there without too much delay because I have an important meeting to attend right after arriving at my destination.\nB: Sorry to interrupt, but which railway station are you referring to? There are a couple in the city.\nA: Oh, the central station, please.\nB: Please hop in.\nA: Is it a long run to the station?\nB: It'll take about 20 minutes.\nA: The streets are heavy with traffic at this time of a day, are [interrupt] they usually this congested during rush hour, or is there some special event causing additional delays today?\nB: Yes, they are. And it's the rush hour, so there might be some delays.\nA: Right, is it the rush hour?\nB: Yes, it is. Are you in a hurry, sir?\nA: No, I'm not. Would you please drive slowly and carefully?\nB: Yes, sir.", + "cleaned_text": "A: Taxi! Taxi!\nB: Where to, sir?\nA:I'd like to go to the railway station and I hope we can get there without too much delay because I have an important meeting to attend right after arriving at my destination.\nB: Sorry to interrupt, but which railway station are you referring to? There are a couple in the city.\nA: Oh, the central station, please.\nB: Please hop in.\nA: Is it a long run to the station?\nB: It'll take about 20 minutes.\nA:The streets are heavy with traffic at this time of a day, are they usually this congested during rush hour, or is there some special event causing additional delays today?\nB: Yes, they are. And it's the rush hour, so there might be some delays.\nA: Right, is it the rush hour?\nB: Yes, it is. Are you in a hurry, sir?\nA: No, I'm not. Would you please drive slowly and carefully?\nB: Yes, sir.", + "total_duration": 44.33265306122449, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Taxi! Taxi!", + "original_text": "Taxi! Taxi!", + "start_time": 0, + "end_time": 1.3699773242630386, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Where to, sir?", + "original_text": "Where to, sir?", + "start_time": 1.9526653903025042, + "end_time": 2.9279034855405994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_1_B.wav", + "silence_duration": 0.5826880660394655, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'd like to go to the railway station", + "original_text": "I'd like to go to the railway station [interrupt] and I hope we can get there without too much delay because I have an important meeting to attend right after arriving at my destination.", + "start_time": 3.25079198982769, + "end_time": 13.119272715451272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_2_A.wav", + "silence_duration": 0.3228885042870904, + "is_interrupted": true, + "text_after_interrupt": "and I hope we can get there without too much delay because I have an important meeting to attend right after arriving at my destination." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but which railway station are you referring to? There are a couple in the city.", + "original_text": "Sorry to interrupt, but which railway station are you referring to? There are a couple in the city.", + "start_time": 5.363807862843563, + "end_time": 10.518637794816353, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_3_B.wav", + "silence_duration": 0.5536620901580552, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, the central station, please.", + "original_text": "Oh, the central station, please.", + "start_time": 13.548666788425857, + "end_time": 15.557192865523362, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_4_A.wav", + "silence_duration": 0.4293940729745851, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Please hop in.", + "original_text": "Please hop in.", + "start_time": 15.958579511127418, + "end_time": 16.829327810447147, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_5_B.wav", + "silence_duration": 0.4013866456040564, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is it a long run to the station?", + "original_text": "Is it a long run to the station?", + "start_time": 17.214138984844663, + "end_time": 18.862755764890014, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_6_A.wav", + "silence_duration": 0.384811174397517, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It'll take about 20 minutes.", + "original_text": "It'll take about 20 minutes.", + "start_time": 19.325265255461904, + "end_time": 20.857782262264625, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_7_B.wav", + "silence_duration": 0.46250949057188934, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The streets are heavy with traffic at this time of a day, are", + "original_text": "The streets are heavy with traffic at this time of a day, are [interrupt] they usually this congested during rush hour, or is there some special event causing additional delays today?", + "start_time": 21.347838504494568, + "end_time": 31.262759139415202, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_8_A.wav", + "silence_duration": 0.49005624222994393, + "is_interrupted": true, + "text_after_interrupt": "they usually this congested during rush hour, or is there some special event causing additional delays today?" + }, + { + "speaker": "B", + "text": "Yes, they are. And it's the rush hour, so there might be some delays.", + "original_text": "Yes, they are. And it's the rush hour, so there might be some delays.", + "start_time": 30.259662761437383, + "end_time": 33.91680561858024, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_9_B.wav", + "silence_duration": 0.4286049165677468, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Right, is it the rush hour?", + "original_text": "Right, is it the rush hour?", + "start_time": 34.27515400046859, + "end_time": 35.97021068981099, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_10_A.wav", + "silence_duration": 0.35834838188835144, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it is. Are you in a hurry, sir?", + "original_text": "Yes, it is. Are you in a hurry, sir?", + "start_time": 36.3430953188094, + "end_time": 38.75797060225611, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_11_B.wav", + "silence_duration": 0.37288462899840374, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, I'm not. Would you please drive slowly and carefully?", + "original_text": "No, I'm not. Would you please drive slowly and carefully?", + "start_time": 39.233341580621236, + "end_time": 43.111074006925094, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_12_A.wav", + "silence_duration": 0.4753709783651254, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, sir.", + "original_text": "Yes, sir.", + "start_time": 43.63606320835387, + "end_time": 44.332661847809646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--405/temp/line_13_B.wav", + "silence_duration": 0.5249892014287751, + "is_interrupted": false + } + ] + }, + "DialogSum--val--406": { + "original_text": "A: Look at the catalogue, John. I think I want to get this red blouse [interrupt] and maybe the matching skirt too because the fabric looks really comfortable and the design would be perfect for both casual outings and more formal occasions.\nB: Don't you already have one in blue? \nA: Yah, but it doesn't have a red one. \nB: Do you really need every color in the rainbow? \nA: Yes! Oh, and by the way, I didn't get to mention that the blue one is a bit different in style. \nB: Ze ze ze. . . Women!", + "cleaned_text": "A:Look at the catalogue, John. I think I want to get this red blouse and maybe the matching skirt too because the fabric looks really comfortable and the design would be perfect for both casual outings and more formal occasions.\nB: Don't you already have one in blue? \nA: Yah, but it doesn't have a red one. \nB: Do you really need every color in the rainbow? \nA: Yes! Oh, and by the way, I didn't get to mention that the blue one is a bit different in style. \nB: Ze ze ze. . . Women!", + "total_duration": 26.379183673469388, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Look at the catalogue, John. I think I want to get this red blouse", + "original_text": "Look at the catalogue, John. I think I want to get this red blouse [interrupt] and maybe the matching skirt too because the fabric looks really comfortable and the design would be perfect for both casual outings and more formal occasions.", + "start_time": 0, + "end_time": 12.898684807256236, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "and maybe the matching skirt too because the fabric looks really comfortable and the design would be perfect for both casual outings and more formal occasions." + }, + { + "speaker": "B", + "text": "Don't you already have one in blue?", + "original_text": "Don't you already have one in blue?", + "start_time": 3.633922902494331, + "end_time": 5.328979591836735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/temp/line_1_B.wav", + "silence_duration": 0.5091196430977283, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yah, but it doesn't have a red one.", + "original_text": "Yah, but it doesn't have a red one.", + "start_time": 13.342477534995384, + "end_time": 15.815402705063411, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/temp/line_2_A.wav", + "silence_duration": 0.44379272773914813, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you really need every color in the rainbow?", + "original_text": "Do you really need every color in the rainbow?", + "start_time": 16.304576491421635, + "end_time": 18.49886220570735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/temp/line_3_B.wav", + "silence_duration": 0.48917378635822256, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes! Oh, and by the way, I didn't get to mention that the blue one is a bit different in style.", + "original_text": "Yes! Oh, and by the way, I didn't get to mention that the blue one is a bit different in style.", + "start_time": 18.957238153099457, + "end_time": 24.6925669512854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/temp/line_4_A.wav", + "silence_duration": 0.45837594739210563, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Ze ze ze. . . Women!", + "original_text": "Ze ze ze. . . Women!", + "start_time": 25.067258976474925, + "end_time": 26.37918641411665, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--406/temp/line_5_B.wav", + "silence_duration": 0.37469202518952455, + "is_interrupted": false + } + ] + }, + "DialogSum--val--407": { + "original_text": "A: What's your favorite hobby? \nB: I'd like reading books best. \nA: What kinds of books do you like to [interrupt] explore in your free time? I'm particularly interested in knowing whether you prefer classic literature, contemporary works, or perhaps even experimental writing styles that challenge traditional storytelling. \nB: Sorry to jump in, but do you have any recommendations for good literature? I've been looking for something new to read. \nA: Oh, definitely! I can suggest a few. But before that, I was asking what kinds of books you like to read? \nB: Oh, right! I enjoy literature and economy mostly. \nA: By the way, would you like to see [interrupt] some book recommendations tailored to those genres? I've recently discovered several fascinating economic analyses that blend historical context with modern financial theories, which might interest you. \nB: Speaking of books, do you ever read while traveling? I find it relaxing. \nA: Sometimes, but I was actually asking if you'd like to see movies? \nB: That's OK. \nA: What do you do in your spare time? \nB: I like to play golf, play badminton or crack jokes. \nA: I just like to sleep like a lazy cat. \nB: That's a bad habit.", + "cleaned_text": "A: What's your favorite hobby? \nB: I'd like reading books best. \nA:What kinds of books do you like to explore in your free time? I'm particularly interested in knowing whether you prefer classic literature, contemporary works, or perhaps even experimental writing styles that challenge traditional storytelling.\nB: Sorry to jump in, but do you have any recommendations for good literature? I've been looking for something new to read. \nA: Oh, definitely! I can suggest a few. But before that, I was asking what kinds of books you like to read? \nB: Oh, right! I enjoy literature and economy mostly. \nA:By the way, would you like to see some book recommendations tailored to those genres? I've recently discovered several fascinating economic analyses that blend historical context with modern financial theories, which might interest you.\nB: Speaking of books, do you ever read while traveling? I find it relaxing. \nA: Sometimes, but I was actually asking if you'd like to see movies? \nB: That's OK. \nA: What do you do in your spare time? \nB: I like to play golf, play badminton or crack jokes. \nA: I just like to sleep like a lazy cat. \nB: That's a bad habit.", + "total_duration": 58.15736961451247, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What's your favorite hobby?", + "original_text": "What's your favorite hobby?", + "start_time": 0, + "end_time": 1.3351473922902495, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like reading books best.", + "original_text": "I'd like reading books best.", + "start_time": 1.6653409753813218, + "end_time": 3.1049781635899385, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_1_B.wav", + "silence_duration": 0.33019358309107233, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What kinds of books do you like to", + "original_text": "What kinds of books do you like to [interrupt] explore in your free time? I'm particularly interested in knowing whether you prefer classic literature, contemporary works, or perhaps even experimental writing styles that challenge traditional storytelling.", + "start_time": 3.613206327990047, + "end_time": 17.812208595563742, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_2_A.wav", + "silence_duration": 0.5082281644001087, + "is_interrupted": true, + "text_after_interrupt": "explore in your free time? I'm particularly interested in knowing whether you prefer classic literature, contemporary works, or perhaps even experimental writing styles that challenge traditional storytelling." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you have any recommendations for good literature? I've been looking for something new to read.", + "original_text": "Sorry to jump in, but do you have any recommendations for good literature? I've been looking for something new to read.", + "start_time": 5.552072541141975, + "end_time": 11.786630364271225, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_3_B.wav", + "silence_duration": 0.5113398665547367, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, definitely! I can suggest a few. But before that, I was asking what kinds of books you like to read?", + "original_text": "Oh, definitely! I can suggest a few. But before that, I was asking what kinds of books you like to read?", + "start_time": 18.19535568422305, + "end_time": 24.46474343932509, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_4_A.wav", + "silence_duration": 0.3831470886593077, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! I enjoy literature and economy mostly.", + "original_text": "Oh, right! I enjoy literature and economy mostly.", + "start_time": 24.939909304485234, + "end_time": 27.912063499496572, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_5_B.wav", + "silence_duration": 0.4751658651601448, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "By the way, would you like to see", + "original_text": "By the way, would you like to see [interrupt] some book recommendations tailored to those genres? I've recently discovered several fascinating economic analyses that blend historical context with modern financial theories, which might interest you.", + "start_time": 28.31054613416073, + "end_time": 43.51961642894531, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_6_A.wav", + "silence_duration": 0.3984826346641595, + "is_interrupted": true, + "text_after_interrupt": "some book recommendations tailored to those genres? I've recently discovered several fascinating economic analyses that blend historical context with modern financial theories, which might interest you." + }, + { + "speaker": "B", + "text": "Speaking of books, do you ever read while traveling? I find it relaxing.", + "original_text": "Speaking of books, do you ever read while traveling? I find it relaxing.", + "start_time": 37.1514637096044, + "end_time": 41.389105432960406, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_7_B.wav", + "silence_duration": 0.37211545620497033, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sometimes, but I was actually asking if you'd like to see movies?", + "original_text": "Sometimes, but I was actually asking if you'd like to see movies?", + "start_time": 43.861620163418976, + "end_time": 47.55359295253462, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_8_A.wav", + "silence_duration": 0.3420037344736671, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's OK.", + "original_text": "That's OK.", + "start_time": 47.90409630677534, + "end_time": 48.69357476482522, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_9_B.wav", + "silence_duration": 0.3505033542407126, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What do you do in your spare time?", + "original_text": "What do you do in your spare time?", + "start_time": 49.05155093710427, + "end_time": 51.002027127580455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_10_A.wav", + "silence_duration": 0.3579761722790442, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like to play golf, play badminton or crack jokes.", + "original_text": "I like to play golf, play badminton or crack jokes.", + "start_time": 51.37044033026643, + "end_time": 54.1452249107653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_11_B.wav", + "silence_duration": 0.36841320268597716, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I just like to sleep like a lazy cat.", + "original_text": "I just like to sleep like a lazy cat.", + "start_time": 54.4827107229791, + "end_time": 56.73504632388613, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_12_A.wav", + "silence_duration": 0.3374858122137963, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a bad habit.", + "original_text": "That's a bad habit.", + "start_time": 57.042826284097565, + "end_time": 58.15738410722682, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--407/temp/line_13_B.wav", + "silence_duration": 0.3077799602114329, + "is_interrupted": false + } + ] + }, + "DialogSum--val--408": { + "original_text": "A: Is this seat taken? \nB: No. Please sit down. \nA: Thanks. \nB: Are you also going to Beijing? \nA: Yes, on a business trip. How about you? \nB: I'm taking a vacation to visit a friend there. Have you ever been there before? \nA: Yes, I went there once last summer. \nB: Really? What did you think? \nA: I think it is amazing. You can enjoy both the traditional Chinese culture as well as the vitality of a modern cosmopolitan city. The only thing I didn't enjoy was the [interrupt] subway during rush hour. It was so packed that it was hard to move, and sometimes you'd have to wait for multiple trains before even being able to squeeze in. \nB: Speaking of the subway, I've heard it's quite extensive. But what do you mean by not enjoying it? \nA: Oh, I was going to say the subway was too crowded. There were always so many people. After taking the subway during the rush hour, you'll envy sardines in their cans. \nB: Oh, maybe I can take the bus or even rent a car. By the way, you were mentioning something about the subway before I interrupted—what else didn't you enjoy? \nA: Ah, nothing major, just the rush hour crowds. Other than that, the transportation system is very efficient.", + "cleaned_text": "A: Is this seat taken? \nB: No. Please sit down. \nA: Thanks. \nB: Are you also going to Beijing? \nA: Yes, on a business trip. How about you? \nB: I'm taking a vacation to visit a friend there. Have you ever been there before? \nA: Yes, I went there once last summer. \nB: Really? What did you think? \nA:I think it is amazing. You can enjoy both the traditional Chinese culture as well as the vitality of a modern cosmopolitan city. The only thing I didn't enjoy was the subway during rush hour. It was so packed that it was hard to move, and sometimes you'd have to wait for multiple trains before even being able to squeeze in.\nB: Speaking of the subway, I've heard it's quite extensive. But what do you mean by not enjoying it? \nA: Oh, I was going to say the subway was too crowded. There were always so many people. After taking the subway during the rush hour, you'll envy sardines in their cans. \nB: Oh, maybe I can take the bus or even rent a car. By the way, you were mentioning something about the subway before I interrupted—what else didn't you enjoy? \nA: Ah, nothing major, just the rush hour crowds. Other than that, the transportation system is very efficient.", + "total_duration": 66.27696145124716, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is this seat taken?", + "original_text": "Is this seat taken?", + "start_time": 0, + "end_time": 1.253877551020408, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. Please sit down.", + "original_text": "No. Please sit down.", + "start_time": 1.70927963712544, + "end_time": 3.3578964171707915, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_1_B.wav", + "silence_duration": 0.45540208610503186, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks.", + "original_text": "Thanks.", + "start_time": 3.837890456112075, + "end_time": 4.557709050216383, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_2_A.wav", + "silence_duration": 0.4799940389412838, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Are you also going to Beijing?", + "original_text": "Are you also going to Beijing?", + "start_time": 4.9909938914908505, + "end_time": 6.384191170402415, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_3_B.wav", + "silence_duration": 0.43328484127446776, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, on a business trip. How about you?", + "original_text": "Yes, on a business trip. How about you?", + "start_time": 6.9632061637507014, + "end_time": 9.900530426789249, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_4_A.wav", + "silence_duration": 0.5790149933482862, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm taking a vacation to visit a friend there. Have you ever been there before?", + "original_text": "I'm taking a vacation to visit a friend there. Have you ever been there before?", + "start_time": 10.318769649670731, + "end_time": 14.277771917244428, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_5_B.wav", + "silence_duration": 0.41823922288148113, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I went there once last summer.", + "original_text": "Yes, I went there once last summer.", + "start_time": 14.670649068953768, + "end_time": 17.00425451113064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_6_A.wav", + "silence_duration": 0.3928771517093399, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Really? What did you think?", + "original_text": "Really? What did you think?", + "start_time": 17.515674074137667, + "end_time": 19.326830536722703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_7_B.wav", + "silence_duration": 0.5114195630070261, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think it is amazing. You can enjoy both the traditional Chinese culture as well as the vitality of a modern cosmopolitan city. The only thing I didn't enjoy was the", + "original_text": "I think it is amazing. You can enjoy both the traditional Chinese culture as well as the vitality of a modern cosmopolitan city. The only thing I didn't enjoy was the [interrupt] subway during rush hour. It was so packed that it was hard to move, and sometimes you'd have to wait for multiple trains before even being able to squeeze in.", + "start_time": 19.79969486406168, + "end_time": 39.455386474039, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_8_A.wav", + "silence_duration": 0.472864327338978, + "is_interrupted": true, + "text_after_interrupt": "subway during rush hour. It was so packed that it was hard to move, and sometimes you'd have to wait for multiple trains before even being able to squeeze in." + }, + { + "speaker": "B", + "text": "Speaking of the subway, I've heard it's quite extensive. But what do you mean by not enjoying it?", + "original_text": "Speaking of the subway, I've heard it's quite extensive. But what do you mean by not enjoying it?", + "start_time": 30.817563344787303, + "end_time": 35.35706447857415, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_9_B.wav", + "silence_duration": 0.35113917246368453, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I was going to say the subway was too crowded. There were always so many people. After taking the subway during the rush hour, you'll envy sardines in their cans.", + "original_text": "Oh, I was going to say the subway was too crowded. There were always so many people. After taking the subway during the rush hour, you'll envy sardines in their cans.", + "start_time": 39.96192350436984, + "end_time": 49.95811398056032, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_10_A.wav", + "silence_duration": 0.5065370303308409, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, maybe I can take the bus or even rent a car. By the way, you were mentioning something about the subway before I interrupted—what else didn't you enjoy?", + "original_text": "Oh, maybe I can take the bus or even rent a car. By the way, you were mentioning something about the subway before I interrupted—what else didn't you enjoy?", + "start_time": 50.543888204224714, + "end_time": 58.078763487671424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_11_B.wav", + "silence_duration": 0.5857742236643958, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah, nothing major, just the rush hour crowds. Other than that, the transportation system is very efficient.", + "original_text": "Ah, nothing major, just the rush hour crowds. Other than that, the transportation system is very efficient.", + "start_time": 58.626026004716216, + "end_time": 66.27700106140556, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--408/temp/line_12_A.wav", + "silence_duration": 0.5472625170447948, + "is_interrupted": false + } + ] + }, + "DialogSum--val--414": { + "original_text": "A: How do you use an ATM card, Billy? \nB: It's easy, Grandpa. Insert your card into the machine here. Then wait a moment. Ok. Now you enter your PIN. It should have four [interrupt] digits, and make sure you remember them because the ATM will automatically lock your card if you enter the wrong PIN three times in a row for security reasons. \nA: Oh yes. I've got it written down here. Just a minute. \nB: You really shouldn't write it down. You should memorize it. You can change it to a more convenient number if you like. But, Grandpa, did you catch what I said about the PIN needing to be four numbers? \nA: Oh, yes, I did. Ok, I've entered my PIN. There are several options on the screen. I guess I just choose which service I want, don't I? \nB: Yes. Choose the service you need to use. If you choose to withdraw money, the machine will ask you how much you [interrupt] want to take out and then it will dispense the cash along with a receipt that shows your remaining balance and transaction details for your records. \nA: I can just enter the amount using the keys, right? \nB: That's right. Give the machine a moment to process your request. Then take your money.", + "cleaned_text": "A: How do you use an ATM card, Billy? \nB:It's easy, Grandpa. Insert your card into the machine here. Then wait a moment. Ok. Now you enter your PIN. It should have four digits, and make sure you remember them because the ATM will automatically lock your card if you enter the wrong PIN three times in a row for security reasons.\nA: Oh yes. I've got it written down here. Just a minute. \nB: You really shouldn't write it down. You should memorize it. You can change it to a more convenient number if you like. But, Grandpa, did you catch what I said about the PIN needing to be four numbers? \nA: Oh, yes, I did. Ok, I've entered my PIN. There are several options on the screen. I guess I just choose which service I want, don't I? \nB:Yes. Choose the service you need to use. If you choose to withdraw money, the machine will ask you how much you want to take out and then it will dispense the cash along with a receipt that shows your remaining balance and transaction details for your records.\nA: I can just enter the amount using the keys, right? \nB: That's right. Give the machine a moment to process your request. Then take your money.", + "total_duration": 54.20448979591837, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How do you use an ATM card, Billy?", + "original_text": "How do you use an ATM card, Billy?", + "start_time": 0, + "end_time": 2.2175056689342405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's easy, Grandpa. Insert your card into the machine here. Then wait a moment. Ok. Now you enter your PIN. It should have four", + "original_text": "It's easy, Grandpa. Insert your card into the machine here. Then wait a moment. Ok. Now you enter your PIN. It should have four [interrupt] digits, and make sure you remember them because the ATM will automatically lock your card if you enter the wrong PIN three times in a row for security reasons.", + "start_time": 2.730150505407873, + "end_time": 17.347111956655038, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_1_B.wav", + "silence_duration": 0.5126448364736325, + "is_interrupted": true, + "text_after_interrupt": "digits, and make sure you remember them because the ATM will automatically lock your card if you enter the wrong PIN three times in a row for security reasons." + }, + { + "speaker": "A", + "text": "Oh yes. I've got it written down here. Just a minute.", + "original_text": "Oh yes. I've got it written down here. Just a minute.", + "start_time": 9.208517852346649, + "end_time": 12.366431684546196, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_2_A.wav", + "silence_duration": 0.3245425701019421, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You really shouldn't write it down. You should memorize it. You can change it to a more convenient number if you like. But, Grandpa, did you catch what I said about the PIN needing to be four numbers?", + "original_text": "You really shouldn't write it down. You should memorize it. You can change it to a more convenient number if you like. But, Grandpa, did you catch what I said about the PIN needing to be four numbers?", + "start_time": 17.85902770785552, + "end_time": 27.855218184045995, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_3_B.wav", + "silence_duration": 0.5119157512004828, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, yes, I did. Ok, I've entered my PIN. There are several options on the screen. I guess I just choose which service I want, don't I?", + "original_text": "Oh, yes, I did. Ok, I've entered my PIN. There are several options on the screen. I guess I just choose which service I want, don't I?", + "start_time": 28.416972819045718, + "end_time": 36.393027240814426, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_4_A.wav", + "silence_duration": 0.5617546349997213, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. Choose the service you need to use. If you choose to withdraw money, the machine will ask you how much you", + "original_text": "Yes. Choose the service you need to use. If you choose to withdraw money, the machine will ask you how much you [interrupt] want to take out and then it will dispense the cash along with a receipt that shows your remaining balance and transaction details for your records.", + "start_time": 36.716181962634735, + "end_time": 49.45232708735129, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_5_B.wav", + "silence_duration": 0.3231547218203088, + "is_interrupted": true, + "text_after_interrupt": "want to take out and then it will dispense the cash along with a receipt that shows your remaining balance and transaction details for your records." + }, + { + "speaker": "A", + "text": "I can just enter the amount using the keys, right?", + "original_text": "I can just enter the amount using the keys, right?", + "start_time": 46.28921706066073, + "end_time": 49.16849143707797, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_6_A.wav", + "silence_duration": 0.3306035998004085, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's right. Give the machine a moment to process your request. Then take your money.", + "original_text": "That's right. Give the machine a moment to process your request. Then take your money.", + "start_time": 49.87399288589299, + "end_time": 54.2045144278431, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--414/temp/line_7_B.wav", + "silence_duration": 0.4216657985416927, + "is_interrupted": false + } + ] + }, + "DialogSum--val--415": { + "original_text": "A: How are you doing? \nB: I'm pretty good, you? \nA: I'm awesome. \nB: How long have you been on the bus? \nA: I've been on here for like, 15 [interrupt] minutes or so, which is actually not too bad considering the usual traffic at this time of day. \nB: 15 minutes? I just got on myself. Do you catch this bus a lot? \nA: Not much, I have a car. \nB: So, you have your own car? \nA: I sure do. \nB: Then, why are you on the bus with me? \nA: I'm waiting till our President gets out of office, and the gas prices [interrupt] hopefully start to drop significantly so I can save some money while still getting around conveniently. \nB: Oh, that makes sense. But wait, how long did you say you've been on the bus again? \nA: About 15 minutes. And yeah, I'm hoping the gas prices go down soon. \nB: That's good thinking.", + "cleaned_text": "A: How are you doing? \nB: I'm pretty good, you? \nA: I'm awesome. \nB: How long have you been on the bus? \nA:I've been on here for like, 15 minutes or so, which is actually not too bad considering the usual traffic at this time of day.\nB: 15 minutes? I just got on myself. Do you catch this bus a lot? \nA: Not much, I have a car. \nB: So, you have your own car? \nA: I sure do. \nB: Then, why are you on the bus with me? \nA:I'm waiting till our President gets out of office, and the gas prices hopefully start to drop significantly so I can save some money while still getting around conveniently.\nB: Oh, that makes sense. But wait, how long did you say you've been on the bus again? \nA: About 15 minutes. And yeah, I'm hoping the gas prices go down soon. \nB: That's good thinking.", + "total_duration": 41.18938775510204, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How are you doing?", + "original_text": "How are you doing?", + "start_time": 0, + "end_time": 0.9984580498866213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm pretty good, you?", + "original_text": "I'm pretty good, you?", + "start_time": 1.3446263878501683, + "end_time": 2.494014142952209, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_1_B.wav", + "silence_duration": 0.34616833796354707, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm awesome.", + "original_text": "I'm awesome.", + "start_time": 2.9326607251923225, + "end_time": 4.128488389591416, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_2_A.wav", + "silence_duration": 0.43864658224011355, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How long have you been on the bus?", + "original_text": "How long have you been on the bus?", + "start_time": 4.693717434189788, + "end_time": 6.144964599722668, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_3_B.wav", + "silence_duration": 0.5652290445983721, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I've been on here for like, 15", + "original_text": "I've been on here for like, 15 [interrupt] minutes or so, which is actually not too bad considering the usual traffic at this time of day.", + "start_time": 6.612932615487079, + "end_time": 14.171027853582316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_4_A.wav", + "silence_duration": 0.46796801576441094, + "is_interrupted": true, + "text_after_interrupt": "minutes or so, which is actually not too bad considering the usual traffic at this time of day." + }, + { + "speaker": "B", + "text": "15 minutes? I just got on myself. Do you catch this bus a lot?", + "original_text": "15 minutes? I just got on myself. Do you catch this bus a lot?", + "start_time": 8.772388397800004, + "end_time": 12.38309134564581, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_5_B.wav", + "silence_duration": 0.30532414092574234, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Not much, I have a car.", + "original_text": "Not much, I have a car.", + "start_time": 14.56159437056919, + "end_time": 16.337920901181434, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_6_A.wav", + "silence_duration": 0.3905665169868736, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "So, you have your own car?", + "original_text": "So, you have your own car?", + "start_time": 16.88741115856384, + "end_time": 18.245778505502614, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_7_B.wav", + "silence_duration": 0.5494902573824054, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I sure do.", + "original_text": "I sure do.", + "start_time": 18.795350742703658, + "end_time": 19.77058883794175, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_8_A.wav", + "silence_duration": 0.5495722372010446, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Then, why are you on the bus with me?", + "original_text": "Then, why are you on the bus with me?", + "start_time": 20.11373032223654, + "end_time": 21.971326694118623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_9_B.wav", + "silence_duration": 0.3431414842947855, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm waiting till our President gets out of office, and the gas prices", + "original_text": "I'm waiting till our President gets out of office, and the gas prices [interrupt] hopefully start to drop significantly so I can save some money while still getting around conveniently.", + "start_time": 22.496329575843642, + "end_time": 32.13261075498197, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_10_A.wav", + "silence_duration": 0.5250028817250197, + "is_interrupted": true, + "text_after_interrupt": "hopefully start to drop significantly so I can save some money while still getting around conveniently." + }, + { + "speaker": "B", + "text": "Oh, that makes sense. But wait, how long did you say you've been on the bus again?", + "original_text": "Oh, that makes sense. But wait, how long did you say you've been on the bus again?", + "start_time": 30.38677118335231, + "end_time": 34.32255349627748, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_11_B.wav", + "silence_duration": 0.5966449064527359, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "About 15 minutes. And yeah, I'm hoping the gas prices go down soon.", + "original_text": "About 15 minutes. And yeah, I'm hoping the gas prices go down soon.", + "start_time": 34.805842124413644, + "end_time": 39.844572283143805, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_12_A.wav", + "silence_duration": 0.483288628136167, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's good thinking.", + "original_text": "That's good thinking.", + "start_time": 40.23738358343776, + "end_time": 41.189401724027334, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--415/temp/line_13_B.wav", + "silence_duration": 0.39281130029395706, + "is_interrupted": false + } + ] + }, + "DialogSum--val--416": { + "original_text": "A: May I take your order? \nB: What's the specialty of the house? \nA: The baked fish in tomato sauce is pretty [interrupt] tender and flavorful, it's one of our most popular dishes because we use a secret blend of herbs and spices that have been passed down through generations of chefs here. \nB: Sorry to interrupt, but could you tell me if the fish is fresh? \nA: Yes, it's fresh daily. As I was saying, the baked fish in tomato sauce is pretty good and pairs wonderfully with our house white wine if you're interested. \nB: I like fish. Please bring me an order of that. \nA: Do you want some dessert? \nB: Apple pie, please. \nA: Single or [interrupt] double serving? We also offer a complimentary coffee with our desserts if you'd like to enjoy the full dining experience. \nB: Oh, wait! I forgot to ask—does the pie come with ice cream? \nA: Yes, it does. Now, would you like a single or double serving? \nB: Make it two.", + "cleaned_text": "A: May I take your order? \nB: What's the specialty of the house? \nA:The baked fish in tomato sauce is pretty tender and flavorful, it's one of our most popular dishes because we use a secret blend of herbs and spices that have been passed down through generations of chefs here.\nB: Sorry to interrupt, but could you tell me if the fish is fresh? \nA: Yes, it's fresh daily. As I was saying, the baked fish in tomato sauce is pretty good and pairs wonderfully with our house white wine if you're interested. \nB: I like fish. Please bring me an order of that. \nA: Do you want some dessert? \nB: Apple pie, please. \nA:Single or double serving? We also offer a complimentary coffee with our desserts if you'd like to enjoy the full dining experience.\nB: Oh, wait! I forgot to ask—does the pie come with ice cream? \nA: Yes, it does. Now, would you like a single or double serving? \nB: Make it two.", + "total_duration": 48.13532879818594, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I take your order?", + "original_text": "May I take your order?", + "start_time": 0, + "end_time": 1.3351473922902495, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What's the specialty of the house?", + "original_text": "What's the specialty of the house?", + "start_time": 1.6587933687906786, + "end_time": 3.2725802168632407, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_1_B.wav", + "silence_duration": 0.32364597650042926, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "The baked fish in tomato sauce is pretty", + "original_text": "The baked fish in tomato sauce is pretty [interrupt] tender and flavorful, it's one of our most popular dishes because we use a secret blend of herbs and spices that have been passed down through generations of chefs here.", + "start_time": 3.8537165917850804, + "end_time": 16.972990968202314, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_2_A.wav", + "silence_duration": 0.5811363749218396, + "is_interrupted": true, + "text_after_interrupt": "tender and flavorful, it's one of our most popular dishes because we use a secret blend of herbs and spices that have been passed down through generations of chefs here." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but could you tell me if the fish is fresh?", + "original_text": "Sorry to interrupt, but could you tell me if the fish is fresh?", + "start_time": 6.164102079313425, + "end_time": 9.263966024891657, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_3_B.wav", + "silence_duration": 0.4776498831283674, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it's fresh daily. As I was saying, the baked fish in tomato sauce is pretty good and pairs wonderfully with our house white wine if you're interested.", + "original_text": "Yes, it's fresh daily. As I was saying, the baked fish in tomato sauce is pretty good and pairs wonderfully with our house white wine if you're interested.", + "start_time": 17.289227220327835, + "end_time": 26.461109306495636, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_4_A.wav", + "silence_duration": 0.3162362521255212, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I like fish. Please bring me an order of that.", + "original_text": "I like fish. Please bring me an order of that.", + "start_time": 26.83251026064298, + "end_time": 29.409925226629376, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_5_B.wav", + "silence_duration": 0.37140095414734375, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you want some dessert?", + "original_text": "Do you want some dessert?", + "start_time": 29.802533938839517, + "end_time": 31.07963144450845, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_6_A.wav", + "silence_duration": 0.3926087122101394, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Apple pie, please.", + "original_text": "Apple pie, please.", + "start_time": 31.525891094029742, + "end_time": 32.77976864505015, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_7_B.wav", + "silence_duration": 0.4462596495212917, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Single or", + "original_text": "Single or [interrupt] double serving? We also offer a complimentary coffee with our desserts if you'd like to enjoy the full dining experience.", + "start_time": 33.373690994579825, + "end_time": 41.744484645373475, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_8_A.wav", + "silence_duration": 0.5939223495296807, + "is_interrupted": true, + "text_after_interrupt": "double serving? We also offer a complimentary coffee with our desserts if you'd like to enjoy the full dining experience." + }, + { + "speaker": "B", + "text": "Oh, wait! I forgot to ask—does the pie come with ice cream?", + "original_text": "Oh, wait! I forgot to ask—does the pie come with ice cream?", + "start_time": 38.569005276890984, + "end_time": 42.504787589816154, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_9_B.wav", + "silence_duration": 0.4724688904560134, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, it does. Now, would you like a single or double serving?", + "original_text": "Yes, it does. Now, would you like a single or double serving?", + "start_time": 42.8489542407037, + "end_time": 46.86600639489871, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_10_A.wav", + "silence_duration": 0.34416665088754145, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Make it two.", + "original_text": "Make it two.", + "start_time": 47.26459926436369, + "end_time": 48.13534756368342, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--416/temp/line_11_B.wav", + "silence_duration": 0.3985928694649764, + "is_interrupted": false + } + ] + }, + "DialogSum--val--417": { + "original_text": "A: Oh, I'm afraid we've sold out of those. They were really [interrupt] in high demand, so they went quickly and we've had multiple customers asking about them throughout the day. \nB: Sold out? That's disappointing. Do you know when you'll be getting more in? \nA: They were really popular, but I haven't mentioned yet—Yes, we should be getting more in next week. Would you like me to reserve one for you? \nB: That would be great, thank you. And just to confirm, it's definitely the DS102 series, right?", + "cleaned_text": "A:Oh, I'm afraid we've sold out of those. They were really in high demand, so they went quickly and we've had multiple customers asking about them throughout the day.\nB: Sold out? That's disappointing. Do you know when you'll be getting more in? \nA: They were really popular, but I haven't mentioned yet—Yes, we should be getting more in next week. Would you like me to reserve one for you? \nB: That would be great, thank you. And just to confirm, it's definitely the DS102 series, right?", + "total_duration": 24.024807256235828, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--417/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--417/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--417/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Oh, I'm afraid we've sold out of those. They were really", + "original_text": "Oh, I'm afraid we've sold out of those. They were really [interrupt] in high demand, so they went quickly and we've had multiple customers asking about them throughout the day.", + "start_time": 0, + "end_time": 9.531791383219955, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--417/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "in high demand, so they went quickly and we've had multiple customers asking about them throughout the day." + }, + { + "speaker": "B", + "text": "Sold out? That's disappointing. Do you know when you'll be getting more in?", + "original_text": "Sold out? That's disappointing. Do you know when you'll be getting more in?", + "start_time": 3.6687528344671203, + "end_time": 6.977596371882086, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--417/temp/line_1_B.wav", + "silence_duration": 0.40295396648224124, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "They were really popular, but I haven't mentioned yet—Yes, we should be getting more in next week. Would you like me to reserve one for you?", + "original_text": "They were really popular, but I haven't mentioned yet—Yes, we should be getting more in next week. Would you like me to reserve one for you?", + "start_time": 9.952556064534466, + "end_time": 18.125980100815646, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--417/temp/line_2_A.wav", + "silence_duration": 0.4207646813145114, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That would be great, thank you. And just to confirm, it's definitely the DS102 series, right?", + "original_text": "That would be great, thank you. And just to confirm, it's definitely the DS102 series, right?", + "start_time": 18.695848933722058, + "end_time": 24.024828525558792, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--417/temp/line_3_B.wav", + "silence_duration": 0.5698688329064131, + "is_interrupted": false + } + ] + }, + "DialogSum--val--418": { + "original_text": "A: Your total comes to $36.78. \nB: Put it on my VISA. \nA: There's a problem with your [interrupt] card. It seems like it might be expired or there could be an issue with the bank authorization system preventing the transaction from going through successfully. \nB: What's wrong with it? \nA: I believe it was declined. \nB: You're kidding me! \nA: Do you have another card I could try, or maybe an alternative payment method like a mobile wallet? \nB: I only have one card. What should I do now? \nA: Do you have cash, perhaps? \nB: I don't have any cash on me. \nA: You're not going to be able to take these items today. \nB: I'll be back tomorrow.", + "cleaned_text": "A: Your total comes to $36.78. \nB: Put it on my VISA. \nA:There's a problem with your card. It seems like it might be expired or there could be an issue with the bank authorization system preventing the transaction from going through successfully.\nB: What's wrong with it? \nA: I believe it was declined. \nB: You're kidding me! \nA: Do you have another card I could try, or maybe an alternative payment method like a mobile wallet? \nB: I only have one card. What should I do now? \nA: Do you have cash, perhaps? \nB: I don't have any cash on me. \nA: You're not going to be able to take these items today. \nB: I'll be back tomorrow.", + "total_duration": 37.76090702947846, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Your total comes to $36.78.", + "original_text": "Your total comes to $36.78.", + "start_time": 0, + "end_time": 3.332063492063492, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Put it on my VISA.", + "original_text": "Put it on my VISA.", + "start_time": 3.7062169586408102, + "end_time": 4.878824668391378, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_1_B.wav", + "silence_duration": 0.37415346657731846, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "There's a problem with your", + "original_text": "There's a problem with your [interrupt] card. It seems like it might be expired or there could be an issue with the bank authorization system preventing the transaction from going through successfully.", + "start_time": 5.18414975461626, + "end_time": 15.934988756883833, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_2_A.wav", + "silence_duration": 0.3053250862248822, + "is_interrupted": true, + "text_after_interrupt": "card. It seems like it might be expired or there could be an issue with the bank authorization system preventing the transaction from going through successfully." + }, + { + "speaker": "B", + "text": "What's wrong with it?", + "original_text": "What's wrong with it?", + "start_time": 7.2158957863622915, + "end_time": 8.272403722870228, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_3_B.wav", + "silence_duration": 0.39345193270181344, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I believe it was declined.", + "original_text": "I believe it was declined.", + "start_time": 16.49994417715079, + "end_time": 18.148560957196143, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_4_A.wav", + "silence_duration": 0.5649554202669587, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You're kidding me!", + "original_text": "You're kidding me!", + "start_time": 18.607006847879354, + "end_time": 19.58224494311745, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_5_B.wav", + "silence_duration": 0.45844589068321157, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you have another card I could try, or maybe an alternative payment method like a mobile wallet?", + "original_text": "Do you have another card I could try, or maybe an alternative payment method like a mobile wallet?", + "start_time": 19.978037199729293, + "end_time": 25.713365997915233, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_6_A.wav", + "silence_duration": 0.39579225661184625, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I only have one card. What should I do now?", + "original_text": "I only have one card. What should I do now?", + "start_time": 26.249418612205798, + "end_time": 28.687513850301038, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_7_B.wav", + "silence_duration": 0.5360526142905663, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you have cash, perhaps?", + "original_text": "Do you have cash, perhaps?", + "start_time": 29.04820904701485, + "end_time": 30.603946008466096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_8_A.wav", + "silence_duration": 0.3606951967138117, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't have any cash on me.", + "original_text": "I don't have any cash on me.", + "start_time": 31.056522216666316, + "end_time": 32.61225917811756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_9_B.wav", + "silence_duration": 0.45257620820021993, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You're not going to be able to take these items today.", + "original_text": "You're not going to be able to take these items today.", + "start_time": 33.137230727534025, + "end_time": 36.10938492254536, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_10_A.wav", + "silence_duration": 0.5249715494164617, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll be back tomorrow.", + "original_text": "I'll be back tomorrow.", + "start_time": 36.61153362187148, + "end_time": 37.76092137697352, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--418/temp/line_11_B.wav", + "silence_duration": 0.5021486993261209, + "is_interrupted": false + } + ] + }, + "DialogSum--val--422": { + "original_text": "A: Are you going to vote this Tuesday? \nB: Yes, I am, and I am so [interrupt] excited to finally have a say in this election because I've been following the campaigns closely and truly believe this is a pivotal moment for our country's future. \nA: Sorry to interrupt, but have you figured out who you're going to vote for? \nB: I love my candidate. \nA: Why is that? \nB: My candidate is probably the most intelligent. \nA: Is that right? \nB: I also agree with all his policies. \nA: That's great! By the way, you mentioned you were excited earlier—what specifically are you excited about? \nB: I know he's going to be the next President. \nA: Hopefully, he will be. \nB: I can't wait to vote.", + "cleaned_text": "A: Are you going to vote this Tuesday? \nB:Yes, I am, and I am so excited to finally have a say in this election because I've been following the campaigns closely and truly believe this is a pivotal moment for our country's future.\nA: Sorry to interrupt, but have you figured out who you're going to vote for? \nB: I love my candidate. \nA: Why is that? \nB: My candidate is probably the most intelligent. \nA: Is that right? \nB: I also agree with all his policies. \nA: That's great! By the way, you mentioned you were excited earlier—what specifically are you excited about? \nB: I know he's going to be the next President. \nA: Hopefully, he will be. \nB: I can't wait to vote.", + "total_duration": 34.542040816326534, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you going to vote this Tuesday?", + "original_text": "Are you going to vote this Tuesday?", + "start_time": 0, + "end_time": 1.8343764172335602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, I am, and I am so", + "original_text": "Yes, I am, and I am so [interrupt] excited to finally have a say in this election because I've been following the campaigns closely and truly believe this is a pivotal moment for our country's future.", + "start_time": 2.2807964539449745, + "end_time": 11.638438177300984, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_1_B.wav", + "silence_duration": 0.4464200367114144, + "is_interrupted": true, + "text_after_interrupt": "excited to finally have a say in this election because I've been following the campaigns closely and truly believe this is a pivotal moment for our country's future." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but have you figured out who you're going to vote for?", + "original_text": "Sorry to interrupt, but have you figured out who you're going to vote for?", + "start_time": 3.7784835287749066, + "end_time": 8.132225025373547, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_2_A.wav", + "silence_duration": 0.35740350261999865, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I love my candidate.", + "original_text": "I love my candidate.", + "start_time": 12.042483312575756, + "end_time": 13.215091022326323, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_3_B.wav", + "silence_duration": 0.4040451352747719, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why is that?", + "original_text": "Why is that?", + "start_time": 13.54930368219185, + "end_time": 14.524541777429945, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_4_A.wav", + "silence_duration": 0.33421265986552634, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My candidate is probably the most intelligent.", + "original_text": "My candidate is probably the most intelligent.", + "start_time": 15.081110094147256, + "end_time": 17.600475173512336, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_5_B.wav", + "silence_duration": 0.5565683167173109, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is that right?", + "original_text": "Is that right?", + "start_time": 18.04340074654905, + "end_time": 18.96058895516583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_6_A.wav", + "silence_duration": 0.4429255730367151, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I also agree with all his policies.", + "original_text": "I also agree with all his policies.", + "start_time": 19.523572747237523, + "end_time": 21.601758688280608, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_7_B.wav", + "silence_duration": 0.562983792071696, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's great! By the way, you mentioned you were excited earlier—what specifically are you excited about?", + "original_text": "That's great! By the way, you mentioned you were excited earlier—what specifically are you excited about?", + "start_time": 22.17392433680002, + "end_time": 28.79161141162995, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_8_A.wav", + "silence_duration": 0.5721656485194138, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I know he's going to be the next President.", + "original_text": "I know he's going to be the next President.", + "start_time": 29.114852359791087, + "end_time": 30.984058708997438, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_9_B.wav", + "silence_duration": 0.3232409481611355, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hopefully, he will be.", + "original_text": "Hopefully, he will be.", + "start_time": 31.57712343227119, + "end_time": 32.91227082456144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_10_A.wav", + "silence_duration": 0.5930647232737527, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I can't wait to vote.", + "original_text": "I can't wait to vote.", + "start_time": 33.28819295474517, + "end_time": 34.54207050576558, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--422/temp/line_11_B.wav", + "silence_duration": 0.37592213018373233, + "is_interrupted": false + } + ] + }, + "DialogSum--val--423": { + "original_text": "A: I wonder if you could help me find something for my daughter.\nB: Do you think she'd like a laptop?\nA: I think that would be [interrupt] a great idea, especially since she's starting college soon and will need reliable technology for all her coursework and research projects.\nB: Sorry to jump in, but does she have any specific brand preferences? It might help narrow down the options.\nA: Actually, she prefers Macs. How much is one?\nB: Our 15-inch Pro will cost you only $2,100.\nA: She's going to be so happy. Let me have one.\nB: You've made a good decision. How would you like to complete the payment? We accept various methods.\nA: Oh, I'll pay for it with my VISA.\nB: It's all yours after you sign here, please.\nA: By the way, are there any extras that she needs?\nB: This is good to go. If she wants accessories, just visit us again.", + "cleaned_text": "A: I wonder if you could help me find something for my daughter.\nB: Do you think she'd like a laptop?\nA:I think that would be a great idea, especially since she's starting college soon and will need reliable technology for all her coursework and research projects.\nB: Sorry to jump in, but does she have any specific brand preferences? It might help narrow down the options.\nA: Actually, she prefers Macs. How much is one?\nB: Our 15-inch Pro will cost you only $2,100.\nA: She's going to be so happy. Let me have one.\nB: You've made a good decision. How would you like to complete the payment? We accept various methods.\nA: Oh, I'll pay for it with my VISA.\nB: It's all yours after you sign here, please.\nA: By the way, are there any extras that she needs?\nB: This is good to go. If she wants accessories, just visit us again.", + "total_duration": 44.717777777777776, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I wonder if you could help me find something for my daughter.", + "original_text": "I wonder if you could help me find something for my daughter.", + "start_time": 0, + "end_time": 3.076643990929705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Do you think she'd like a laptop?", + "original_text": "Do you think she'd like a laptop?", + "start_time": 3.622554730835597, + "end_time": 5.073801896368477, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_1_B.wav", + "silence_duration": 0.5459107399058917, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think that would be", + "original_text": "I think that would be [interrupt] a great idea, especially since she's starting college soon and will need reliable technology for all her coursework and research projects.", + "start_time": 5.481685231194045, + "end_time": 14.816106999901528, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_2_A.wav", + "silence_duration": 0.4078833348255681, + "is_interrupted": true, + "text_after_interrupt": "a great idea, especially since she's starting college soon and will need reliable technology for all her coursework and research projects." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but does she have any specific brand preferences? It might help narrow down the options.", + "original_text": "Sorry to jump in, but does she have any specific brand preferences? It might help narrow down the options.", + "start_time": 6.6775128955931375, + "end_time": 12.772750990831232, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_3_B.wav", + "silence_duration": 0.3483021733249529, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, she prefers Macs. How much is one?", + "original_text": "Actually, she prefers Macs. How much is one?", + "start_time": 15.283492721503338, + "end_time": 18.8129258280793, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_4_A.wav", + "silence_duration": 0.46738572160181, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Our 15-inch Pro will cost you only $2,100.", + "original_text": "Our 15-inch Pro will cost you only $2,100.", + "start_time": 19.33301196475592, + "end_time": 22.827615139359093, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_5_B.wav", + "silence_duration": 0.520086136676617, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "She's going to be so happy. Let me have one.", + "original_text": "She's going to be so happy. Let me have one.", + "start_time": 23.36419492676343, + "end_time": 26.440838917693135, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_6_A.wav", + "silence_duration": 0.5365797874043398, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You've made a good decision. How would you like to complete the payment? We accept various methods.", + "original_text": "You've made a good decision. How would you like to complete the payment? We accept various methods.", + "start_time": 26.913772999530035, + "end_time": 31.848013362341828, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_7_B.wav", + "silence_duration": 0.472934081836902, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I'll pay for it with my VISA.", + "original_text": "Oh, I'll pay for it with my VISA.", + "start_time": 32.21925196779147, + "end_time": 34.22777804488898, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_8_A.wav", + "silence_duration": 0.37123860544964477, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's all yours after you sign here, please.", + "original_text": "It's all yours after you sign here, please.", + "start_time": 34.67580731536447, + "end_time": 36.974582825568554, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_9_B.wav", + "silence_duration": 0.44802927047549707, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "By the way, are there any extras that she needs?", + "original_text": "By the way, are there any extras that she needs?", + "start_time": 37.318933320211954, + "end_time": 40.45362719776298, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_10_A.wav", + "silence_duration": 0.34435049464339873, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "This is good to go. If she wants accessories, just visit us again.", + "original_text": "This is good to go. If she wants accessories, just visit us again.", + "start_time": 40.86328713479479, + "end_time": 44.717799606450114, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--423/temp/line_11_B.wav", + "silence_duration": 0.40965993703181025, + "is_interrupted": false + } + ] + }, + "DialogSum--val--425": { + "original_text": "A: I want to rent skis and boots. \nB: Here you are. Have a nice stay here. \nA: Thank you. I am a learner so can you tell me where I can find a ski [interrupt] instructor who can help me get started with proper techniques and safety measures on the slopes? \nB: Oh, are you a complete beginner? If so, we have instructors who specialize in teaching newcomers. \nA: Yes, I am. I was asking where I can find a ski instructor. \nB: We will find you one. Wait a moment.", + "cleaned_text": "A: I want to rent skis and boots. \nB: Here you are. Have a nice stay here. \nA:Thank you. I am a learner so can you tell me where I can find a ski instructor who can help me get started with proper techniques and safety measures on the slopes?\nB: Oh, are you a complete beginner? If so, we have instructors who specialize in teaching newcomers. \nA: Yes, I am. I was asking where I can find a ski instructor. \nB: We will find you one. Wait a moment.", + "total_duration": 22.342494331065758, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I want to rent skis and boots.", + "original_text": "I want to rent skis and boots.", + "start_time": 0, + "end_time": 2.159455782312925, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here you are. Have a nice stay here.", + "original_text": "Here you are. Have a nice stay here.", + "start_time": 2.5321901928811728, + "end_time": 5.086385204219042, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/temp/line_1_B.wav", + "silence_duration": 0.3727344105682476, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you. I am a learner so can you tell me where I can find a ski", + "original_text": "Thank you. I am a learner so can you tell me where I can find a ski [interrupt] instructor who can help me get started with proper techniques and safety measures on the slopes?", + "start_time": 5.6596432304425655, + "end_time": 14.796695384637577, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/temp/line_2_A.wav", + "silence_duration": 0.5732580262235241, + "is_interrupted": true, + "text_after_interrupt": "instructor who can help me get started with proper techniques and safety measures on the slopes?" + }, + { + "speaker": "B", + "text": "Oh, are you a complete beginner? If so, we have instructors who specialize in teaching newcomers.", + "original_text": "Oh, are you a complete beginner? If so, we have instructors who specialize in teaching newcomers.", + "start_time": 9.676695384637576, + "end_time": 15.65583370663304, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/temp/line_3_B.wav", + "silence_duration": 0.3823234095256017, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I am. I was asking where I can find a ski instructor.", + "original_text": "Yes, I am. I was asking where I can find a ski instructor.", + "start_time": 16.226288347153652, + "end_time": 19.88343120429651, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/temp/line_4_A.wav", + "silence_duration": 0.570454640520613, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We will find you one. Wait a moment.", + "original_text": "We will find you one. Wait a moment.", + "start_time": 20.264314462500053, + "end_time": 22.342500403543138, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--425/temp/line_5_B.wav", + "silence_duration": 0.3808832582035421, + "is_interrupted": false + } + ] + }, + "DialogSum--val--426": { + "original_text": "A: There's a lot of traffic on the street. Is this the shopping district? \nB: Yes, it is. There are a lot of stores, office buildings, and theatres near [interrupt] the main square, which is just a few blocks away and always bustling with activity, especially during weekends when street performers and food vendors set up their stalls. \nA: Sorry to interrupt, but I was wondering, do you know if there's a good place to park around here? \nB: There's a parking garage two blocks down on the left. But as I was saying, there are a lot of stores and theatres here. The largest building on the left is a department store. It sells clothing, furniture, food—almost everything. \nA: Do you buy everything in the same store? That's very handy, isn't it? It saves a lot of time. I need some clothes. \nB: There's a men's clothing store next to the bank building on the right. There are also some good stores on Lincoln Street. \nA: That's a beautiful theatre on the corner. What do all the signs in front of it say about the upcoming events? \nB: Oh, those signs? They're advertising a new play that's opening tonight. The building next to the theatre is a hotel. \nA: Interesting. And earlier, you mentioned a department store—does it also carry electronics? \nB: Yes, it does. And by the way, the post office is just three blocks straight ahead, not across the street.", + "cleaned_text": "A: There's a lot of traffic on the street. Is this the shopping district? \nB:Yes, it is. There are a lot of stores, office buildings, and theatres near the main square, which is just a few blocks away and always bustling with activity, especially during weekends when street performers and food vendors set up their stalls.\nA: Sorry to interrupt, but I was wondering, do you know if there's a good place to park around here? \nB: There's a parking garage two blocks down on the left. But as I was saying, there are a lot of stores and theatres here. The largest building on the left is a department store. It sells clothing, furniture, food—almost everything. \nA: Do you buy everything in the same store? That's very handy, isn't it? It saves a lot of time. I need some clothes. \nB: There's a men's clothing store next to the bank building on the right. There are also some good stores on Lincoln Street. \nA: That's a beautiful theatre on the corner. What do all the signs in front of it say about the upcoming events? \nB: Oh, those signs? They're advertising a new play that's opening tonight. The building next to the theatre is a hotel. \nA: Interesting. And earlier, you mentioned a department store—does it also carry electronics? \nB: Yes, it does. And by the way, the post office is just three blocks straight ahead, not across the street.", + "total_duration": 70.95183673469388, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "There's a lot of traffic on the street. Is this the shopping district?", + "original_text": "There's a lot of traffic on the street. Is this the shopping district?", + "start_time": 0, + "end_time": 4.237641723356009, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it is. There are a lot of stores, office buildings, and theatres near", + "original_text": "Yes, it is. There are a lot of stores, office buildings, and theatres near [interrupt] the main square, which is just a few blocks away and always bustling with activity, especially during weekends when street performers and food vendors set up their stalls.", + "start_time": 4.672665398859014, + "end_time": 17.501690342169674, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_1_B.wav", + "silence_duration": 0.435023675503005, + "is_interrupted": true, + "text_after_interrupt": "the main square, which is just a few blocks away and always bustling with activity, especially during weekends when street performers and food vendors set up their stalls." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but I was wondering, do you know if there's a good place to park around here?", + "original_text": "Sorry to interrupt, but I was wondering, do you know if there's a good place to park around here?", + "start_time": 8.689717553054024, + "end_time": 14.761735693643594, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_2_A.wav", + "silence_duration": 0.39847180867451576, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There's a parking garage two blocks down on the left. But as I was saying, there are a lot of stores and theatres here. The largest building on the left is a department store. It sells clothing, furniture, food—almost everything.", + "original_text": "There's a parking garage two blocks down on the left. But as I was saying, there are a lot of stores and theatres here. The largest building on the left is a department store. It sells clothing, furniture, food—almost everything.", + "start_time": 18.026715712023393, + "end_time": 30.263631811796635, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_3_B.wav", + "silence_duration": 0.5250253698537176, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you buy everything in the same store? That's very handy, isn't it? It saves a lot of time. I need some clothes.", + "original_text": "Do you buy everything in the same store? That's very handy, isn't it? It saves a lot of time. I need some clothes.", + "start_time": 30.718189136372157, + "end_time": 38.276284374467394, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_4_A.wav", + "silence_duration": 0.45455732457552056, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There's a men's clothing store next to the bank building on the right. There are also some good stores on Lincoln Street.", + "original_text": "There's a men's clothing store next to the bank building on the right. There are also some good stores on Lincoln Street.", + "start_time": 38.615763681693025, + "end_time": 44.467192253121596, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_5_B.wav", + "silence_duration": 0.33947930722562963, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a beautiful theatre on the corner. What do all the signs in front of it say about the upcoming events?", + "original_text": "That's a beautiful theatre on the corner. What do all the signs in front of it say about the upcoming events?", + "start_time": 44.9959482942069, + "end_time": 51.39304579987583, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_6_A.wav", + "silence_duration": 0.5287560410853015, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, those signs? They're advertising a new play that's opening tonight. The building next to the theatre is a hotel.", + "original_text": "Oh, those signs? They're advertising a new play that's opening tonight. The building next to the theatre is a hotel.", + "start_time": 51.97116785787046, + "end_time": 58.4611451821335, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_7_B.wav", + "silence_duration": 0.5781220579946309, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Interesting. And earlier, you mentioned a department store—does it also carry electronics?", + "original_text": "Interesting. And earlier, you mentioned a department store—does it also carry electronics?", + "start_time": 58.97428911145853, + "end_time": 64.3845385445651, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_8_A.wav", + "silence_duration": 0.5131439293250328, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it does. And by the way, the post office is just three blocks straight ahead, not across the street.", + "original_text": "Yes, it does. And by the way, the post office is just three blocks straight ahead, not across the street.", + "start_time": 64.96110942388829, + "end_time": 70.95185772320802, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--426/temp/line_9_B.wav", + "silence_duration": 0.5765708793231795, + "is_interrupted": false + } + ] + }, + "DialogSum--val--427": { + "original_text": "A: The service is really slow here. I've been trying to get the waiter's attention for the last ten minutes.\nB: I hope he takes our order soon. Otherwise I'll be late for my class at two o'clock.\nA: Me, too. I have a class at 2 as well.\nB: I've noticed you have a math book. Do you [interrupt] study math as your major? It seems like a tough subject with all those complex equations and abstract theories that require so much dedication and practice to master.\nA: Oh, yes! I actually like the summer school here. It's pretty good. I think I've learned a lot.\nB: That's great to hear. I only wish the class were a little smaller, but I like my teachers a lot. They are very kind and patient.\nA: I see. By the way, where are you from?\nB: I'm from Boston. How about you?\nA: I'm from Washington DC. I'm only staying here for three more weeks. Then I'll go to Columbia University in New York. Oh, I just realized I didn't ask—do you like the summer school here? You mentioned the class size, but what about the overall experience?\nB: I do like it overall, just wish it was a bit more personalized. Oh, look, here comes the waiter. It seems we are going to get served after all.", + "cleaned_text": "A: The service is really slow here. I've been trying to get the waiter's attention for the last ten minutes.\nB: I hope he takes our order soon. Otherwise I'll be late for my class at two o'clock.\nA: Me, too. I have a class at 2 as well.\nB:I've noticed you have a math book. Do you study math as your major? It seems like a tough subject with all those complex equations and abstract theories that require so much dedication and practice to master.\nA: Oh, yes! I actually like the summer school here. It's pretty good. I think I've learned a lot.\nB: That's great to hear. I only wish the class were a little smaller, but I like my teachers a lot. They are very kind and patient.\nA: I see. By the way, where are you from?\nB: I'm from Boston. How about you?\nA: I'm from Washington DC. I'm only staying here for three more weeks. Then I'll go to Columbia University in New York. Oh, I just realized I didn't ask—do you like the summer school here? You mentioned the class size, but what about the overall experience?\nB: I do like it overall, just wish it was a bit more personalized. Oh, look, here comes the waiter. It seems we are going to get served after all.", + "total_duration": 61.88548752834467, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The service is really slow here. I've been trying to get the waiter's attention for the last ten minutes.", + "original_text": "The service is really slow here. I've been trying to get the waiter's attention for the last ten minutes.", + "start_time": 0, + "end_time": 5.758548752834467, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I hope he takes our order soon. Otherwise I'll be late for my class at two o'clock.", + "original_text": "I hope he takes our order soon. Otherwise I'll be late for my class at two o'clock.", + "start_time": 6.142236055278991, + "end_time": 10.600467347795998, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_1_B.wav", + "silence_duration": 0.3836873024445238, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Me, too. I have a class at 2 as well.", + "original_text": "Me, too. I have a class at 2 as well.", + "start_time": 11.020565545909411, + "end_time": 14.015939695569276, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_2_A.wav", + "silence_duration": 0.4200981981134129, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've noticed you have a math book. Do you", + "original_text": "I've noticed you have a math book. Do you [interrupt] study math as your major? It seems like a tough subject with all those complex equations and abstract theories that require so much dedication and practice to master.", + "start_time": 14.507420740845664, + "end_time": 25.53689919889555, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_3_B.wav", + "silence_duration": 0.4914810452763869, + "is_interrupted": true, + "text_after_interrupt": "study math as your major? It seems like a tough subject with all those complex equations and abstract theories that require so much dedication and practice to master." + }, + { + "speaker": "A", + "text": "Oh, yes! I actually like the summer school here. It's pretty good. I think I've learned a lot.", + "original_text": "Oh, yes! I actually like the summer school here. It's pretty good. I think I've learned a lot.", + "start_time": 16.39984704470054, + "end_time": 22.27449557077764, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_4_A.wav", + "silence_duration": 0.5188507799909688, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's great to hear. I only wish the class were a little smaller, but I like my teachers a lot. They are very kind and patient.", + "original_text": "That's great to hear. I only wish the class were a little smaller, but I like my teachers a lot. They are very kind and patient.", + "start_time": 26.04743530315298, + "end_time": 32.66512237798291, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_5_B.wav", + "silence_duration": 0.5105361042574305, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I see. By the way, where are you from?", + "original_text": "I see. By the way, where are you from?", + "start_time": 33.069336030459596, + "end_time": 36.1459800213893, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_6_A.wav", + "silence_duration": 0.40421365247668284, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm from Boston. How about you?", + "original_text": "I'm from Boston. How about you?", + "start_time": 36.73260010827201, + "end_time": 38.45087675226294, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_7_B.wav", + "silence_duration": 0.5866200868827094, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm from Washington DC. I'm only staying here for three more weeks. Then I'll go to Columbia University in New York. Oh, I just realized I didn't ask—do you like the summer school here? You mentioned the class size, but what about the overall experience?", + "original_text": "I'm from Washington DC. I'm only staying here for three more weeks. Then I'll go to Columbia University in New York. Oh, I just realized I didn't ask—do you like the summer school here? You mentioned the class size, but what about the overall experience?", + "start_time": 38.76284956124727, + "end_time": 54.69173845013616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_8_A.wav", + "silence_duration": 0.31197280898433205, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I do like it overall, just wish it was a bit more personalized. Oh, look, here comes the waiter. It seems we are going to get served after all.", + "original_text": "I do like it overall, just wish it was a bit more personalized. Oh, look, here comes the waiter. It seems we are going to get served after all.", + "start_time": 55.01242001131146, + "end_time": 61.88552658727518, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--427/temp/line_9_B.wav", + "silence_duration": 0.32068156117530744, + "is_interrupted": false + } + ] + }, + "DialogSum--val--428": { + "original_text": "A: What do you like most about your new job? \nB: Well, I get better paid and the distance between work and home is shorter. But the best part is that they have training programs to improve our work skills. And they run partly on company time, usually from four to six on Wednesdays and Fridays, which is perfect because it doesn't interfere with my [interrupt] personal commitments and still allows me to dedicate enough time to learning new techniques and methodologies. \nA: Sorry to jump in, but I was curious—do these training programs cover advanced topics or just the basics? \nB: They actually cover both, which is really helpful. They start with the basics and then move on to more advanced skills. \nA: That sounds great. I wish my company did that. \nB: It really is a good thing. And even though the company has to pay for the training, it's worth it in the long run. Because with a greater understanding of the computer programs I use every day, I do my daily tasks more quickly and gain insights into optimizing processes that I hadn't considered before. \nA: And effectively, right? That must be a huge time-saver for you. \nB: Absolutely, it is.", + "cleaned_text": "A: What do you like most about your new job? \nB:Well, I get better paid and the distance between work and home is shorter. But the best part is that they have training programs to improve our work skills. And they run partly on company time, usually from four to six on Wednesdays and Fridays, which is perfect because it doesn't interfere with my personal commitments and still allows me to dedicate enough time to learning new techniques and methodologies.\nA: Sorry to jump in, but I was curious—do these training programs cover advanced topics or just the basics? \nB: They actually cover both, which is really helpful. They start with the basics and then move on to more advanced skills. \nA: That sounds great. I wish my company did that. \nB: It really is a good thing. And even though the company has to pay for the training, it's worth it in the long run. Because with a greater understanding of the computer programs I use every day, I do my daily tasks more quickly and gain insights into optimizing processes that I hadn't considered before. \nA: And effectively, right? That must be a huge time-saver for you. \nB: Absolutely, it is.", + "total_duration": 57.06258503401361, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What do you like most about your new job?", + "original_text": "What do you like most about your new job?", + "start_time": 0, + "end_time": 2.1942857142857144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I get better paid and the distance between work and home is shorter. But the best part is that they have training programs to improve our work skills. And they run partly on company time, usually from four to six on Wednesdays and Fridays, which is perfect because it doesn't interfere with my", + "original_text": "Well, I get better paid and the distance between work and home is shorter. But the best part is that they have training programs to improve our work skills. And they run partly on company time, usually from four to six on Wednesdays and Fridays, which is perfect because it doesn't interfere with my [interrupt] personal commitments and still allows me to dedicate enough time to learning new techniques and methodologies.", + "start_time": 2.5819041488458847, + "end_time": 22.481405282632736, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_1_B.wav", + "silence_duration": 0.3876184345601702, + "is_interrupted": true, + "text_after_interrupt": "personal commitments and still allows me to dedicate enough time to learning new techniques and methodologies." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I was curious—do these training programs cover advanced topics or just the basics?", + "original_text": "Sorry to jump in, but I was curious—do these training programs cover advanced topics or just the basics?", + "start_time": 18.092833854061304, + "end_time": 24.79179077016108, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_2_A.wav", + "silence_duration": 0.5265585941165409, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "They actually cover both, which is really helpful. They start with the basics and then move on to more advanced skills.", + "original_text": "They actually cover both, which is really helpful. They start with the basics and then move on to more advanced skills.", + "start_time": 25.279592387410116, + "end_time": 31.0961910268659, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_3_B.wav", + "silence_duration": 0.48780161724903814, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That sounds great. I wish my company did that.", + "original_text": "That sounds great. I wish my company did that.", + "start_time": 31.461994352746633, + "end_time": 34.70117802621602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_4_A.wav", + "silence_duration": 0.36580332588073317, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It really is a good thing. And even though the company has to pay for the training, it's worth it in the long run. Because with a greater understanding of the computer programs I use every day, I do my daily tasks more quickly and gain insights into optimizing processes that I hadn't considered before.", + "original_text": "It really is a good thing. And even though the company has to pay for the training, it's worth it in the long run. Because with a greater understanding of the computer programs I use every day, I do my daily tasks more quickly and gain insights into optimizing processes that I hadn't considered before.", + "start_time": 35.184177269388236, + "end_time": 50.97374643038597, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_5_B.wav", + "silence_duration": 0.4829992431722151, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And effectively, right? That must be a huge time-saver for you.", + "original_text": "And effectively, right? That must be a huge time-saver for you.", + "start_time": 51.3768747101041, + "end_time": 55.33587697767779, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_6_A.wav", + "silence_duration": 0.4031282797181268, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Absolutely, it is.", + "original_text": "Absolutely, it is.", + "start_time": 55.808748162248165, + "end_time": 57.062625713268574, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--428/temp/line_7_B.wav", + "silence_duration": 0.47287118457037336, + "is_interrupted": false + } + ] + }, + "DialogSum--val--431": { + "original_text": "A: Our flight will be delayed by 6 hours. That means it won't be leaving until 3:30 in the [interrupt] afternoon, which really messes up our plans for the day since we were supposed to arrive in time for the conference opening ceremony and now we'll miss the keynote speech entirely. \nB: Wait, 6 hours? That's a really long delay. Do you think we should check if there's any earlier flight available? \nA: I doubt there will be any, but it's worth a try. In the meantime, we could look for some seats in the quiet part of the terminal to take a nap. \nB: Good idea. I am pretty tired. By the way, what time did you say the flight was rescheduled to? \nA: 3:30 in the afternoon. \nB: Got it. Let's hope there are some comfy seats available.", + "cleaned_text": "A:Our flight will be delayed by 6 hours. That means it won't be leaving until 3:30 in the afternoon, which really messes up our plans for the day since we were supposed to arrive in time for the conference opening ceremony and now we'll miss the keynote speech entirely.\nB: Wait, 6 hours? That's a really long delay. Do you think we should check if there's any earlier flight available? \nA: I doubt there will be any, but it's worth a try. In the meantime, we could look for some seats in the quiet part of the terminal to take a nap. \nB: Good idea. I am pretty tired. By the way, what time did you say the flight was rescheduled to? \nA: 3:30 in the afternoon. \nB: Got it. Let's hope there are some comfy seats available.", + "total_duration": 36.03256235827664, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Our flight will be delayed by 6 hours. That means it won't be leaving until 3:30 in the", + "original_text": "Our flight will be delayed by 6 hours. That means it won't be leaving until 3:30 in the [interrupt] afternoon, which really messes up our plans for the day since we were supposed to arrive in time for the conference opening ceremony and now we'll miss the keynote speech entirely.", + "start_time": 0, + "end_time": 15.47609977324263, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "afternoon, which really messes up our plans for the day since we were supposed to arrive in time for the conference opening ceremony and now we'll miss the keynote speech entirely." + }, + { + "speaker": "B", + "text": "Wait, 6 hours? That's a really long delay. Do you think we should check if there's any earlier flight available?", + "original_text": "Wait, 6 hours? That's a really long delay. Do you think we should check if there's any earlier flight available?", + "start_time": 5.793378684807256, + "end_time": 12.30657596371882, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/temp/line_1_B.wav", + "silence_duration": 0.3037767954168312, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I doubt there will be any, but it's worth a try. In the meantime, we could look for some seats in the quiet part of the terminal to take a nap.", + "original_text": "I doubt there will be any, but it's worth a try. In the meantime, we could look for some seats in the quiet part of the terminal to take a nap.", + "start_time": 15.89864065253987, + "end_time": 24.211384416712207, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/temp/line_2_A.wav", + "silence_duration": 0.4225408792972389, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Good idea. I am pretty tired. By the way, what time did you say the flight was rescheduled to?", + "original_text": "Good idea. I am pretty tired. By the way, what time did you say the flight was rescheduled to?", + "start_time": 24.6897232592622, + "end_time": 30.04192280574746, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/temp/line_3_B.wav", + "silence_duration": 0.4783388425499916, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "3:30 in the afternoon.", + "original_text": "3:30 in the afternoon.", + "start_time": 30.470631163778183, + "end_time": 32.699746810036686, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/temp/line_4_A.wav", + "silence_duration": 0.42870835803072205, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. Let's hope there are some comfy seats available.", + "original_text": "Got it. Let's hope there are some comfy seats available.", + "start_time": 33.00238898470098, + "end_time": 36.03259306633363, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--431/temp/line_5_B.wav", + "silence_duration": 0.30264217466429383, + "is_interrupted": false + } + ] + }, + "DialogSum--val--432": { + "original_text": "A: May I help you? \nB: Yes. I'm looking for a green dress. \nA: What size do you wear? These dresses are on [interrupt] sale right now, so you might find a good deal, especially since we just got a fresh shipment of new styles that would complement your preferences perfectly. \nB: Oh, sorry to interrupt, but do you have any recommendations for something that would be good for a formal event? \nA: Absolutely! We have a few options that would be perfect for that. But first, what size did you say you wear? \nB: I wear size 32. This one looks nice. Where may I try it on? \nA: Come this way. Here's the dressing room. \nB: How does it look? \nA: It looks nice. And it's not expensive. \nB: How much is it? \nA: It's only $20. \nB: I'll take it.", + "cleaned_text": "A: May I help you? \nB: Yes. I'm looking for a green dress. \nA:What size do you wear? These dresses are on sale right now, so you might find a good deal, especially since we just got a fresh shipment of new styles that would complement your preferences perfectly.\nB: Oh, sorry to interrupt, but do you have any recommendations for something that would be good for a formal event? \nA: Absolutely! We have a few options that would be perfect for that. But first, what size did you say you wear? \nB: I wear size 32. This one looks nice. Where may I try it on? \nA: Come this way. Here's the dressing room. \nB: How does it look? \nA: It looks nice. And it's not expensive. \nB: How much is it? \nA: It's only $20. \nB: I'll take it.", + "total_duration": 39.00784580498866, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I help you?", + "original_text": "May I help you?", + "start_time": 0, + "end_time": 0.9984580498866213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. I'm looking for a green dress.", + "original_text": "Yes. I'm looking for a green dress.", + "start_time": 1.4894219031906608, + "end_time": 3.463118048315377, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_1_B.wav", + "silence_duration": 0.4909638533040394, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What size do you wear? These dresses are on", + "original_text": "What size do you wear? These dresses are on [interrupt] sale right now, so you might find a good deal, especially since we just got a fresh shipment of new styles that would complement your preferences perfectly.", + "start_time": 4.057424200181631, + "end_time": 15.214612408798413, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_2_A.wav", + "silence_duration": 0.594306151866254, + "is_interrupted": true, + "text_after_interrupt": "sale right now, so you might find a good deal, especially since we just got a fresh shipment of new styles that would complement your preferences perfectly." + }, + { + "speaker": "B", + "text": "Oh, sorry to interrupt, but do you have any recommendations for something that would be good for a formal event?", + "original_text": "Oh, sorry to interrupt, but do you have any recommendations for something that would be good for a formal event?", + "start_time": 6.774158894059182, + "end_time": 12.64880742013628, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_3_B.wav", + "silence_duration": 0.4304748188609322, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely! We have a few options that would be perfect for that. But first, what size did you say you wear?", + "original_text": "Absolutely! We have a few options that would be perfect for that. But first, what size did you say you wear?", + "start_time": 15.703128345101204, + "end_time": 22.5530149664164, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_4_A.wav", + "silence_duration": 0.488515936302791, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I wear size 32. This one looks nice. Where may I try it on?", + "original_text": "I wear size 32. This one looks nice. Where may I try it on?", + "start_time": 22.861088916522498, + "end_time": 26.738821342826352, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_5_B.wav", + "silence_duration": 0.3080739501060999, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Come this way. Here's the dressing room.", + "original_text": "Come this way. Here's the dressing room.", + "start_time": 27.152247626319387, + "end_time": 29.903812252169725, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_6_A.wav", + "silence_duration": 0.4134262834930336, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How does it look?", + "original_text": "How does it look?", + "start_time": 30.472105248209747, + "end_time": 31.40090343415079, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_7_B.wav", + "silence_duration": 0.5682929960400216, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It looks nice. And it's not expensive.", + "original_text": "It looks nice. And it's not expensive.", + "start_time": 31.899328278573332, + "end_time": 34.349033493992835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_8_A.wav", + "silence_duration": 0.49842484442254026, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How much is it?", + "original_text": "How much is it?", + "start_time": 34.76786537140762, + "end_time": 35.603783738754565, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_9_B.wav", + "silence_duration": 0.41883187741479033, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's only $20.", + "original_text": "It's only $20.", + "start_time": 36.19470639249968, + "end_time": 37.912983036490616, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_10_A.wav", + "silence_duration": 0.5909226537451202, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll take it.", + "original_text": "I'll take it.", + "start_time": 38.311290818667054, + "end_time": 39.00788945812283, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--432/temp/line_11_B.wav", + "silence_duration": 0.39830778217644003, + "is_interrupted": false + } + ] + }, + "DialogSum--val--433": { + "original_text": "A: Can I help you, sir? \nB: I want to find a book called *Gone with the Wind*. But I can't find [interrupt] the section where it might be located, even though I've searched through the fiction and classic literature aisles several times already. \nA: Let me give you a hand. The author is... \nB: Margaret Mitchell. \nA: Oh, yes. Here it is. \nB: Thank you very much. I have been looking for it for a long time. Is this the only copy you have in stock? \nA: Is this the latest edition? Yes, we have both the paperback and hardcover. Which would you want to buy? \nB: How about the price of the hardcover? \nA: It's $25. \nB: A little bit expensive, but I will buy one. This is $25, here you are.", + "cleaned_text": "A: Can I help you, sir? \nB:I want to find a book called *Gone with the Wind*. But I can't find the section where it might be located, even though I've searched through the fiction and classic literature aisles several times already.\nA: Let me give you a hand. The author is... \nB: Margaret Mitchell. \nA: Oh, yes. Here it is. \nB: Thank you very much. I have been looking for it for a long time. Is this the only copy you have in stock? \nA: Is this the latest edition? Yes, we have both the paperback and hardcover. Which would you want to buy? \nB: How about the price of the hardcover? \nA: It's $25. \nB: A little bit expensive, but I will buy one. This is $25, here you are.", + "total_duration": 36.93818594104308, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can I help you, sir?", + "original_text": "Can I help you, sir?", + "start_time": 0, + "end_time": 1.1377777777777778, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I want to find a book called *Gone with the Wind*. But I can't find", + "original_text": "I want to find a book called *Gone with the Wind*. But I can't find [interrupt] the section where it might be located, even though I've searched through the fiction and classic literature aisles several times already.", + "start_time": 1.6924019275029485, + "end_time": 11.688592403693423, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_1_B.wav", + "silence_duration": 0.5546241497251706, + "is_interrupted": true, + "text_after_interrupt": "the section where it might be located, even though I've searched through the fiction and classic literature aisles several times already." + }, + { + "speaker": "A", + "text": "Let me give you a hand. The author is...", + "original_text": "Let me give you a hand. The author is...", + "start_time": 6.0113134921287985, + "end_time": 8.809318027276191, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_2_A.wav", + "silence_duration": 0.5833632963816505, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Margaret Mitchell.", + "original_text": "Margaret Mitchell.", + "start_time": 12.21599188544236, + "end_time": 13.086740184762087, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_3_B.wav", + "silence_duration": 0.5273994817489366, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, yes. Here it is.", + "original_text": "Oh, yes. Here it is.", + "start_time": 13.655283060820263, + "end_time": 15.303899840865615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_4_A.wav", + "silence_duration": 0.5685428760581763, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you very much. I have been looking for it for a long time. Is this the only copy you have in stock?", + "original_text": "Thank you very much. I have been looking for it for a long time. Is this the only copy you have in stock?", + "start_time": 15.696000181818178, + "end_time": 21.01336979633065, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_5_B.wav", + "silence_duration": 0.3921003409525635, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Is this the latest edition? Yes, we have both the paperback and hardcover. Which would you want to buy?", + "original_text": "Is this the latest edition? Yes, we have both the paperback and hardcover. Which would you want to buy?", + "start_time": 21.54276706953064, + "end_time": 27.99791446182089, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_6_A.wav", + "silence_duration": 0.529397273199989, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How about the price of the hardcover?", + "original_text": "How about the price of the hardcover?", + "start_time": 28.386269774683107, + "end_time": 30.301916033186508, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_7_B.wav", + "silence_duration": 0.3883553128622179, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's $25.", + "original_text": "It's $25.", + "start_time": 30.745725509942183, + "end_time": 32.41756224463606, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_8_A.wav", + "silence_duration": 0.4438094767556744, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "A little bit expensive, but I will buy one. This is $25, here you are.", + "original_text": "A little bit expensive, but I will buy one. This is $25, here you are.", + "start_time": 32.74701381345337, + "end_time": 36.93821562751233, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--433/temp/line_9_B.wav", + "silence_duration": 0.3294515688173114, + "is_interrupted": false + } + ] + }, + "DialogSum--val--434": { + "original_text": "A: Excuse me, Sir, do you know what time it is? \nB: Oh, it's almost eleven twenty, to be exact. \nA: Eleven twenty? Thank you. \nB: You're welcome. The rain is quite heavy, isn't it? \nA: Yeah. I was in a hurry and I forgot my umbrella today. \nB: I have one. We could share it. Which way are you go[interrupt]ing? I'm heading towards the city center myself and would be happy to accompany you part of the way if our directions align. \nA: Oh, that's very kind of you. I am going to the Garden Hotel. \nB: I was about to say, which way are you going? But it seems we're heading to the same place. I'm going to the Garden Hotel, too. We can walk together.", + "cleaned_text": "A: Excuse me, Sir, do you know what time it is? \nB: Oh, it's almost eleven twenty, to be exact. \nA: Eleven twenty? Thank you. \nB: You're welcome. The rain is quite heavy, isn't it? \nA: Yeah. I was in a hurry and I forgot my umbrella today. \nB:I have one. We could share it. Which way are you go ing? I'm heading towards the city center myself and would be happy to accompany you part of the way if our directions align.\nA: Oh, that's very kind of you. I am going to the Garden Hotel. \nB: I was about to say, which way are you going? But it seems we're heading to the same place. I'm going to the Garden Hotel, too. We can walk together.", + "total_duration": 32.07823129251701, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, Sir, do you know what time it is?", + "original_text": "Excuse me, Sir, do you know what time it is?", + "start_time": 0, + "end_time": 2.7980045351473923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, it's almost eleven twenty, to be exact.", + "original_text": "Oh, it's almost eleven twenty, to be exact.", + "start_time": 3.213072876713848, + "end_time": 5.685998046781876, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_1_B.wav", + "silence_duration": 0.4150683415664556, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Eleven twenty? Thank you.", + "original_text": "Eleven twenty? Thank you.", + "start_time": 6.000411902537315, + "end_time": 8.299187412741396, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_2_A.wav", + "silence_duration": 0.31441385575543934, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You're welcome. The rain is quite heavy, isn't it?", + "original_text": "You're welcome. The rain is quite heavy, isn't it?", + "start_time": 8.601784225990468, + "end_time": 11.179199191976862, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_3_B.wav", + "silence_duration": 0.3025968132490718, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah. I was in a hurry and I forgot my umbrella today.", + "original_text": "Yeah. I was in a hurry and I forgot my umbrella today.", + "start_time": 11.688103771387226, + "end_time": 15.48456635642124, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_4_A.wav", + "silence_duration": 0.5089045794103653, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have one. We could share it. Which way are you go", + "original_text": "I have one. We could share it. Which way are you go[interrupt]ing? I'm heading towards the city center myself and would be happy to accompany you part of the way if our directions align.", + "start_time": 15.939455248147478, + "end_time": 24.69337815064181, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_5_B.wav", + "silence_duration": 0.4548888917262379, + "is_interrupted": true, + "text_after_interrupt": "ing? I'm heading towards the city center myself and would be happy to accompany you part of the way if our directions align." + }, + { + "speaker": "A", + "text": "Oh, that's very kind of you. I am going to the Garden Hotel.", + "original_text": "Oh, that's very kind of you. I am going to the Garden Hotel.", + "start_time": 19.596598105290337, + "end_time": 23.485940508918453, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_6_A.wav", + "silence_duration": 0.3653005995083607, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was about to say, which way are you going? But it seems we're heading to the same place. I'm going to the Garden Hotel, too. We can walk together.", + "original_text": "I was about to say, which way are you going? But it seems we're heading to the same place. I'm going to the Garden Hotel, too. We can walk together.", + "start_time": 25.100671419550114, + "end_time": 32.0782677914322, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--434/temp/line_7_B.wav", + "silence_duration": 0.407293268908306, + "is_interrupted": false + } + ] + }, + "DialogSum--val--435": { + "original_text": "A: Hi Mary, how's it going? \nB: Well, last night I had a big argument with Ann. \nA: Terrible. It must be something serious. You two are such close friends. \nB: Now that I look back at it, it wasn't that big a deal. I shouldn't have [interrupt] overreacted the way I did, especially since Ann has always been there for me through thick and thin and this was just a minor scheduling conflict. \nA: Sorry to jump in, but I'm really curious—what exactly happened between you two? \nB: It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere, she called me up, said her boyfriend had made plans and that she needed to cancel the trip. I was so angry when she told me that I said she didn't care about our friendship at all. \nA: That's pretty harsh. But wait, you were saying earlier that you shouldn't have... what? \nB: Oh, right—I shouldn't have lost my temper. I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says? \nA: You know she probably feels just as bad. \nB: Well, I think I was being a little selfish myself. I know they don't get to see each other very often. \nA: Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want. \nB: Yeah, I'll call later to patch things up.", + "cleaned_text": "A: Hi Mary, how's it going? \nB: Well, last night I had a big argument with Ann. \nA: Terrible. It must be something serious. You two are such close friends. \nB:Now that I look back at it, it wasn't that big a deal. I shouldn't have overreacted the way I did, especially since Ann has always been there for me through thick and thin and this was just a minor scheduling conflict.\nA: Sorry to jump in, but I'm really curious—what exactly happened between you two? \nB: It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere, she called me up, said her boyfriend had made plans and that she needed to cancel the trip. I was so angry when she told me that I said she didn't care about our friendship at all. \nA: That's pretty harsh. But wait, you were saying earlier that you shouldn't have... what? \nB: Oh, right—I shouldn't have lost my temper. I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says? \nA: You know she probably feels just as bad. \nB: Well, I think I was being a little selfish myself. I know they don't get to see each other very often. \nA: Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want. \nB: Yeah, I'll call later to patch things up.", + "total_duration": 73.30848072562358, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi Mary, how's it going?", + "original_text": "Hi Mary, how's it going?", + "start_time": 0, + "end_time": 1.6950566893424037, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, last night I had a big argument with Ann.", + "original_text": "Well, last night I had a big argument with Ann.", + "start_time": 2.005755400640381, + "end_time": 4.757320026490721, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_1_B.wav", + "silence_duration": 0.3106987112979772, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Terrible. It must be something serious. You two are such close friends.", + "original_text": "Terrible. It must be something serious. You two are such close friends.", + "start_time": 5.22116376197726, + "end_time": 9.992864442249369, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_2_A.wav", + "silence_duration": 0.4638437354865389, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Now that I look back at it, it wasn't that big a deal. I shouldn't have", + "original_text": "Now that I look back at it, it wasn't that big a deal. I shouldn't have [interrupt] overreacted the way I did, especially since Ann has always been there for me through thick and thin and this was just a minor scheduling conflict.", + "start_time": 10.591497714654905, + "end_time": 21.121747147761482, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_3_B.wav", + "silence_duration": 0.5986332724055361, + "is_interrupted": true, + "text_after_interrupt": "overreacted the way I did, especially since Ann has always been there for me through thick and thin and this was just a minor scheduling conflict." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I'm really curious—what exactly happened between you two?", + "original_text": "Sorry to jump in, but I'm really curious—what exactly happened between you two?", + "start_time": 14.248640571797761, + "end_time": 19.62406007293155, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_4_A.wav", + "silence_duration": 0.5202904976223656, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere, she called me up, said her boyfriend had made plans and that she needed to cancel the trip. I was so angry when she told me that I said she didn't care about our friendship at all.", + "original_text": "It's just we've been planning to go to the beach for a while, and we decided we could both make it this weekend. Then out of nowhere, she called me up, said her boyfriend had made plans and that she needed to cancel the trip. I was so angry when she told me that I said she didn't care about our friendship at all.", + "start_time": 21.433670009071243, + "end_time": 36.21317114285809, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_5_B.wav", + "silence_duration": 0.3119228613097595, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's pretty harsh. But wait, you were saying earlier that you shouldn't have... what?", + "original_text": "That's pretty harsh. But wait, you were saying earlier that you shouldn't have... what?", + "start_time": 36.731188732637634, + "end_time": 42.06016832447437, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_6_A.wav", + "silence_duration": 0.5180175897795466, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right—I shouldn't have lost my temper. I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says?", + "original_text": "Oh, right—I shouldn't have lost my temper. I know, but I was so upset. I mean, come on! Does she have to do everything her boyfriend says?", + "start_time": 42.434545633284664, + "end_time": 50.24806037251369, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_7_B.wav", + "silence_duration": 0.37437730881029474, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You know she probably feels just as bad.", + "original_text": "You know she probably feels just as bad.", + "start_time": 50.84604475078863, + "end_time": 53.342189875505184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_8_A.wav", + "silence_duration": 0.5979843782749388, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I think I was being a little selfish myself. I know they don't get to see each other very often.", + "original_text": "Well, I think I was being a little selfish myself. I know they don't get to see each other very often.", + "start_time": 53.754018053467114, + "end_time": 58.76952825754874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_9_B.wav", + "silence_duration": 0.41182817796192733, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want.", + "original_text": "Well, in that case, I guess maybe you can be more understanding. You shouldn't let a trivial thing like this stand in the way of your friendship. After all, you can go to the beach anytime you want.", + "start_time": 59.28575533454957, + "end_time": 70.64031315767882, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_10_A.wav", + "silence_duration": 0.5162270770008299, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I'll call later to patch things up.", + "original_text": "Yeah, I'll call later to patch things up.", + "start_time": 71.0097165743849, + "end_time": 73.30849208458898, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--435/temp/line_11_B.wav", + "silence_duration": 0.3694034167060738, + "is_interrupted": false + } + ] + }, + "DialogSum--val--437": { + "original_text": "A: Lieb! How are you doing these days? I've been meaning to catch up with you about [interrupt] all the exciting things happening in your life, especially now that you've got a new furry friend to take care of!\nB: Hi! I am busy with my new cat. Do you want to see a picture of [interrupt] her? She's really cute and loves to play around the house, always chasing after toys and climbing on furniture like a little acrobat.\nA: Wait, you have a new cat? When did you get her? I'm so surprised and excited to hear about this new addition to your family!\nB: I got her last week. She's only 3 months old. Do you want to see a picture of her? I've taken so many already because she's just too adorable not to photograph constantly.\nA: Yes, please! Show me the pictures! I can't wait to see your little bundle of joy and hear all about her personality and habits.", + "cleaned_text": "A:Lieb! How are you doing these days? I've been meaning to catch up with you about all the exciting things happening in your life, especially now that you've got a new furry friend to take care of!\nB:Hi! I am busy with my new cat. Do you want to see a picture of her? She's really cute and loves to play around the house, always chasing after toys and climbing on furniture like a little acrobat.\nA: Wait, you have a new cat? When did you get her? I'm so surprised and excited to hear about this new addition to your family!\nB: I got her last week. She's only 3 months old. Do you want to see a picture of her? I've taken so many already because she's just too adorable not to photograph constantly.\nA: Yes, please! Show me the pictures! I can't wait to see your little bundle of joy and hear all about her personality and habits.", + "total_duration": 42.08185941043084, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Lieb! How are you doing these days? I've been meaning to catch up with you about", + "original_text": "Lieb! How are you doing these days? I've been meaning to catch up with you about [interrupt] all the exciting things happening in your life, especially now that you've got a new furry friend to take care of!", + "start_time": 0, + "end_time": 11.319727891156463, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "all the exciting things happening in your life, especially now that you've got a new furry friend to take care of!" + }, + { + "speaker": "B", + "text": "Hi! I am busy with my new cat. Do you want to see a picture of", + "original_text": "Hi! I am busy with my new cat. Do you want to see a picture of [interrupt] her? She's really cute and loves to play around the house, always chasing after toys and climbing on furniture like a little acrobat.", + "start_time": 5.073560090702948, + "end_time": 15.290340136054422, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/temp/line_1_B.wav", + "silence_duration": 0.5334000204668385, + "is_interrupted": true, + "text_after_interrupt": "her? She's really cute and loves to play around the house, always chasing after toys and climbing on furniture like a little acrobat." + }, + { + "speaker": "A", + "text": "Wait, you have a new cat? When did you get her? I'm so surprised and excited to hear about this new addition to your family!", + "original_text": "Wait, you have a new cat? When did you get her? I'm so surprised and excited to hear about this new addition to your family!", + "start_time": 16.404239022734412, + "end_time": 23.741744691668654, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/temp/line_2_A.wav", + "silence_duration": 0.522573752232159, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I got her last week. She's only 3 months old. Do you want to see a picture of her? I've taken so many already because she's just too adorable not to photograph constantly.", + "original_text": "I got her last week. She's only 3 months old. Do you want to see a picture of her? I've taken so many already because she's just too adorable not to photograph constantly.", + "start_time": 24.223207658641243, + "end_time": 33.72016910988841, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/temp/line_3_B.wav", + "silence_duration": 0.48146296697258817, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, please! Show me the pictures! I can't wait to see your little bundle of joy and hear all about her personality and habits.", + "original_text": "Yes, please! Show me the pictures! I can't wait to see your little bundle of joy and hear all about her personality and habits.", + "start_time": 34.22191723836943, + "end_time": 42.081871886895506, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--437/temp/line_4_A.wav", + "silence_duration": 0.501748128481019, + "is_interrupted": false + } + ] + }, + "DialogSum--val--439": { + "original_text": "A: I heard Rose is pregnant. I hope it'll be a boy this time.\nB: I hope so, too. Rose and her husband have been wanting a boy so much.\nA: After three baby girls in a row, Rose is under a lot of pressure from her in-laws. They want a boy in the worst way [interrupt] and they've even started suggesting names for a future grandson while redecorating the nursery in blue and buying all sorts of boy's clothes in advance.\nB: I completely understand the pressure, but don't you think it's unfair? Baby girls are just as good and just as fun as baby boys.\nA: Absolutely, but I was going to say that Rose is feeling the pressure even more because her in-laws keep reminding her about it. It's really starting to take a toll on her.", + "cleaned_text": "A: I heard Rose is pregnant. I hope it'll be a boy this time.\nB: I hope so, too. Rose and her husband have been wanting a boy so much.\nA:After three baby girls in a row, Rose is under a lot of pressure from her in-laws. They want a boy in the worst way and they've even started suggesting names for a future grandson while redecorating the nursery in blue and buying all sorts of boy's clothes in advance.\nB: I completely understand the pressure, but don't you think it's unfair? Baby girls are just as good and just as fun as baby boys.\nA: Absolutely, but I was going to say that Rose is feeling the pressure even more because her in-laws keep reminding her about it. It's really starting to take a toll on her.", + "total_duration": 35.34689342403628, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I heard Rose is pregnant. I hope it'll be a boy this time.", + "original_text": "I heard Rose is pregnant. I hope it'll be a boy this time.", + "start_time": 0, + "end_time": 3.599092970521542, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I hope so, too. Rose and her husband have been wanting a boy so much.", + "original_text": "I hope so, too. Rose and her husband have been wanting a boy so much.", + "start_time": 4.131053171076681, + "end_time": 7.648876300328382, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/temp/line_1_B.wav", + "silence_duration": 0.531960200555139, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "After three baby girls in a row, Rose is under a lot of pressure from her in-laws. They want a boy in the worst way", + "original_text": "After three baby girls in a row, Rose is under a lot of pressure from her in-laws. They want a boy in the worst way [interrupt] and they've even started suggesting names for a future grandson while redecorating the nursery in blue and buying all sorts of boy's clothes in advance.", + "start_time": 8.022318687972547, + "end_time": 24.752296012235586, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/temp/line_2_A.wav", + "silence_duration": 0.3734423876441637, + "is_interrupted": true, + "text_after_interrupt": "and they've even started suggesting names for a future grandson while redecorating the nursery in blue and buying all sorts of boy's clothes in advance." + }, + { + "speaker": "B", + "text": "I completely understand the pressure, but don't you think it's unfair? Baby girls are just as good and just as fun as baby boys.", + "original_text": "I completely understand the pressure, but don't you think it's unfair? Baby girls are just as good and just as fun as baby boys.", + "start_time": 15.441094198176629, + "end_time": 22.51157038865282, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/temp/line_3_B.wav", + "silence_duration": 0.37490949474748536, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely, but I was going to say that Rose is feeling the pressure even more because her in-laws keep reminding her about it. It's really starting to take a toll on her.", + "original_text": "Absolutely, but I was going to say that Rose is feeling the pressure even more because her in-laws keep reminding her about it. It's really starting to take a toll on her.", + "start_time": 25.23462462901817, + "end_time": 35.34691487845128, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--439/temp/line_4_A.wav", + "silence_duration": 0.4823286167825859, + "is_interrupted": false + } + ] + }, + "DialogSum--val--440": { + "original_text": "A: My friend finally dumped her boyfriend, and she's sworn she's going to abstain until she finds the right man to marry.\nB: After going through an episode like that I'm not surprised. How's her headspace?\nA: She's doing great, she's getting her confidence back, and her self-esteem has improved drastically. She's very [interrupt] focused on her personal growth right now and is really enjoying her independence while exploring new hobbies and rediscovering old passions she'd neglected during the relationship.\nB: That's so good to hear! By the way, have you noticed any changes in how she's interacting with people now?\nA: Absolutely, she's much more outgoing and positive. But I was going to say she's very happy. Anyway, I'm proud of you for standing by her. I think you've helped make a big difference in her life.\nB: Thanks, but I think you were the real rock for her. Do you have any plans for next Sunday evening?\nA: No, why?\nB: My friend, who had the mishap, wants to take us to dinner to show her gratitude for helping her.\nA: She doesn't need to do that, I didn't do anything.", + "cleaned_text": "A: My friend finally dumped her boyfriend, and she's sworn she's going to abstain until she finds the right man to marry.\nB: After going through an episode like that I'm not surprised. How's her headspace?\nA:She's doing great, she's getting her confidence back, and her self-esteem has improved drastically. She's very focused on her personal growth right now and is really enjoying her independence while exploring new hobbies and rediscovering old passions she'd neglected during the relationship.\nB: That's so good to hear! By the way, have you noticed any changes in how she's interacting with people now?\nA: Absolutely, she's much more outgoing and positive. But I was going to say she's very happy. Anyway, I'm proud of you for standing by her. I think you've helped make a big difference in her life.\nB: Thanks, but I think you were the real rock for her. Do you have any plans for next Sunday evening?\nA: No, why?\nB: My friend, who had the mishap, wants to take us to dinner to show her gratitude for helping her.\nA: She doesn't need to do that, I didn't do anything.", + "total_duration": 55.06226757369615, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "My friend finally dumped her boyfriend, and she's sworn she's going to abstain until she finds the right man to marry.", + "original_text": "My friend finally dumped her boyfriend, and she's sworn she's going to abstain until she finds the right man to marry.", + "start_time": 0, + "end_time": 6.130068027210885, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "After going through an episode like that I'm not surprised. How's her headspace?", + "original_text": "After going through an episode like that I'm not surprised. How's her headspace?", + "start_time": 6.60574362455086, + "end_time": 11.017535007770814, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_1_B.wav", + "silence_duration": 0.47567559733997566, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "She's doing great, she's getting her confidence back, and her self-esteem has improved drastically. She's very", + "original_text": "She's doing great, she's getting her confidence back, and her self-esteem has improved drastically. She's very [interrupt] focused on her personal growth right now and is really enjoying her independence while exploring new hobbies and rediscovering old passions she'd neglected during the relationship.", + "start_time": 11.503340444728735, + "end_time": 27.559939084184517, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_2_A.wav", + "silence_duration": 0.4858054369579211, + "is_interrupted": true, + "text_after_interrupt": "focused on her personal growth right now and is really enjoying her independence while exploring new hobbies and rediscovering old passions she'd neglected during the relationship." + }, + { + "speaker": "B", + "text": "That's so good to hear! By the way, have you noticed any changes in how she's interacting with people now?", + "original_text": "That's so good to hear! By the way, have you noticed any changes in how she's interacting with people now?", + "start_time": 18.260347247449822, + "end_time": 23.008827973073405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_3_B.wav", + "silence_duration": 0.5795575032612207, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely, she's much more outgoing and positive. But I was going to say she's very happy. Anyway, I'm proud of you for standing by her. I think you've helped make a big difference in her life.", + "original_text": "Absolutely, she's much more outgoing and positive. But I was going to say she's very happy. Anyway, I'm proud of you for standing by her. I think you've helped make a big difference in her life.", + "start_time": 28.145756720820074, + "end_time": 40.05759345551395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_4_A.wav", + "silence_duration": 0.5858176366355581, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks, but I think you were the real rock for her. Do you have any plans for next Sunday evening?", + "original_text": "Thanks, but I think you were the real rock for her. Do you have any plans for next Sunday evening?", + "start_time": 40.54084903556672, + "end_time": 45.05713021470505, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_5_B.wav", + "silence_duration": 0.4832555800527667, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, why?", + "original_text": "No, why?", + "start_time": 45.431936752472716, + "end_time": 47.022503645896755, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_6_A.wav", + "silence_duration": 0.3748065377676714, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My friend, who had the mishap, wants to take us to dinner to show her gratitude for helping her.", + "original_text": "My friend, who had the mishap, wants to take us to dinner to show her gratitude for helping her.", + "start_time": 47.36676725039847, + "end_time": 51.63923890572727, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_7_B.wav", + "silence_duration": 0.3442636045017104, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "She doesn't need to do that, I didn't do anything.", + "original_text": "She doesn't need to do that, I didn't do anything.", + "start_time": 52.12494727047995, + "end_time": 55.0622715335185, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--440/temp/line_8_A.wav", + "silence_duration": 0.4857083647526813, + "is_interrupted": false + } + ] + }, + "DialogSum--val--441": { + "original_text": "A: Susan has got the cancer of stomach.\nB: How terrible! This is quite unexpected!\nA: Yesterday when I went to hospital to see her, you cannot imagine how greatly surprised when I [interrupt] saw how much weight she had lost and how pale she looked compared to just a month ago when we last met for coffee. It was absolutely heartbreaking to see such a drastic change in her appearance.\nB: Sorry to cut in, but do you know how long she's been dealing with this? I mean, was it diagnosed recently, or has she been hiding it?\nA: It was diagnosed recently, just a few weeks ago. But what I was saying earlier—when I saw her, I was shocked because she looked so frail. What happened?", + "cleaned_text": "A: Susan has got the cancer of stomach.\nB: How terrible! This is quite unexpected!\nA:Yesterday when I went to hospital to see her, you cannot imagine how greatly surprised when I saw how much weight she had lost and how pale she looked compared to just a month ago when we last met for coffee. It was absolutely heartbreaking to see such a drastic change in her appearance.\nB: Sorry to cut in, but do you know how long she's been dealing with this? I mean, was it diagnosed recently, or has she been hiding it?\nA: It was diagnosed recently, just a few weeks ago. But what I was saying earlier—when I saw her, I was shocked because she looked so frail. What happened?", + "total_duration": 32.51238095238095, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Susan has got the cancer of stomach.", + "original_text": "Susan has got the cancer of stomach.", + "start_time": 0, + "end_time": 2.3103854875283445, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How terrible! This is quite unexpected!", + "original_text": "How terrible! This is quite unexpected!", + "start_time": 2.8773882481897064, + "end_time": 5.176163758393788, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/temp/line_1_B.wav", + "silence_duration": 0.567002760661362, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yesterday when I went to hospital to see her, you cannot imagine how greatly surprised when I", + "original_text": "Yesterday when I went to hospital to see her, you cannot imagine how greatly surprised when I [interrupt] saw how much weight she had lost and how pale she looked compared to just a month ago when we last met for coffee. It was absolutely heartbreaking to see such a drastic change in her appearance.", + "start_time": 5.565087407522783, + "end_time": 22.817513711377657, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/temp/line_2_A.wav", + "silence_duration": 0.3889236491289954, + "is_interrupted": true, + "text_after_interrupt": "saw how much weight she had lost and how pale she looked compared to just a month ago when we last met for coffee. It was absolutely heartbreaking to see such a drastic change in her appearance." + }, + { + "speaker": "B", + "text": "Sorry to cut in, but do you know how long she's been dealing with this? I mean, was it diagnosed recently, or has she been hiding it?", + "original_text": "Sorry to cut in, but do you know how long she's been dealing with this? I mean, was it diagnosed recently, or has she been hiding it?", + "start_time": 11.462955888248406, + "end_time": 19.07910101296496, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/temp/line_3_B.wav", + "silence_duration": 0.5992061175240706, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It was diagnosed recently, just a few weeks ago. But what I was saying earlier—when I saw her, I was shocked because she looked so frail. What happened?", + "original_text": "It was diagnosed recently, just a few weeks ago. But what I was saying earlier—when I saw her, I was shocked because she looked so frail. What happened?", + "start_time": 23.212825478259607, + "end_time": 32.5124173149943, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--441/temp/line_4_A.wav", + "silence_duration": 0.3953117668819507, + "is_interrupted": false + } + ] + }, + "DialogSum--val--442": { + "original_text": "A: The sun is up! Time for all the campers to rise. Time to get paddling.\nB: Oh, no! No more paddling! My arms are sore!\nA: Do not worry. Today will be easier.\nB: Beth, what date is today?\nA: Today is Saturday.\nB: What is the date today?\nA: Today is July 4th.\nB: Oh, I almost forgot. Today is my mom's [interrupt] birthday, and I was planning to call her later to wish her well and maybe even send her some photos from our camping trip.\nA: Wait, today is July 4th? That means it's Independence Day! Are there any special events planned here at the camp?\nB: Oh, I'm not sure about any events, but I was just about to say that today is my mom's birthday. I should call her.\nA: Call her on my cell phone. Wish her 'Happy Birthday!' Tell her you are out exploring the great American wilderness. Tell her I said she is lucky to be born on Independence Day.\nB: Thanks! I will do that! When is your birthday?\nA: It is December 25th.\nB: Wow! What a lucky girl! Your birthday is on Christmas Day.", + "cleaned_text": "A: The sun is up! Time for all the campers to rise. Time to get paddling.\nB: Oh, no! No more paddling! My arms are sore!\nA: Do not worry. Today will be easier.\nB: Beth, what date is today?\nA: Today is Saturday.\nB: What is the date today?\nA: Today is July 4th.\nB:Oh, I almost forgot. Today is my mom's birthday, and I was planning to call her later to wish her well and maybe even send her some photos from our camping trip.\nA: Wait, today is July 4th? That means it's Independence Day! Are there any special events planned here at the camp?\nB: Oh, I'm not sure about any events, but I was just about to say that today is my mom's birthday. I should call her.\nA: Call her on my cell phone. Wish her 'Happy Birthday!' Tell her you are out exploring the great American wilderness. Tell her I said she is lucky to be born on Independence Day.\nB: Thanks! I will do that! When is your birthday?\nA: It is December 25th.\nB: Wow! What a lucky girl! Your birthday is on Christmas Day.", + "total_duration": 55.77269841269841, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "The sun is up! Time for all the campers to rise. Time to get paddling.", + "original_text": "The sun is up! Time for all the campers to rise. Time to get paddling.", + "start_time": 0, + "end_time": 4.574331065759637, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, no! No more paddling! My arms are sore!", + "original_text": "Oh, no! No more paddling! My arms are sore!", + "start_time": 5.051855709221152, + "end_time": 7.9891799722597, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_1_B.wav", + "silence_duration": 0.4775246434615152, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do not worry. Today will be easier.", + "original_text": "Do not worry. Today will be easier.", + "start_time": 8.445956713341278, + "end_time": 11.104641520597514, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_2_A.wav", + "silence_duration": 0.456776741081578, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Beth, what date is today?", + "original_text": "Beth, what date is today?", + "start_time": 11.424652324344144, + "end_time": 13.073269104389496, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_3_B.wav", + "silence_duration": 0.32001080374662993, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Today is Saturday.", + "original_text": "Today is Saturday.", + "start_time": 13.619755958228344, + "end_time": 15.071003123761225, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_4_A.wav", + "silence_duration": 0.5464868538388485, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What is the date today?", + "original_text": "What is the date today?", + "start_time": 15.446456677906765, + "end_time": 16.642284342305857, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_5_B.wav", + "silence_duration": 0.3754535541455397, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Today is July 4th.", + "original_text": "Today is July 4th.", + "start_time": 17.063074508430287, + "end_time": 18.897450925663847, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_6_A.wav", + "silence_duration": 0.4207901661244302, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I almost forgot. Today is my mom's", + "original_text": "Oh, I almost forgot. Today is my mom's [interrupt] birthday, and I was planning to call her later to wish her well and maybe even send her some photos from our camping trip.", + "start_time": 19.47392255536589, + "end_time": 27.368707135864753, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_7_B.wav", + "silence_duration": 0.5764716297020409, + "is_interrupted": true, + "text_after_interrupt": "birthday, and I was planning to call her later to wish her well and maybe even send her some photos from our camping trip." + }, + { + "speaker": "A", + "text": "Wait, today is July 4th? That means it's Independence Day! Are there any special events planned here at the camp?", + "original_text": "Wait, today is July 4th? That means it's Independence Day! Are there any special events planned here at the camp?", + "start_time": 22.55056654629559, + "end_time": 30.12027176171509, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_8_A.wav", + "silence_duration": 0.4920020364088197, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I'm not sure about any events, but I was just about to say that today is my mom's birthday. I should call her.", + "original_text": "Oh, I'm not sure about any events, but I was just about to say that today is my mom's birthday. I should call her.", + "start_time": 30.67362154878979, + "end_time": 36.432170301624254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_9_B.wav", + "silence_duration": 0.5533497870746983, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Call her on my cell phone. Wish her 'Happy Birthday!' Tell her you are out exploring the great American wilderness. Tell her I said she is lucky to be born on Independence Day.", + "original_text": "Call her on my cell phone. Wish her 'Happy Birthday!' Tell her you are out exploring the great American wilderness. Tell her I said she is lucky to be born on Independence Day.", + "start_time": 36.78159033527542, + "end_time": 47.311839768381994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_10_A.wav", + "silence_duration": 0.34942003365116064, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thanks! I will do that! When is your birthday?", + "original_text": "Thanks! I will do that! When is your birthday?", + "start_time": 47.65362817255946, + "end_time": 49.81308395487238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_11_B.wav", + "silence_duration": 0.3417884041774611, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It is December 25th.", + "original_text": "It is December 25th.", + "start_time": 50.237376824878766, + "end_time": 52.211072970003485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_12_A.wav", + "silence_duration": 0.42429287000638216, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wow! What a lucky girl! Your birthday is on Christmas Day.", + "original_text": "Wow! What a lucky girl! Your birthday is on Christmas Day.", + "start_time": 52.55677550352416, + "end_time": 55.77273922234502, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--442/temp/line_13_B.wav", + "silence_duration": 0.3457025335206749, + "is_interrupted": false + } + ] + }, + "DialogSum--val--443": { + "original_text": "A: May I have my bill, please? \nB: That's $20 in all. \nA: Well, I am afraid you have made a mistake. Would you check it [interrupt] I believe there's an error in the main course pricing because I distinctly remember it being listed at a lower price on the menu when I ordered. \nB: Oh, sorry to interrupt, but are you referring to the extra charge for the dessert? I just want to clarify before I check. \nA: No, it's not about the dessert. Could you check the entire bill again, please? \nB: Let me see. I am terribly sorry, sir. That should be $18.", + "cleaned_text": "A: May I have my bill, please? \nB: That's $20 in all. \nA:Well, I am afraid you have made a mistake. Would you check it I believe there's an error in the main course pricing because I distinctly remember it being listed at a lower price on the menu when I ordered.\nB: Oh, sorry to interrupt, but are you referring to the extra charge for the dessert? I just want to clarify before I check. \nA: No, it's not about the dessert. Could you check the entire bill again, please? \nB: Let me see. I am terribly sorry, sir. That should be $18.", + "total_duration": 26.209931972789114, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "May I have my bill, please?", + "original_text": "May I have my bill, please?", + "start_time": 0, + "end_time": 1.6718367346938776, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's $20 in all.", + "original_text": "That's $20 in all.", + "start_time": 2.1893776722742606, + "end_time": 3.826384474995349, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/temp/line_1_B.wav", + "silence_duration": 0.517540937580383, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I am afraid you have made a mistake. Would you check it", + "original_text": "Well, I am afraid you have made a mistake. Would you check it [interrupt] I believe there's an error in the main course pricing because I distinctly remember it being listed at a lower price on the menu when I ordered.", + "start_time": 4.421837973565429, + "end_time": 16.914173574472457, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/temp/line_2_A.wav", + "silence_duration": 0.5954534985700808, + "is_interrupted": true, + "text_after_interrupt": "I believe there's an error in the main course pricing because I distinctly remember it being listed at a lower price on the menu when I ordered." + }, + { + "speaker": "B", + "text": "Oh, sorry to interrupt, but are you referring to the extra charge for the dessert? I just want to clarify before I check.", + "original_text": "Oh, sorry to interrupt, but are you referring to the extra charge for the dessert? I just want to clarify before I check.", + "start_time": 7.9164411481686034, + "end_time": 14.975307361320532, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/temp/line_3_B.wav", + "silence_duration": 0.33640456510144356, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, it's not about the dessert. Could you check the entire bill again, please?", + "original_text": "No, it's not about the dessert. Could you check the entire bill again, please?", + "start_time": 17.492715188265933, + "end_time": 21.823236730216045, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/temp/line_4_A.wav", + "silence_duration": 0.5785416137934758, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let me see. I am terribly sorry, sir. That should be $18.", + "original_text": "Let me see. I am terribly sorry, sir. That should be $18.", + "start_time": 22.19288560949495, + "end_time": 26.20993776368996, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--443/temp/line_5_B.wav", + "silence_duration": 0.36964887927890605, + "is_interrupted": false + } + ] + }, + "DialogSum--val--444": { + "original_text": "A: Hi, Mary. You look pale today. What's the matter with [interrupt] you? Did you sleep well last night or have you been feeling unwell for a while now? You seem quite exhausted and I'm genuinely concerned about your wellbeing.\nB: Sorry to interrupt, but I just realized I have some cold medicine in my bag. Do you want to try that before heading to the doctor? It might help alleviate some of your symptoms while we figure out the best course of action.\nA: That's really kind of you, but I think I've caught a cold. Now I'm aching all over, so I might need something stronger. The pain is quite intense and I'm worried it might be developing into something more serious.\nB: Oh, I see. You'd better take some medicine and have a good rest. I hope you'll be yourself pretty soon. Maybe we should call your doctor right away to get professional advice about your condition.\nA: Thank you. I suppose I should go to see a doctor. By the way, what were you saying earlier about the medicine in your bag? I might reconsider trying it if you think it could provide some temporary relief before my appointment.", + "cleaned_text": "A:Hi, Mary. You look pale today. What's the matter with you? Did you sleep well last night or have you been feeling unwell for a while now? You seem quite exhausted and I'm genuinely concerned about your wellbeing.\nB: Sorry to interrupt, but I just realized I have some cold medicine in my bag. Do you want to try that before heading to the doctor? It might help alleviate some of your symptoms while we figure out the best course of action.\nA: That's really kind of you, but I think I've caught a cold. Now I'm aching all over, so I might need something stronger. The pain is quite intense and I'm worried it might be developing into something more serious.\nB: Oh, I see. You'd better take some medicine and have a good rest. I hope you'll be yourself pretty soon. Maybe we should call your doctor right away to get professional advice about your condition.\nA: Thank you. I suppose I should go to see a doctor. By the way, what were you saying earlier about the medicine in your bag? I might reconsider trying it if you think it could provide some temporary relief before my appointment.", + "total_duration": 53.14621315192744, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hi, Mary. You look pale today. What's the matter with", + "original_text": "Hi, Mary. You look pale today. What's the matter with [interrupt] you? Did you sleep well last night or have you been feeling unwell for a while now? You seem quite exhausted and I'm genuinely concerned about your wellbeing.", + "start_time": 0, + "end_time": 12.852244897959183, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "you? Did you sleep well last night or have you been feeling unwell for a while now? You seem quite exhausted and I'm genuinely concerned about your wellbeing." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but I just realized I have some cold medicine in my bag. Do you want to try that before heading to the doctor? It might help alleviate some of your symptoms while we figure out the best course of action.", + "original_text": "Sorry to interrupt, but I just realized I have some cold medicine in my bag. Do you want to try that before heading to the doctor? It might help alleviate some of your symptoms while we figure out the best course of action.", + "start_time": 3.7151927437641725, + "end_time": 14.373151927437641, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/temp/line_1_B.wav", + "silence_duration": 0.4859805309745354, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's really kind of you, but I think I've caught a cold. Now I'm aching all over, so I might need something stronger. The pain is quite intense and I'm worried it might be developing into something more serious.", + "original_text": "That's really kind of you, but I think I've caught a cold. Now I'm aching all over, so I might need something stronger. The pain is quite intense and I'm worried it might be developing into something more serious.", + "start_time": 14.746515816633243, + "end_time": 27.981889966293107, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/temp/line_2_A.wav", + "silence_duration": 0.37336388919560215, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I see. You'd better take some medicine and have a good rest. I hope you'll be yourself pretty soon. Maybe we should call your doctor right away to get professional advice about your condition.", + "original_text": "Oh, I see. You'd better take some medicine and have a good rest. I hope you'll be yourself pretty soon. Maybe we should call your doctor right away to get professional advice about your condition.", + "start_time": 28.566334926289095, + "end_time": 38.65540522107368, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/temp/line_3_B.wav", + "silence_duration": 0.5844449599959869, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you. I suppose I should go to see a doctor. By the way, what were you saying earlier about the medicine in your bag? I might reconsider trying it if you think it could provide some temporary relief before my appointment.", + "original_text": "Thank you. I suppose I should go to see a doctor. By the way, what were you saying earlier about the medicine in your bag? I might reconsider trying it if you think it could provide some temporary relief before my appointment.", + "start_time": 38.9936801501406, + "end_time": 53.146242508417245, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--444/temp/line_4_A.wav", + "silence_duration": 0.33827492906691625, + "is_interrupted": false + } + ] + }, + "DialogSum--val--445": { + "original_text": "A: Do you want to hear a funny joke? \nB: OK. Are you sure it's funny, though? \nA: Well, you'll see. \nB: OK. \nA: OK, an Englishman, a Scotsman, and an Irishman were going on a trip across the desert, and they could only take one thing with them. \nB: I see. \nA: So they met up at the start of the journey and showed each other their [interrupt] items they had chosen to bring for the journey, each convinced that their selection was the most practical and essential for surviving the harsh desert conditions ahead. \nB: Oh, that's funny! \nA: Hang on, I haven't finished yet. \nB: Oh, sorry. \nA: Well, as I was saying, they showed each other what they had decided to bring. The Englishman had brought some water. 'If we get thirsty, we'll have something to drink,' he said. The Scotsman brought a map. 'If we get lost, we'll be able to find our way.' The Irishman had brought a car door. \nB: A car door? You mean just one car door? \nA: Yes, just one. And when they asked him why, he said, 'So if it gets too hot, I can roll down the window!'", + "cleaned_text": "A: Do you want to hear a funny joke? \nB: OK. Are you sure it's funny, though? \nA: Well, you'll see. \nB: OK. \nA: OK, an Englishman, a Scotsman, and an Irishman were going on a trip across the desert, and they could only take one thing with them. \nB: I see. \nA:So they met up at the start of the journey and showed each other their items they had chosen to bring for the journey, each convinced that their selection was the most practical and essential for surviving the harsh desert conditions ahead.\nB: Oh, that's funny! \nA: Hang on, I haven't finished yet. \nB: Oh, sorry. \nA: Well, as I was saying, they showed each other what they had decided to bring. The Englishman had brought some water. 'If we get thirsty, we'll have something to drink,' he said. The Scotsman brought a map. 'If we get lost, we'll be able to find our way.' The Irishman had brought a car door. \nB: A car door? You mean just one car door? \nA: Yes, just one. And when they asked him why, he said, 'So if it gets too hot, I can roll down the window!'", + "total_duration": 62.557868480725624, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you want to hear a funny joke?", + "original_text": "Do you want to hear a funny joke?", + "start_time": 0, + "end_time": 1.811156462585034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. Are you sure it's funny, though?", + "original_text": "OK. Are you sure it's funny, though?", + "start_time": 2.296394186749996, + "end_time": 4.79253931146655, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_1_B.wav", + "silence_duration": 0.48523772416496225, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, you'll see.", + "original_text": "Well, you'll see.", + "start_time": 5.20963566912272, + "end_time": 6.405463333521814, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_2_A.wav", + "silence_duration": 0.4170963576561708, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK.", + "original_text": "OK.", + "start_time": 6.762827241442375, + "end_time": 7.494255812870946, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_3_B.wav", + "silence_duration": 0.35736390792056116, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK, an Englishman, a Scotsman, and an Irishman were going on a trip across the desert, and they could only take one thing with them.", + "original_text": "OK, an Englishman, a Scotsman, and an Irishman were going on a trip across the desert, and they could only take one thing with them.", + "start_time": 7.819048742812237, + "end_time": 15.655783436689788, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_4_A.wav", + "silence_duration": 0.3247929299412908, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see.", + "original_text": "I see.", + "start_time": 16.148103968449405, + "end_time": 17.3439316328485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_5_B.wav", + "silence_duration": 0.492320531759616, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So they met up at the start of the journey and showed each other their", + "original_text": "So they met up at the start of the journey and showed each other their [interrupt] items they had chosen to bring for the journey, each convinced that their selection was the most practical and essential for surviving the harsh desert conditions ahead.", + "start_time": 17.690441238102057, + "end_time": 30.00862717914514, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_6_A.wav", + "silence_duration": 0.3465096052535575, + "is_interrupted": true, + "text_after_interrupt": "items they had chosen to bring for the journey, each convinced that their selection was the most practical and essential for surviving the harsh desert conditions ahead." + }, + { + "speaker": "B", + "text": "Oh, that's funny!", + "original_text": "Oh, that's funny!", + "start_time": 21.962912893430854, + "end_time": 23.05425076191158, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_7_B.wav", + "silence_duration": 0.45763031237258184, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hang on, I haven't finished yet.", + "original_text": "Hang on, I haven't finished yet.", + "start_time": 30.47953095318925, + "end_time": 32.65059671282644, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_8_A.wav", + "silence_duration": 0.47090377404410877, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, sorry.", + "original_text": "Oh, sorry.", + "start_time": 33.21095808308097, + "end_time": 34.16297622367054, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_9_B.wav", + "silence_duration": 0.5603613702545245, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, as I was saying, they showed each other what they had decided to bring. The Englishman had brought some water. 'If we get thirsty, we'll have something to drink,' he said. The Scotsman brought a map. 'If we get lost, we'll be able to find our way.' The Irishman had brought a car door.", + "original_text": "Well, as I was saying, they showed each other what they had decided to bring. The Englishman had brought some water. 'If we get thirsty, we'll have something to drink,' he said. The Scotsman brought a map. 'If we get lost, we'll be able to find our way.' The Irishman had brought a car door.", + "start_time": 34.74454056587263, + "end_time": 51.7183274139452, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_10_A.wav", + "silence_duration": 0.5815643422020911, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "A car door? You mean just one car door?", + "original_text": "A car door? You mean just one car door?", + "start_time": 52.16067794182677, + "end_time": 54.87741263570432, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_11_B.wav", + "silence_duration": 0.44235052788157203, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, just one. And when they asked him why, he said, 'So if it gets too hot, I can roll down the window!'", + "original_text": "Yes, just one. And when they asked him why, he said, 'So if it gets too hot, I can roll down the window!'", + "start_time": 55.24361114802091, + "end_time": 62.55789686230663, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--445/temp/line_12_A.wav", + "silence_duration": 0.3661985123165943, + "is_interrupted": false + } + ] + }, + "DialogSum--val--446": { + "original_text": "A: I'm now at the airport to meet Mr. Dale, who is arriving at 3:00 PM. There will be some calls for me while I'm away. So please take a detailed message including the caller's name, contact information, and the nature of their [interrupt] business, especially if it seems urgent or time-sensitive. I'll need all this information when I return.\nB: Certainly. What time will you be back? I need to know when I can hand over any urgent messages.\nA: Sorry, I just realized—if there's some urgent business, how can I reach you?\nB: I'll call it again. Just to make sure you have my number saved in your contacts under \"Office Assistant\" with the [interrupt] secondary emergency line also programmed in case we experience any connectivity issues with the main number.\nA: Got it, but you didn't mention what time you'll be back.", + "cleaned_text": "A:I'm now at the airport to meet Mr. Dale, who is arriving at 3:00 PM. There will be some calls for me while I'm away. So please take a detailed message including the caller's name, contact information, and the nature of their business, especially if it seems urgent or time-sensitive. I'll need all this information when I return.\nB: Certainly. What time will you be back? I need to know when I can hand over any urgent messages.\nA: Sorry, I just realized—if there's some urgent business, how can I reach you?\nB:I'll call it again. Just to make sure you have my number saved in your contacts under \"Office Assistant\" with the secondary emergency line also programmed in case we experience any connectivity issues with the main number.\nA: Got it, but you didn't mention what time you'll be back.", + "total_duration": 40.160816326530615, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I'm now at the airport to meet Mr. Dale, who is arriving at 3:00 PM. There will be some calls for me while I'm away. So please take a detailed message including the caller's name, contact information, and the nature of their", + "original_text": "I'm now at the airport to meet Mr. Dale, who is arriving at 3:00 PM. There will be some calls for me while I'm away. So please take a detailed message including the caller's name, contact information, and the nature of their [interrupt] business, especially if it seems urgent or time-sensitive. I'll need all this information when I return.", + "start_time": 0, + "end_time": 19.736961451247165, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "business, especially if it seems urgent or time-sensitive. I'll need all this information when I return." + }, + { + "speaker": "B", + "text": "Certainly. What time will you be back? I need to know when I can hand over any urgent messages.", + "original_text": "Certainly. What time will you be back? I need to know when I can hand over any urgent messages.", + "start_time": 14.849160997732426, + "end_time": 19.586031746031747, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/temp/line_1_B.wav", + "silence_duration": 0.5888789371695089, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sorry, I just realized—if there's some urgent business, how can I reach you?", + "original_text": "Sorry, I just realized—if there's some urgent business, how can I reach you?", + "start_time": 20.240033960047874, + "end_time": 25.534183619911822, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/temp/line_2_A.wav", + "silence_duration": 0.503072508800708, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'll call it again. Just to make sure you have my number saved in your contacts under \"Office Assistant\" with the", + "original_text": "I'll call it again. Just to make sure you have my number saved in your contacts under \"Office Assistant\" with the [interrupt] secondary emergency line also programmed in case we experience any connectivity issues with the main number.", + "start_time": 25.9546332601035, + "end_time": 37.030551627450436, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/temp/line_3_B.wav", + "silence_duration": 0.4204496401916782, + "is_interrupted": true, + "text_after_interrupt": "secondary emergency line also programmed in case we experience any connectivity issues with the main number." + }, + { + "speaker": "A", + "text": "Got it, but you didn't mention what time you'll be back.", + "original_text": "Got it, but you didn't mention what time you'll be back.", + "start_time": 37.362843853542245, + "end_time": 40.16084838868964, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--446/temp/line_4_A.wav", + "silence_duration": 0.41320013313474113, + "is_interrupted": false + } + ] + }, + "DialogSum--val--447": { + "original_text": "A: Adam, I'm sorry.\nB: But, where have you been, Alice? Here over an hour [interrupt] waiting and wondering if something happened to you, checking my phone constantly for any message from you and getting more worried by the minute.\nA: Yes, but I couldn't help it. I was late getting off work and then I missed the bus. The bus I did catch got caught in a traffic jam. It was one thing after another.\nB: But, why did you get off work so late? The office closes at 6, doesn't [interrupt] it? I thought you'd be done by then since we had plans and you knew how important this evening was to me.\nA: Yes, but there's a rash on at the moment and my boss asked me to work on some urgent letters.\nB: Wait, did you tell him you had an appointment?\nA: Well. No, I thought I'd finish in about 5 minutes. If it hadn't been for missing the bus and the traffic, I wouldn't have been so late. I'm sorry!\nB: Well, you're here now, and that's the main thing. Though you were late for the movie, we can have dinner together.", + "cleaned_text": "A: Adam, I'm sorry.\nB:But, where have you been, Alice? Here over an hour waiting and wondering if something happened to you, checking my phone constantly for any message from you and getting more worried by the minute.\nA: Yes, but I couldn't help it. I was late getting off work and then I missed the bus. The bus I did catch got caught in a traffic jam. It was one thing after another.\nB:But, why did you get off work so late? The office closes at 6, doesn't it? I thought you'd be done by then since we had plans and you knew how important this evening was to me.\nA: Yes, but there's a rash on at the moment and my boss asked me to work on some urgent letters.\nB: Wait, did you tell him you had an appointment?\nA: Well. No, I thought I'd finish in about 5 minutes. If it hadn't been for missing the bus and the traffic, I wouldn't have been so late. I'm sorry!\nB: Well, you're here now, and that's the main thing. Though you were late for the movie, we can have dinner together.", + "total_duration": 51.45410430839002, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Adam, I'm sorry.", + "original_text": "Adam, I'm sorry.", + "start_time": 0, + "end_time": 1.6137868480725623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But, where have you been, Alice? Here over an hour", + "original_text": "But, where have you been, Alice? Here over an hour [interrupt] waiting and wondering if something happened to you, checking my phone constantly for any message from you and getting more worried by the minute.", + "start_time": 2.0789347141595615, + "end_time": 11.575896165406727, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_1_B.wav", + "silence_duration": 0.4651478660869992, + "is_interrupted": true, + "text_after_interrupt": "waiting and wondering if something happened to you, checking my phone constantly for any message from you and getting more worried by the minute." + }, + { + "speaker": "A", + "text": "Yes, but I couldn't help it. I was late getting off work and then I missed the bus. The bus I did catch got caught in a traffic jam. It was one thing after another.", + "original_text": "Yes, but I couldn't help it. I was late getting off work and then I missed the bus. The bus I did catch got caught in a traffic jam. It was one thing after another.", + "start_time": 4.958209090576795, + "end_time": 14.954399566767272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_2_A.wav", + "silence_duration": 0.4509725279743735, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "But, why did you get off work so late? The office closes at 6, doesn't", + "original_text": "But, why did you get off work so late? The office closes at 6, doesn't [interrupt] it? I thought you'd be done by then since we had plans and you knew how important this evening was to me.", + "start_time": 15.41508595356444, + "end_time": 25.00492722340571, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_3_B.wav", + "silence_duration": 0.4606863867971678, + "is_interrupted": true, + "text_after_interrupt": "it? I thought you'd be done by then since we had plans and you knew how important this evening was to me." + }, + { + "speaker": "A", + "text": "Yes, but there's a rash on at the moment and my boss asked me to work on some urgent letters.", + "original_text": "Yes, but there's a rash on at the moment and my boss asked me to work on some urgent letters.", + "start_time": 26.585190343921386, + "end_time": 32.99389782691458, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_4_A.wav", + "silence_duration": 0.5433924951431399, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Wait, did you tell him you had an appointment?", + "original_text": "Wait, did you tell him you had an appointment?", + "start_time": 33.55178030852227, + "end_time": 36.047925433238824, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_5_B.wav", + "silence_duration": 0.5578824816076853, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well. No, I thought I'd finish in about 5 minutes. If it hadn't been for missing the bus and the traffic, I wouldn't have been so late. I'm sorry!", + "original_text": "Well. No, I thought I'd finish in about 5 minutes. If it hadn't been for missing the bus and the traffic, I wouldn't have been so late. I'm sorry!", + "start_time": 36.50136012543944, + "end_time": 45.812561939498394, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_6_A.wav", + "silence_duration": 0.45343469220061616, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, you're here now, and that's the main thing. Though you were late for the movie, we can have dinner together.", + "original_text": "Well, you're here now, and that's the main thing. Though you were late for the movie, we can have dinner together.", + "start_time": 46.35735924272533, + "end_time": 51.4541392880768, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--447/temp/line_7_B.wav", + "silence_duration": 0.5447973032269362, + "is_interrupted": false + } + ] + }, + "DialogSum--val--448": { + "original_text": "A: What's up? \nB: It's taking notes in class. Ever since I hurt my hand, my writing's been slower. And if I push too hard, it gets really [interrupt] painful, which makes it hard to keep up with the lecture and sometimes I even miss important points because I have to stop writing altogether. \nA: Oh, that sounds tough. Have you thought about just borrowing someone else's notes and photocopying them? It might help take the stress off your hands while trying to keep up with the lectures. \nB: That seems simple enough, though I'm not too sure about it. Maybe I should just bring a tape recorder to class. I could sit at the front or near the professor so the sound is clear enough to listen to later. \nA: Actually, that's a great idea! You can even borrow my recorder if you want. But, you mentioned your hand gets really painful—have you tried any other ways to manage the pain? \nB: You're really helpful. No, I haven't tried much else yet, but I should look into it. Thanks for the suggestion!", + "cleaned_text": "A: What's up? \nB:It's taking notes in class. Ever since I hurt my hand, my writing's been slower. And if I push too hard, it gets really painful, which makes it hard to keep up with the lecture and sometimes I even miss important points because I have to stop writing altogether.\nA: Oh, that sounds tough. Have you thought about just borrowing someone else's notes and photocopying them? It might help take the stress off your hands while trying to keep up with the lectures. \nB: That seems simple enough, though I'm not too sure about it. Maybe I should just bring a tape recorder to class. I could sit at the front or near the professor so the sound is clear enough to listen to later. \nA: Actually, that's a great idea! You can even borrow my recorder if you want. But, you mentioned your hand gets really painful—have you tried any other ways to manage the pain? \nB: You're really helpful. No, I haven't tried much else yet, but I should look into it. Thanks for the suggestion!", + "total_duration": 46.4233560090703, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What's up?", + "original_text": "What's up?", + "start_time": 0, + "end_time": 0.7546485260770975, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's taking notes in class. Ever since I hurt my hand, my writing's been slower. And if I push too hard, it gets really", + "original_text": "It's taking notes in class. Ever since I hurt my hand, my writing's been slower. And if I push too hard, it gets really [interrupt] painful, which makes it hard to keep up with the lecture and sometimes I even miss important points because I have to stop writing altogether.", + "start_time": 1.1893614255709561, + "end_time": 14.227365960718348, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/temp/line_1_B.wav", + "silence_duration": 0.4347128994938587, + "is_interrupted": true, + "text_after_interrupt": "painful, which makes it hard to keep up with the lecture and sometimes I even miss important points because I have to stop writing altogether." + }, + { + "speaker": "A", + "text": "Oh, that sounds tough. Have you thought about just borrowing someone else's notes and photocopying them? It might help take the stress off your hands while trying to keep up with the lectures.", + "original_text": "Oh, that sounds tough. Have you thought about just borrowing someone else's notes and photocopying them? It might help take the stress off your hands while trying to keep up with the lectures.", + "start_time": 7.783828545752362, + "end_time": 18.232808137589096, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/temp/line_2_A.wav", + "silence_duration": 0.485212235156259, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That seems simple enough, though I'm not too sure about it. Maybe I should just bring a tape recorder to class. I could sit at the front or near the professor so the sound is clear enough to listen to later.", + "original_text": "That seems simple enough, though I'm not too sure about it. Maybe I should just bring a tape recorder to class. I could sit at the front or near the professor so the sound is clear enough to listen to later.", + "start_time": 18.66167561470843, + "end_time": 28.51854636300775, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/temp/line_3_B.wav", + "silence_duration": 0.4288674771193325, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Actually, that's a great idea! You can even borrow my recorder if you want. But, you mentioned your hand gets really painful—have you tried any other ways to manage the pain?", + "original_text": "Actually, that's a great idea! You can even borrow my recorder if you want. But, you mentioned your hand gets really painful—have you tried any other ways to manage the pain?", + "start_time": 29.06459353054016, + "end_time": 39.67611280491658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/temp/line_4_A.wav", + "silence_duration": 0.5460471675324114, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You're really helpful. No, I haven't tried much else yet, but I should look into it. Thanks for the suggestion!", + "original_text": "You're really helpful. No, I haven't tried much else yet, but I should look into it. Thanks for the suggestion!", + "start_time": 40.16559405163081, + "end_time": 46.42337182940859, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--448/temp/line_5_B.wav", + "silence_duration": 0.489481246714237, + "is_interrupted": false + } + ] + }, + "DialogSum--val--450": { + "original_text": "A: Is there any place in the hotel where we can amuse ourselves?\nB: If you want to take a walk, you can go to the garden. It is very relaxing [interrupt] and has beautiful flowers and a calming atmosphere with several scenic spots perfect for meditation or simply enjoying the peaceful surroundings.\nA: The garden sounds nice, but I was actually thinking of something more indoors. Is there anywhere else to go?\nB: No, sir, there is a Recreation Center on the ground floor. You can play table tennis and go [interrupt] for a quick workout if you're interested in staying active, or simply relax in the lounge area with some light refreshments.\nA: I'm not really looking to play sports. I'd prefer a place where I can just unwind.\nB: Yes, sir. There is a music teahouse where you can enjoy both classical music and modern music while having some Chinese tea or other drinks.\nA: Oh, great! That sounds perfect. Thank you very much.\nB: It's a pleasure.", + "cleaned_text": "A: Is there any place in the hotel where we can amuse ourselves?\nB:If you want to take a walk, you can go to the garden. It is very relaxing and has beautiful flowers and a calming atmosphere with several scenic spots perfect for meditation or simply enjoying the peaceful surroundings.\nA: The garden sounds nice, but I was actually thinking of something more indoors. Is there anywhere else to go?\nB:No, sir, there is a Recreation Center on the ground floor. You can play table tennis and go for a quick workout if you're interested in staying active, or simply relax in the lounge area with some light refreshments.\nA: I'm not really looking to play sports. I'd prefer a place where I can just unwind.\nB: Yes, sir. There is a music teahouse where you can enjoy both classical music and modern music while having some Chinese tea or other drinks.\nA: Oh, great! That sounds perfect. Thank you very much.\nB: It's a pleasure.", + "total_duration": 44.80444444444444, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is there any place in the hotel where we can amuse ourselves?", + "original_text": "Is there any place in the hotel where we can amuse ourselves?", + "start_time": 0, + "end_time": 3.1579138321995464, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "If you want to take a walk, you can go to the garden. It is very relaxing", + "original_text": "If you want to take a walk, you can go to the garden. It is very relaxing [interrupt] and has beautiful flowers and a calming atmosphere with several scenic spots perfect for meditation or simply enjoying the peaceful surroundings.", + "start_time": 3.6020038750275942, + "end_time": 14.538602514483376, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_1_B.wav", + "silence_duration": 0.444090042828048, + "is_interrupted": true, + "text_after_interrupt": "and has beautiful flowers and a calming atmosphere with several scenic spots perfect for meditation or simply enjoying the peaceful surroundings." + }, + { + "speaker": "A", + "text": "The garden sounds nice, but I was actually thinking of something more indoors. Is there anywhere else to go?", + "original_text": "The garden sounds nice, but I was actually thinking of something more indoors. Is there anywhere else to go?", + "start_time": 7.340416573440293, + "end_time": 13.911663738973171, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_2_A.wav", + "silence_duration": 0.3633033979394618, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, sir, there is a Recreation Center on the ground floor. You can play table tennis and go", + "original_text": "No, sir, there is a Recreation Center on the ground floor. You can play table tennis and go [interrupt] for a quick workout if you're interested in staying active, or simply relax in the lounge area with some light refreshments.", + "start_time": 15.009972066690134, + "end_time": 26.120720366009863, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_3_B.wav", + "silence_duration": 0.4713695522067579, + "is_interrupted": true, + "text_after_interrupt": "for a quick workout if you're interested in staying active, or simply relax in the lounge area with some light refreshments." + }, + { + "speaker": "A", + "text": "I'm not really looking to play sports. I'd prefer a place where I can just unwind.", + "original_text": "I'm not really looking to play sports. I'd prefer a place where I can just unwind.", + "start_time": 26.602737042748245, + "end_time": 31.954936589233505, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_4_A.wav", + "silence_duration": 0.5708181539885274, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, sir. There is a music teahouse where you can enjoy both classical music and modern music while having some Chinese tea or other drinks.", + "original_text": "Yes, sir. There is a music teahouse where you can enjoy both classical music and modern music while having some Chinese tea or other drinks.", + "start_time": 32.42078843468532, + "end_time": 39.57253446643135, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_5_B.wav", + "silence_duration": 0.46585184545181246, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, great! That sounds perfect. Thank you very much.", + "original_text": "Oh, great! That sounds perfect. Thank you very much.", + "start_time": 39.878905483528364, + "end_time": 43.396728612780066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_6_A.wav", + "silence_duration": 0.3063710170970143, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's a pleasure.", + "original_text": "It's a pleasure.", + "start_time": 43.88728156397515, + "end_time": 44.80446977259193, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--450/temp/line_7_B.wav", + "silence_duration": 0.4905529511950858, + "is_interrupted": false + } + ] + }, + "DialogSum--val--452": { + "original_text": "A: Excuse me. Could you please tell me how to get to the nearest cinema? \nB: Turn left at the second light. You can't [interrupt] miss it because it's a huge modern building with bright neon signs and multiple screens showing current movie trailers. \nA: Sorry to interrupt, but do you know if there's a parking lot nearby? \nB: Yes, there's a parking lot just past the cinema. But as I was saying, you can't miss it once you turn left. \nA: Will it take me long to get there? \nB: No. It's not far at all. \nA: Great, thank you very much. And just to confirm, after turning left, do I need to look out for any specific landmarks? \nB: No specific landmarks, just keep an eye out for a large billboard, the cinema is right next to it. \nA: Got it. Thanks again! \nB: That's all right. Have a good day.", + "cleaned_text": "A: Excuse me. Could you please tell me how to get to the nearest cinema? \nB:Turn left at the second light. You can't miss it because it's a huge modern building with bright neon signs and multiple screens showing current movie trailers.\nA: Sorry to interrupt, but do you know if there's a parking lot nearby? \nB: Yes, there's a parking lot just past the cinema. But as I was saying, you can't miss it once you turn left. \nA: Will it take me long to get there? \nB: No. It's not far at all. \nA: Great, thank you very much. And just to confirm, after turning left, do I need to look out for any specific landmarks? \nB: No specific landmarks, just keep an eye out for a large billboard, the cinema is right next to it. \nA: Got it. Thanks again! \nB: That's all right. Have a good day.", + "total_duration": 40.72430839002268, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. Could you please tell me how to get to the nearest cinema?", + "original_text": "Excuse me. Could you please tell me how to get to the nearest cinema?", + "start_time": 0, + "end_time": 3.517823129251701, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Turn left at the second light. You can't", + "original_text": "Turn left at the second light. You can't [interrupt] miss it because it's a huge modern building with bright neon signs and multiple screens showing current movie trailers.", + "start_time": 3.9555915278635103, + "end_time": 12.430874974575527, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_1_B.wav", + "silence_duration": 0.4377683986118095, + "is_interrupted": true, + "text_after_interrupt": "miss it because it's a huge modern building with bright neon signs and multiple screens showing current movie trailers." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but do you know if there's a parking lot nearby?", + "original_text": "Sorry to interrupt, but do you know if there's a parking lot nearby?", + "start_time": 6.47495660722859, + "end_time": 11.165387446230858, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_2_A.wav", + "silence_duration": 0.38022042737892203, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, there's a parking lot just past the cinema. But as I was saying, you can't miss it once you turn left.", + "original_text": "Yes, there's a parking lot just past the cinema. But as I was saying, you can't miss it once you turn left.", + "start_time": 12.988082611762543, + "end_time": 19.222640434891794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_3_B.wav", + "silence_duration": 0.5572076371870165, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Will it take me long to get there?", + "original_text": "Will it take me long to get there?", + "start_time": 19.60039933068205, + "end_time": 21.2490161107274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_4_A.wav", + "silence_duration": 0.37775889579025346, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No. It's not far at all.", + "original_text": "No. It's not far at all.", + "start_time": 21.789190974425882, + "end_time": 23.298488026580078, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_5_B.wav", + "silence_duration": 0.5401748636984824, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Great, thank you very much. And just to confirm, after turning left, do I need to look out for any specific landmarks?", + "original_text": "Great, thank you very much. And just to confirm, after turning left, do I need to look out for any specific landmarks?", + "start_time": 23.89471228255158, + "end_time": 31.68500706713208, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_6_A.wav", + "silence_duration": 0.5962242559715036, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No specific landmarks, just keep an eye out for a large billboard, the cinema is right next to it.", + "original_text": "No specific landmarks, just keep an eye out for a large billboard, the cinema is right next to it.", + "start_time": 32.20304761630406, + "end_time": 37.253387752358485, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_7_B.wav", + "silence_duration": 0.5180405491719807, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. Thanks again!", + "original_text": "Got it. Thanks again!", + "start_time": 37.58786785664363, + "end_time": 38.81852545301552, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_8_A.wav", + "silence_duration": 0.3344801042851504, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's all right. Have a good day.", + "original_text": "That's all right. Have a good day.", + "start_time": 39.19181832932355, + "end_time": 40.72433533612627, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--452/temp/line_9_B.wav", + "silence_duration": 0.37329287630803376, + "is_interrupted": false + } + ] + }, + "DialogSum--val--453": { + "original_text": "A: Merry Christmas, Bill. \nB: Merry Christmas, Jina. \nA: What are you doing there on the computer? \nB: Come have a look, I received many beautiful e-cards. They are from my friends, all over the world. Christmas wishes for all my friends. \nA: That's pretty interesting. Did you get one from Haven? The reason I ask is that I am looking for her [interrupt] to discuss something important about our upcoming project deadline, and I haven't been able to reach her for the past couple of days which is quite concerning. \nB: Oh, Haven! I actually don't have her number, but I do have her Email. You want me to send it to you? \nA: Yeah, that would be great. Thanks. By the way, I was going to ask if you got a card from her too? \nB: No worries. I just found her card. And you can get in touch with her via Email. I would really like to talk to her again. I kind of miss her a little these days. \nA: Thanks a million. \nB: My pleasure.", + "cleaned_text": "A: Merry Christmas, Bill. \nB: Merry Christmas, Jina. \nA: What are you doing there on the computer? \nB: Come have a look, I received many beautiful e-cards. They are from my friends, all over the world. Christmas wishes for all my friends. \nA:That's pretty interesting. Did you get one from Haven? The reason I ask is that I am looking for her to discuss something important about our upcoming project deadline, and I haven't been able to reach her for the past couple of days which is quite concerning.\nB: Oh, Haven! I actually don't have her number, but I do have her Email. You want me to send it to you? \nA: Yeah, that would be great. Thanks. By the way, I was going to ask if you got a card from her too? \nB: No worries. I just found her card. And you can get in touch with her via Email. I would really like to talk to her again. I kind of miss her a little these days. \nA: Thanks a million. \nB: My pleasure.", + "total_duration": 47.817913832199544, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Merry Christmas, Bill.", + "original_text": "Merry Christmas, Bill.", + "start_time": 0, + "end_time": 1.5789569160997732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Merry Christmas, Jina.", + "original_text": "Merry Christmas, Jina.", + "start_time": 2.0980481734413683, + "end_time": 3.711835021513931, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_1_B.wav", + "silence_duration": 0.5190912573415952, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What are you doing there on the computer?", + "original_text": "What are you doing there on the computer?", + "start_time": 4.053012190374277, + "end_time": 5.864168652959311, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_2_A.wav", + "silence_duration": 0.3411771688603463, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Come have a look, I received many beautiful e-cards. They are from my friends, all over the world. Christmas wishes for all my friends.", + "original_text": "Come have a look, I received many beautiful e-cards. They are from my friends, all over the world. Christmas wishes for all my friends.", + "start_time": 6.273294726163315, + "end_time": 12.925811732966036, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_3_B.wav", + "silence_duration": 0.40912607320400457, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's pretty interesting. Did you get one from Haven? The reason I ask is that I am looking for her", + "original_text": "That's pretty interesting. Did you get one from Haven? The reason I ask is that I am looking for her [interrupt] to discuss something important about our upcoming project deadline, and I haven't been able to reach her for the past couple of days which is quite concerning.", + "start_time": 13.477696520660068, + "end_time": 28.837696520660067, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_4_A.wav", + "silence_duration": 0.5518847876940316, + "is_interrupted": true, + "text_after_interrupt": "to discuss something important about our upcoming project deadline, and I haven't been able to reach her for the past couple of days which is quite concerning." + }, + { + "speaker": "B", + "text": "Oh, Haven! I actually don't have her number, but I do have her Email. You want me to send it to you?", + "original_text": "Oh, Haven! I actually don't have her number, but I do have her Email. You want me to send it to you?", + "start_time": 19.213025318846007, + "end_time": 24.30980536419748, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_5_B.wav", + "silence_duration": 0.5584604113989405, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yeah, that would be great. Thanks. By the way, I was going to ask if you got a card from her too?", + "original_text": "Yeah, that would be great. Thanks. By the way, I was going to ask if you got a card from her too?", + "start_time": 29.209673064329113, + "end_time": 35.804140184510516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_6_A.wav", + "silence_duration": 0.37197654366904515, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No worries. I just found her card. And you can get in touch with her via Email. I would really like to talk to her again. I kind of miss her a little these days.", + "original_text": "No worries. I just found her card. And you can get in touch with her via Email. I would really like to talk to her again. I kind of miss her a little these days.", + "start_time": 36.32821184330485, + "end_time": 45.04730481382639, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_7_B.wav", + "silence_duration": 0.5240716587943335, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thanks a million.", + "original_text": "Thanks a million.", + "start_time": 45.580815501910514, + "end_time": 46.55605359714861, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_8_A.wav", + "silence_duration": 0.5335106880841234, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "My pleasure.", + "original_text": "My pleasure.", + "start_time": 46.982012650924716, + "end_time": 47.81793101827166, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--453/temp/line_9_B.wav", + "silence_duration": 0.4259590537761062, + "is_interrupted": false + } + ] + }, + "DialogSum--val--454": { + "original_text": "A: Do you remember what the ratings of movies stand for? \nB: Yes, G stands for General Audiences, PG means Parental Guidance suggested, R is restricted to audiences under 18 and X means explicit [interrupt] content that is only for adults and often includes graphic violence, strong language, or sexual scenes that aren't suitable for younger viewers. \nA: Sorry to jump in, but do you think people even pay attention to those ratings anymore? \nB: That's a good point. It feels like the significance has diminished. Remember when we were kids? Theaters wouldn't let kids in to PG movies without a parent. \nA: I do remember, and I also recall that I never saw an X movie even [interrupt] though some of my friends would talk about sneaking into them, claiming they were more mature and edgy than the films we were allowed to watch at that age. \nB: Displayed, right? Yeah, those were kept out of sight. But now, with video rentals and streaming, it's all a personal matter. \nA: Exactly. And speaking of theaters, I never see them turning people away for their age anymore either. \nB: True, and that puts the responsibility on us to decide what we will see and what we won't.", + "cleaned_text": "A: Do you remember what the ratings of movies stand for? \nB:Yes, G stands for General Audiences, PG means Parental Guidance suggested, R is restricted to audiences under 18 and X means explicit content that is only for adults and often includes graphic violence, strong language, or sexual scenes that aren't suitable for younger viewers.\nA: Sorry to jump in, but do you think people even pay attention to those ratings anymore? \nB: That's a good point. It feels like the significance has diminished. Remember when we were kids? Theaters wouldn't let kids in to PG movies without a parent. \nA:I do remember, and I also recall that I never saw an X movie even though some of my friends would talk about sneaking into them, claiming they were more mature and edgy than the films we were allowed to watch at that age.\nB: Displayed, right? Yeah, those were kept out of sight. But now, with video rentals and streaming, it's all a personal matter. \nA: Exactly. And speaking of theaters, I never see them turning people away for their age anymore either. \nB: True, and that puts the responsibility on us to decide what we will see and what we won't.", + "total_duration": 58.906938775510206, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Do you remember what the ratings of movies stand for?", + "original_text": "Do you remember what the ratings of movies stand for?", + "start_time": 0, + "end_time": 2.7980045351473923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, G stands for General Audiences, PG means Parental Guidance suggested, R is restricted to audiences under 18 and X means explicit", + "original_text": "Yes, G stands for General Audiences, PG means Parental Guidance suggested, R is restricted to audiences under 18 and X means explicit [interrupt] content that is only for adults and often includes graphic violence, strong language, or sexual scenes that aren't suitable for younger viewers.", + "start_time": 3.321108155655914, + "end_time": 20.619974368807842, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_1_B.wav", + "silence_duration": 0.5231036205085219, + "is_interrupted": true, + "text_after_interrupt": "content that is only for adults and often includes graphic violence, strong language, or sexual scenes that aren't suitable for younger viewers." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but do you think people even pay attention to those ratings anymore?", + "original_text": "Sorry to jump in, but do you think people even pay attention to those ratings anymore?", + "start_time": 12.818069606903078, + "end_time": 17.914849652254553, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_2_A.wav", + "silence_duration": 0.5324443536072376, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a good point. It feels like the significance has diminished. Remember when we were kids? Theaters wouldn't let kids in to PG movies without a parent.", + "original_text": "That's a good point. It feels like the significance has diminished. Remember when we were kids? Theaters wouldn't let kids in to PG movies without a parent.", + "start_time": 21.029816570287725, + "end_time": 28.947821105435118, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_3_B.wav", + "silence_duration": 0.4098422014798827, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I do remember, and I also recall that I never saw an X movie even", + "original_text": "I do remember, and I also recall that I never saw an X movie even [interrupt] though some of my friends would talk about sneaking into them, claiming they were more mature and edgy than the films we were allowed to watch at that age.", + "start_time": 29.422396249492085, + "end_time": 42.576500557882106, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_4_A.wav", + "silence_duration": 0.47457514405696677, + "is_interrupted": true, + "text_after_interrupt": "though some of my friends would talk about sneaking into them, claiming they were more mature and edgy than the films we were allowed to watch at that age." + }, + { + "speaker": "B", + "text": "Displayed, right? Yeah, those were kept out of sight. But now, with video rentals and streaming, it's all a personal matter.", + "original_text": "Displayed, right? Yeah, those were kept out of sight. But now, with video rentals and streaming, it's all a personal matter.", + "start_time": 39.83641619688559, + "end_time": 46.709522772849304, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_5_B.wav", + "silence_duration": 0.5422287645271964, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Exactly. And speaking of theaters, I never see them turning people away for their age anymore either.", + "original_text": "Exactly. And speaking of theaters, I never see them turning people away for their age anymore either.", + "start_time": 47.0596608119761, + "end_time": 53.21294879383551, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_6_A.wav", + "silence_duration": 0.35013803912679403, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "True, and that puts the responsibility on us to decide what we will see and what we won't.", + "original_text": "True, and that puts the responsibility on us to decide what we will see and what we won't.", + "start_time": 53.612815204953506, + "end_time": 58.90696486481745, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--454/temp/line_7_B.wav", + "silence_duration": 0.3998664111179967, + "is_interrupted": false + } + ] + }, + "DialogSum--val--455": { + "original_text": "A: Good afternoon. Is there a vacant room here? \nB: What do you want, a single or a double one? \nA: A single, preferably with a [interrupt] good view, if possible, preferably facing the garden or the city skyline since I enjoy watching sunsets and urban landscapes during my stay. \nB: Sorry to interrupt, but do you have any preferences for the floor? We have rooms available on different floors. \nA: I don't mind the floor, but I do prefer a quiet room. I hate noise. \nB: It's very quiet, sir. We have one single room on the fifth floor. \nA: How much does it cost per day? \nB: It's 150 yuan per day including a 10% service charge. \nA: All right. I'll take the room. Oh, by the way, does it have a bath? \nB: Yes, it does. Would you please fill in the registration form?", + "cleaned_text": "A: Good afternoon. Is there a vacant room here? \nB: What do you want, a single or a double one? \nA:A single, preferably with a good view, if possible, preferably facing the garden or the city skyline since I enjoy watching sunsets and urban landscapes during my stay.\nB: Sorry to interrupt, but do you have any preferences for the floor? We have rooms available on different floors. \nA: I don't mind the floor, but I do prefer a quiet room. I hate noise. \nB: It's very quiet, sir. We have one single room on the fifth floor. \nA: How much does it cost per day? \nB: It's 150 yuan per day including a 10% service charge. \nA: All right. I'll take the room. Oh, by the way, does it have a bath? \nB: Yes, it does. Would you please fill in the registration form?", + "total_duration": 42.393197278911565, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good afternoon. Is there a vacant room here?", + "original_text": "Good afternoon. Is there a vacant room here?", + "start_time": 0, + "end_time": 2.7980045351473923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What do you want, a single or a double one?", + "original_text": "What do you want, a single or a double one?", + "start_time": 3.3227908757600737, + "end_time": 5.633176363288419, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_1_B.wav", + "silence_duration": 0.5247863406126816, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "A single, preferably with a", + "original_text": "A single, preferably with a [interrupt] good view, if possible, preferably facing the garden or the city skyline since I enjoy watching sunsets and urban landscapes during my stay.", + "start_time": 5.963006452892964, + "end_time": 17.155024593482533, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_2_A.wav", + "silence_duration": 0.3298300896045457, + "is_interrupted": true, + "text_after_interrupt": "good view, if possible, preferably facing the garden or the city skyline since I enjoy watching sunsets and urban landscapes during my stay." + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but do you have any preferences for the floor? We have rooms available on different floors.", + "original_text": "Sorry to interrupt, but do you have any preferences for the floor? We have rooms available on different floors.", + "start_time": 7.994752484638996, + "end_time": 14.554389672847613, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_3_B.wav", + "silence_duration": 0.41048240885859755, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I don't mind the floor, but I do prefer a quiet room. I hate noise.", + "original_text": "I don't mind the floor, but I do prefer a quiet room. I hate noise.", + "start_time": 17.695433673296343, + "end_time": 22.54840419483829, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_4_A.wav", + "silence_duration": 0.5404090798138081, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's very quiet, sir. We have one single room on the fifth floor.", + "original_text": "It's very quiet, sir. We have one single room on the fifth floor.", + "start_time": 22.98382120203395, + "end_time": 26.397154535367285, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_5_B.wav", + "silence_duration": 0.43541700719565923, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How much does it cost per day?", + "original_text": "How much does it cost per day?", + "start_time": 26.825071660860857, + "end_time": 29.05418730711936, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_6_A.wav", + "silence_duration": 0.42791712549357114, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's 150 yuan per day including a 10% service charge.", + "original_text": "It's 150 yuan per day including a 10% service charge.", + "start_time": 29.36144656219564, + "end_time": 34.10992728781922, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_7_B.wav", + "silence_duration": 0.3072592550762788, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "All right. I'll take the room. Oh, by the way, does it have a bath?", + "original_text": "All right. I'll take the room. Oh, by the way, does it have a bath?", + "start_time": 34.61934164115296, + "end_time": 39.15884277493981, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_8_A.wav", + "silence_duration": 0.509414353333739, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it does. Would you please fill in the registration form?", + "original_text": "Yes, it does. Would you please fill in the registration form?", + "start_time": 39.502331254552836, + "end_time": 42.393215608294334, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--455/temp/line_9_B.wav", + "silence_duration": 0.3434884796130281, + "is_interrupted": false + } + ] + }, + "DialogSum--val--456": { + "original_text": "A: What seems to be the problem? \nB: Oh, my God! It's my stomach. It's [interrupt] been hurting since I woke up this morning and the pain has been getting progressively worse throughout the day, making it difficult to even stand up straight. \nA: Where exactly does it hurt? \nB: Right here! It hurts right here! \nA: How long has it felt like this? \nB: I felt OK when I woke up, and then, suddenly, I had this really sharp pain. \nA: Do you have a history of stomach pain? \nB: No, and I haven't done anything out of the ordinary. \nA: Well, I think that we are going to have to get you to an emergency room right [interrupt] away to make sure it's nothing serious like appendicitis or a gastrointestinal issue that might require immediate medical attention. \nB: Wait, before we go, is there anything I should avoid doing or eating right now? \nA: Just try to stay calm and avoid eating or drinking anything until we get there. But as I was saying, we should head to the emergency room right away. \nB: Thank you for helping me.", + "cleaned_text": "A: What seems to be the problem? \nB:Oh, my God! It's my stomach. It's been hurting since I woke up this morning and the pain has been getting progressively worse throughout the day, making it difficult to even stand up straight.\nA: Where exactly does it hurt? \nB: Right here! It hurts right here! \nA: How long has it felt like this? \nB: I felt OK when I woke up, and then, suddenly, I had this really sharp pain. \nA: Do you have a history of stomach pain? \nB: No, and I haven't done anything out of the ordinary. \nA:Well, I think that we are going to have to get you to an emergency room right away to make sure it's nothing serious like appendicitis or a gastrointestinal issue that might require immediate medical attention.\nB: Wait, before we go, is there anything I should avoid doing or eating right now? \nA: Just try to stay calm and avoid eating or drinking anything until we get there. But as I was saying, we should head to the emergency room right away. \nB: Thank you for helping me.", + "total_duration": 49.14408163265306, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What seems to be the problem?", + "original_text": "What seems to be the problem?", + "start_time": 0, + "end_time": 1.6137868480725623, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, my God! It's my stomach. It's", + "original_text": "Oh, my God! It's my stomach. It's [interrupt] been hurting since I woke up this morning and the pain has been getting progressively worse throughout the day, making it difficult to even stand up straight.", + "start_time": 1.9672534457669153, + "end_time": 11.545484738283921, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_1_B.wav", + "silence_duration": 0.35346659769435307, + "is_interrupted": true, + "text_after_interrupt": "been hurting since I woke up this morning and the pain has been getting progressively worse throughout the day, making it difficult to even stand up straight." + }, + { + "speaker": "A", + "text": "Where exactly does it hurt?", + "original_text": "Where exactly does it hurt?", + "start_time": 3.8248498176490013, + "end_time": 5.519906506991405, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_2_A.wav", + "silence_duration": 0.571848198712233, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right here! It hurts right here!", + "original_text": "Right here! It hurts right here!", + "start_time": 11.987693289795361, + "end_time": 13.798849752380395, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_3_B.wav", + "silence_duration": 0.44220855151143934, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How long has it felt like this?", + "original_text": "How long has it felt like this?", + "start_time": 14.173535823802672, + "end_time": 16.03113219568476, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_4_A.wav", + "silence_duration": 0.37468607142227695, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I felt OK when I woke up, and then, suddenly, I had this really sharp pain.", + "original_text": "I felt OK when I woke up, and then, suddenly, I had this really sharp pain.", + "start_time": 16.35676740932567, + "end_time": 20.71050890592431, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_5_B.wav", + "silence_duration": 0.32563521364091086, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you have a history of stomach pain?", + "original_text": "Do you have a history of stomach pain?", + "start_time": 21.015850839402297, + "end_time": 22.989546984527014, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_6_A.wav", + "silence_duration": 0.305341933477987, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, and I haven't done anything out of the ordinary.", + "original_text": "No, and I haven't done anything out of the ordinary.", + "start_time": 23.529829646258168, + "end_time": 26.14207454421735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_7_B.wav", + "silence_duration": 0.5402826617311562, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, I think that we are going to have to get you to an emergency room right", + "original_text": "Well, I think that we are going to have to get you to an emergency room right [interrupt] away to make sure it's nothing serious like appendicitis or a gastrointestinal issue that might require immediate medical attention.", + "start_time": 26.639390865343785, + "end_time": 38.74859721455013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_8_A.wav", + "silence_duration": 0.49731632112643265, + "is_interrupted": true, + "text_after_interrupt": "away to make sure it's nothing serious like appendicitis or a gastrointestinal issue that might require immediate medical attention." + }, + { + "speaker": "B", + "text": "Wait, before we go, is there anything I should avoid doing or eating right now?", + "original_text": "Wait, before we go, is there anything I should avoid doing or eating right now?", + "start_time": 32.70653553932688, + "end_time": 36.58426796563074, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_9_B.wav", + "silence_duration": 0.5429358271961587, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Just try to stay calm and avoid eating or drinking anything until we get there. But as I was saying, we should head to the emergency room right away.", + "original_text": "Just try to stay calm and avoid eating or drinking anything until we get there. But as I was saying, we should head to the emergency room right away.", + "start_time": 39.05336154418652, + "end_time": 47.55186494554707, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_10_A.wav", + "silence_duration": 0.3047643296363917, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you for helping me.", + "original_text": "Thank you for helping me.", + "start_time": 47.97151183287462, + "end_time": 49.144119542625184, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--456/temp/line_11_B.wav", + "silence_duration": 0.4196468873275491, + "is_interrupted": false + } + ] + }, + "DialogSum--val--457": { + "original_text": "A: Wow, Is winter always this cold in Taiwan? \nB: Not really. It's much warmer usually. You're not used to cold [interrupt] weather, are you? I can tell by how you're shivering right now and the way you keep rubbing your hands together for warmth. \nA: Actually, no, I am from South California. This is my first real winter. How do people usually deal with this cold here? \nB: Well, you'd better get some more warm clothes. It's also common to use space heaters, and layering up really helps. By the way, what's the temperature today? \nA: I would say it's about 5 degrees Celsius. But speaking of staying warm, do you know where I can buy some good quality winter clothes around here?", + "cleaned_text": "A: Wow, Is winter always this cold in Taiwan? \nB:Not really. It's much warmer usually. You're not used to cold weather, are you? I can tell by how you're shivering right now and the way you keep rubbing your hands together for warmth.\nA: Actually, no, I am from South California. This is my first real winter. How do people usually deal with this cold here? \nB: Well, you'd better get some more warm clothes. It's also common to use space heaters, and layering up really helps. By the way, what's the temperature today? \nA: I would say it's about 5 degrees Celsius. But speaking of staying warm, do you know where I can buy some good quality winter clothes around here?", + "total_duration": 31.959002267573695, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Wow, Is winter always this cold in Taiwan?", + "original_text": "Wow, Is winter always this cold in Taiwan?", + "start_time": 0, + "end_time": 3.01859410430839, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Not really. It's much warmer usually. You're not used to cold", + "original_text": "Not really. It's much warmer usually. You're not used to cold [interrupt] weather, are you? I can tell by how you're shivering right now and the way you keep rubbing your hands together for warmth.", + "start_time": 3.3670522587007206, + "end_time": 12.515714390219994, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/temp/line_1_B.wav", + "silence_duration": 0.3484581543923306, + "is_interrupted": true, + "text_after_interrupt": "weather, are you? I can tell by how you're shivering right now and the way you keep rubbing your hands together for warmth." + }, + { + "speaker": "A", + "text": "Actually, no, I am from South California. This is my first real winter. How do people usually deal with this cold here?", + "original_text": "Actually, no, I am from South California. This is my first real winter. How do people usually deal with this cold here?", + "start_time": 7.244784685004575, + "end_time": 14.942199650990968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/temp/line_2_A.wav", + "silence_duration": 0.34857127176156855, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, you'd better get some more warm clothes. It's also common to use space heaters, and layering up really helps. By the way, what's the temperature today?", + "original_text": "Well, you'd better get some more warm clothes. It's also common to use space heaters, and layering up really helps. By the way, what's the temperature today?", + "start_time": 15.46017105042393, + "end_time": 23.52910529078674, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/temp/line_3_B.wav", + "silence_duration": 0.5179713994329623, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I would say it's about 5 degrees Celsius. But speaking of staying warm, do you know where I can buy some good quality winter clothes around here?", + "original_text": "I would say it's about 5 degrees Celsius. But speaking of staying warm, do you know where I can buy some good quality winter clothes around here?", + "start_time": 23.866867861278042, + "end_time": 31.959022056289378, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--457/temp/line_4_A.wav", + "silence_duration": 0.33776257049129865, + "is_interrupted": false + } + ] + }, + "DialogSum--val--458": { + "original_text": "A: Are you ready to order, sir? \nB: Yes. Can you show me the menu, please? \nA: Of course. Here you [interrupt] go, let me get that for you. We have a special seasonal menu tonight featuring locally sourced ingredients and some chef's specials that have been getting excellent reviews from our customers. \nB: Actually, before I look at the menu, do you have any recommendations for tonight? \nA: Our seafood is fresh. I recommend shrimp with garlic. \nB: That sounds great. We'll have some seafood and vegetables. Oh, by the way, could you show me the menu as well? I might want to add something else. \nA: Certainly, here you are.", + "cleaned_text": "A: Are you ready to order, sir? \nB: Yes. Can you show me the menu, please? \nA:Of course. Here you go, let me get that for you. We have a special seasonal menu tonight featuring locally sourced ingredients and some chef's specials that have been getting excellent reviews from our customers.\nB: Actually, before I look at the menu, do you have any recommendations for tonight? \nA: Our seafood is fresh. I recommend shrimp with garlic. \nB: That sounds great. We'll have some seafood and vegetables. Oh, by the way, could you show me the menu as well? I might want to add something else. \nA: Certainly, here you are.", + "total_duration": 30.27886621315193, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you ready to order, sir?", + "original_text": "Are you ready to order, sir?", + "start_time": 0, + "end_time": 1.555736961451247, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. Can you show me the menu, please?", + "original_text": "Yes. Can you show me the menu, please?", + "start_time": 1.9812554201851706, + "end_time": 4.2335910210922005, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/temp/line_1_B.wav", + "silence_duration": 0.4255184587339236, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Of course. Here you", + "original_text": "Of course. Here you [interrupt] go, let me get that for you. We have a special seasonal menu tonight featuring locally sourced ingredients and some chef's specials that have been getting excellent reviews from our customers.", + "start_time": 4.640152282981537, + "end_time": 16.61003890429673, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/temp/line_2_A.wav", + "silence_duration": 0.40656126188933667, + "is_interrupted": true, + "text_after_interrupt": "go, let me get that for you. We have a special seasonal menu tonight featuring locally sourced ingredients and some chef's specials that have been getting excellent reviews from our customers." + }, + { + "speaker": "B", + "text": "Actually, before I look at the menu, do you have any recommendations for tonight?", + "original_text": "Actually, before I look at the menu, do you have any recommendations for tonight?", + "start_time": 6.311989017675415, + "end_time": 10.549630741031425, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/temp/line_3_B.wav", + "silence_duration": 0.3880673832892484, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Our seafood is fresh. I recommend shrimp with garlic.", + "original_text": "Our seafood is fresh. I recommend shrimp with garlic.", + "start_time": 16.99129013936456, + "end_time": 20.648432996507417, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/temp/line_4_A.wav", + "silence_duration": 0.3812512350678278, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds great. We'll have some seafood and vegetables. Oh, by the way, could you show me the menu as well? I might want to add something else.", + "original_text": "That sounds great. We'll have some seafood and vegetables. Oh, by the way, could you show me the menu as well? I might want to add something else.", + "start_time": 21.090991789623352, + "end_time": 28.602647118421537, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/temp/line_5_B.wav", + "silence_duration": 0.4425587931159338, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Certainly, here you are.", + "original_text": "Certainly, here you are.", + "start_time": 28.94373458658939, + "end_time": 30.27888197887964, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--458/temp/line_6_A.wav", + "silence_duration": 0.34108746816785307, + "is_interrupted": false + } + ] + }, + "DialogSum--val--461": { + "original_text": "A: Don't have some relation with him. You know, he is not a kind [interrupt] person, and he tends to hold grudges for even the smallest perceived slights while maintaining an outwardly calm demeanor that makes it hard to anticipate his reactions.\nB: Sorry to jump in, but do you think his behavior could actually affect our work environment?\nA: Absolutely, it could create a lot of tension. I was going to say that sometimes I just cannot accept his behavior. If you attack him, be sure you'll get a Roland for an Oliver.\nB: That sounds concerning. But what do you mean by \"Roland for an Oliver\"? Could you explain that a bit more?\nA: Sure, it means if you confront him, he'll retaliate equally or even more aggressively. That's why it's better to be far away from him.", + "cleaned_text": "A:Don't have some relation with him. You know, he is not a kind person, and he tends to hold grudges for even the smallest perceived slights while maintaining an outwardly calm demeanor that makes it hard to anticipate his reactions.\nB: Sorry to jump in, but do you think his behavior could actually affect our work environment?\nA: Absolutely, it could create a lot of tension. I was going to say that sometimes I just cannot accept his behavior. If you attack him, be sure you'll get a Roland for an Oliver.\nB: That sounds concerning. But what do you mean by \"Roland for an Oliver\"? Could you explain that a bit more?\nA: Sure, it means if you confront him, he'll retaliate equally or even more aggressively. That's why it's better to be far away from him.", + "total_duration": 38.71179138321995, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Don't have some relation with him. You know, he is not a kind", + "original_text": "Don't have some relation with him. You know, he is not a kind [interrupt] person, and he tends to hold grudges for even the smallest perceived slights while maintaining an outwardly calm demeanor that makes it hard to anticipate his reactions.", + "start_time": 0, + "end_time": 13.79265306122449, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "person, and he tends to hold grudges for even the smallest perceived slights while maintaining an outwardly calm demeanor that makes it hard to anticipate his reactions." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but do you think his behavior could actually affect our work environment?", + "original_text": "Sorry to jump in, but do you think his behavior could actually affect our work environment?", + "start_time": 3.6919727891156464, + "end_time": 7.883174603174603, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/temp/line_1_B.wav", + "silence_duration": 0.5180867676227211, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely, it could create a lot of tension. I was going to say that sometimes I just cannot accept his behavior. If you attack him, be sure you'll get a Roland for an Oliver.", + "original_text": "Absolutely, it could create a lot of tension. I was going to say that sometimes I just cannot accept his behavior. If you attack him, be sure you'll get a Roland for an Oliver.", + "start_time": 14.278723009749843, + "end_time": 24.994732080044628, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/temp/line_2_A.wav", + "silence_duration": 0.48606994852535357, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds concerning. But what do you mean by \"Roland for an Oliver\"? Could you explain that a bit more?", + "original_text": "That sounds concerning. But what do you mean by \"Roland for an Oliver\"? Could you explain that a bit more?", + "start_time": 25.316309488755778, + "end_time": 30.35503964748594, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/temp/line_3_B.wav", + "silence_duration": 0.32157740871114837, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure, it means if you confront him, he'll retaliate equally or even more aggressively. That's why it's better to be far away from him.", + "original_text": "Sure, it means if you confront him, he'll retaliate equally or even more aggressively. That's why it's better to be far away from him.", + "start_time": 30.78221483244659, + "end_time": 38.71182934491824, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--461/temp/line_4_A.wav", + "silence_duration": 0.4271751849606545, + "is_interrupted": false + } + ] + }, + "DialogSum--val--462": { + "original_text": "A: Thank you so much. I can't take this.\nB: She will insist. It's a rosary. She has millions of them. Take it.\nA: What did she mean just now about raising pigs?\nB: Oh! My grandmother used to say 'raising the pigs, raising the kids'... at least you can [interrupt] get some bacon out of it when times get tough, unlike children who just keep demanding more attention and resources without any immediate payoff.\nA: Oh wait, does that mean she thinks raising kids is as tough as raising pigs?\nB: Exactly! She's just being sarcastic. It's her way of poking fun at the challenges of motherhood. But I was saying, at least you can eat the pigs.\nA: Haha. I get it. That's funny. Your cousin's a real sarcastic lady.\nB: She likes to complain about her macho husband and her 'bambinos', but she loves them all dearly.", + "cleaned_text": "A: Thank you so much. I can't take this.\nB: She will insist. It's a rosary. She has millions of them. Take it.\nA: What did she mean just now about raising pigs?\nB:Oh! My grandmother used to say 'raising the pigs, raising the kids'... at least you can get some bacon out of it when times get tough, unlike children who just keep demanding more attention and resources without any immediate payoff.\nA: Oh wait, does that mean she thinks raising kids is as tough as raising pigs?\nB: Exactly! She's just being sarcastic. It's her way of poking fun at the challenges of motherhood. But I was saying, at least you can eat the pigs.\nA: Haha. I get it. That's funny. Your cousin's a real sarcastic lady.\nB: She likes to complain about her macho husband and her 'bambinos', but she loves them all dearly.", + "total_duration": 41.90920634920635, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Thank you so much. I can't take this.", + "original_text": "Thank you so much. I can't take this.", + "start_time": 0, + "end_time": 3.5294331065759637, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "She will insist. It's a rosary. She has millions of them. Take it.", + "original_text": "She will insist. It's a rosary. She has millions of them. Take it.", + "start_time": 3.9239460241538167, + "end_time": 7.662358722566515, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_1_B.wav", + "silence_duration": 0.39451291757785306, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What did she mean just now about raising pigs?", + "original_text": "What did she mean just now about raising pigs?", + "start_time": 8.05001265313125, + "end_time": 10.88284712025143, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_2_A.wav", + "silence_duration": 0.38765393056473385, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh! My grandmother used to say 'raising the pigs, raising the kids'... at least you can", + "original_text": "Oh! My grandmother used to say 'raising the pigs, raising the kids'... at least you can [interrupt] get some bacon out of it when times get tough, unlike children who just keep demanding more attention and resources without any immediate payoff.", + "start_time": 11.310902029162332, + "end_time": 23.22273876385621, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_3_B.wav", + "silence_duration": 0.42805490891090087, + "is_interrupted": true, + "text_after_interrupt": "get some bacon out of it when times get tough, unlike children who just keep demanding more attention and resources without any immediate payoff." + }, + { + "speaker": "A", + "text": "Oh wait, does that mean she thinks raising kids is as tough as raising pigs?", + "original_text": "Oh wait, does that mean she thinks raising kids is as tough as raising pigs?", + "start_time": 16.46573196113512, + "end_time": 21.516072097189543, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_4_A.wav", + "silence_duration": 0.46207529185163765, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Exactly! She's just being sarcastic. It's her way of poking fun at the challenges of motherhood. But I was saying, at least you can eat the pigs.", + "original_text": "Exactly! She's just being sarcastic. It's her way of poking fun at the challenges of motherhood. But I was saying, at least you can eat the pigs.", + "start_time": 23.57146900648448, + "end_time": 31.24566401782235, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_5_B.wav", + "silence_duration": 0.34873024262827024, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Haha. I get it. That's funny. Your cousin's a real sarcastic lady.", + "original_text": "Haha. I get it. That's funny. Your cousin's a real sarcastic lady.", + "start_time": 31.618412222256467, + "end_time": 36.61070247168957, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_6_A.wav", + "silence_duration": 0.372748204434117, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "She likes to complain about her macho husband and her 'bambinos', but she loves them all dearly.", + "original_text": "She likes to complain about her macho husband and her 'bambinos', but she loves them all dearly.", + "start_time": 36.94014872784957, + "end_time": 41.90921902263415, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--462/temp/line_7_B.wav", + "silence_duration": 0.3294462561599991, + "is_interrupted": false + } + ] + }, + "DialogSum--val--463": { + "original_text": "A: OK, Dead Man. If this doesn't start your engine, nothing will. \nB: Thank you. Hey, do you know how espresso got its [interrupt] unique flavor and rich aroma from the specific roasting process and high-pressure extraction method that creates those distinctive caramelized notes and velvety crema on top? \nA: Sorry to cut in, but I was wondering if you could recommend a good place to get an espresso around here? \nB: Sure, I know a few spots. But as I was saying, espresso got its name because of the way the steam and boiling water are pressed through the coffee. Es-PRESS-o, get it? The perfect espresso should have a balance of sweetness, acidity, and bitterness that dances on your palate.", + "cleaned_text": "A: OK, Dead Man. If this doesn't start your engine, nothing will. \nB:Thank you. Hey, do you know how espresso got its unique flavor and rich aroma from the specific roasting process and high-pressure extraction method that creates those distinctive caramelized notes and velvety crema on top?\nA: Sorry to cut in, but I was wondering if you could recommend a good place to get an espresso around here? \nB: Sure, I know a few spots. But as I was saying, espresso got its name because of the way the steam and boiling water are pressed through the coffee. Es-PRESS-o, get it? The perfect espresso should have a balance of sweetness, acidity, and bitterness that dances on your palate.", + "total_duration": 30.68294784580499, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--463/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--463/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--463/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "OK, Dead Man. If this doesn't start your engine, nothing will.", + "original_text": "OK, Dead Man. If this doesn't start your engine, nothing will.", + "start_time": 0, + "end_time": 4.249251700680272, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--463/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Thank you. Hey, do you know how espresso got its", + "original_text": "Thank you. Hey, do you know how espresso got its [interrupt] unique flavor and rich aroma from the specific roasting process and high-pressure extraction method that creates those distinctive caramelized notes and velvety crema on top?", + "start_time": 4.837534838190339, + "end_time": 16.052772933428436, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--463/temp/line_1_B.wav", + "silence_duration": 0.5882831375100667, + "is_interrupted": true, + "text_after_interrupt": "unique flavor and rich aroma from the specific roasting process and high-pressure extraction method that creates those distinctive caramelized notes and velvety crema on top?" + }, + { + "speaker": "A", + "text": "Sorry to cut in, but I was wondering if you could recommend a good place to get an espresso around here?", + "original_text": "Sorry to cut in, but I was wondering if you could recommend a good place to get an espresso around here?", + "start_time": 7.229190166988525, + "end_time": 13.161888579686938, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--463/temp/line_2_A.wav", + "silence_duration": 0.48484847160376127, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure, I know a few spots. But as I was saying, espresso got its name because of the way the steam and boiling water are pressed through the coffee. Es-PRESS-o, get it? The perfect espresso should have a balance of sweetness, acidity, and bitterness that dances on your palate.", + "original_text": "Sure, I know a few spots. But as I was saying, espresso got its name because of the way the steam and boiling water are pressed through the coffee. Es-PRESS-o, get it? The perfect espresso should have a balance of sweetness, acidity, and bitterness that dances on your palate.", + "start_time": 16.483975647466263, + "end_time": 30.68297791503996, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--463/temp/line_3_B.wav", + "silence_duration": 0.43120271403782773, + "is_interrupted": false + } + ] + }, + "DialogSum--val--464": { + "original_text": "A: Are you busy with your work? \nB: Yes. What about you? \nA: Yes, I'm very busy, too. Sometimes I work [interrupt] late into the night to meet deadlines, which can be exhausting but necessary when we have important projects with tight schedules. \nB: Overtime? How often do you have to stay late at the office? \nA: Quite often, especially during peak seasons. But I was saying that we can travel twice every year. \nB: Is this time one of them? \nA: Yes, we won't travel again until [interrupt] the end of the year, probably around Christmas when things slow down at work and we can finally take some well-deserved time off. \nB: October? That's a nice time for a vacation. We only get one chance to travel every year. \nA: Really? Then you must make the most of that one trip by carefully planning your itinerary and choosing destinations that offer diverse experiences.", + "cleaned_text": "A: Are you busy with your work? \nB: Yes. What about you? \nA:Yes, I'm very busy, too. Sometimes I work late into the night to meet deadlines, which can be exhausting but necessary when we have important projects with tight schedules.\nB: Overtime? How often do you have to stay late at the office? \nA: Quite often, especially during peak seasons. But I was saying that we can travel twice every year. \nB: Is this time one of them? \nA:Yes, we won't travel again until the end of the year, probably around Christmas when things slow down at work and we can finally take some well-deserved time off.\nB: October? That's a nice time for a vacation. We only get one chance to travel every year. \nA: Really? Then you must make the most of that one trip by carefully planning your itinerary and choosing destinations that offer diverse experiences.", + "total_duration": 42.67768707482993, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Are you busy with your work?", + "original_text": "Are you busy with your work?", + "start_time": 0, + "end_time": 1.3931972789115645, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. What about you?", + "original_text": "Yes. What about you?", + "start_time": 1.7509069506851533, + "end_time": 3.109274297623929, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_1_B.wav", + "silence_duration": 0.3577096717735889, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I'm very busy, too. Sometimes I work", + "original_text": "Yes, I'm very busy, too. Sometimes I work [interrupt] late into the night to meet deadlines, which can be exhausting but necessary when we have important projects with tight schedules.", + "start_time": 3.612775776754155, + "end_time": 14.526154461561411, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_2_A.wav", + "silence_duration": 0.5035014791302256, + "is_interrupted": true, + "text_after_interrupt": "late into the night to meet deadlines, which can be exhausting but necessary when we have important projects with tight schedules." + }, + { + "speaker": "B", + "text": "Overtime? How often do you have to stay late at the office?", + "original_text": "Overtime? How often do you have to stay late at the office?", + "start_time": 6.886789382196332, + "end_time": 11.066381218931026, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_3_B.wav", + "silence_duration": 0.5513957278347013, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Quite often, especially during peak seasons. But I was saying that we can travel twice every year.", + "original_text": "Quite often, especially during peak seasons. But I was saying that we can travel twice every year.", + "start_time": 14.991930567545543, + "end_time": 20.90140902559543, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_4_A.wav", + "silence_duration": 0.4657761059841323, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Is this time one of them?", + "original_text": "Is this time one of them?", + "start_time": 21.47642080259743, + "end_time": 22.61419858037521, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_5_B.wav", + "silence_duration": 0.5750117770020022, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, we won't travel again until", + "original_text": "Yes, we won't travel again until [interrupt] the end of the year, probably around Christmas when things slow down at work and we can finally take some well-deserved time off.", + "start_time": 23.077166300144352, + "end_time": 32.585737728715785, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_6_A.wav", + "silence_duration": 0.46296771976914436, + "is_interrupted": true, + "text_after_interrupt": "the end of the year, probably around Christmas when things slow down at work and we can finally take some well-deserved time off." + }, + { + "speaker": "B", + "text": "October? That's a nice time for a vacation. We only get one chance to travel every year.", + "original_text": "October? That's a nice time for a vacation. We only get one chance to travel every year.", + "start_time": 29.3792236573248, + "end_time": 34.09287445097559, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_7_B.wav", + "silence_duration": 0.4376190728293432, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Really? Then you must make the most of that one trip by carefully planning your itinerary and choosing destinations that offer diverse experiences.", + "original_text": "Really? Then you must make the most of that one trip by carefully planning your itinerary and choosing destinations that offer diverse experiences.", + "start_time": 34.399792074474306, + "end_time": 42.67770590667385, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--464/temp/line_8_A.wav", + "silence_duration": 0.30691762349871604, + "is_interrupted": false + } + ] + }, + "DialogSum--val--465": { + "original_text": "A: Is this the A housing office? \nB: Yes, it is. Are you looking for housing for this semester? \nA: I was hoping to get into something on campus, but my friend told me that everything is [interrupt] already taken, and the chances of getting a spot are slim unless you apply very early or have special circumstances like being an international student. \nB: It is, but I can put you on a waiting list, if you would like. \nA: Please. And in the meantime, can I look at apartments available in the area from this office? \nB: Yes, here is a catalog that is put out every year with locations that meet campus requirements for As. \nA: Who do I talk to if I want to see some of them? \nB: The individual landlord's numbers are next to each entry. You can call them with any questions you may have. Oh, and about the waiting list, I forgot to mention— \nA: Right, about the waiting list, how long is the wait usually? \n\n", + "cleaned_text": "A: Is this the A housing office? \nB: Yes, it is. Are you looking for housing for this semester? \nA:I was hoping to get into something on campus, but my friend told me that everything is already taken, and the chances of getting a spot are slim unless you apply very early or have special circumstances like being an international student.\nB: It is, but I can put you on a waiting list, if you would like. \nA: Please. And in the meantime, can I look at apartments available in the area from this office? \nB: Yes, here is a catalog that is put out every year with locations that meet campus requirements for As. \nA: Who do I talk to if I want to see some of them? \nB: The individual landlord's numbers are next to each entry. You can call them with any questions you may have. Oh, and about the waiting list, I forgot to mention— \nA: Right, about the waiting list, how long is the wait usually? \n\n", + "total_duration": 46.27242630385488, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Is this the A housing office?", + "original_text": "Is this the A housing office?", + "start_time": 0, + "end_time": 1.9504761904761905, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, it is. Are you looking for housing for this semester?", + "original_text": "Yes, it is. Are you looking for housing for this semester?", + "start_time": 2.516755368577975, + "end_time": 5.616619314156207, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_1_B.wav", + "silence_duration": 0.5662791781017846, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I was hoping to get into something on campus, but my friend told me that everything is", + "original_text": "I was hoping to get into something on campus, but my friend told me that everything is [interrupt] already taken, and the chances of getting a spot are slim unless you apply very early or have special circumstances like being an international student.", + "start_time": 6.01264797166759, + "end_time": 20.025890602053078, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_2_A.wav", + "silence_duration": 0.3960286575113832, + "is_interrupted": true, + "text_after_interrupt": "already taken, and the chances of getting a spot are slim unless you apply very early or have special circumstances like being an international student." + }, + { + "speaker": "B", + "text": "It is, but I can put you on a waiting list, if you would like.", + "original_text": "It is, but I can put you on a waiting list, if you would like.", + "start_time": 11.028158175749223, + "end_time": 14.162852053300243, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_3_B.wav", + "silence_duration": 0.4993493210608926, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Please. And in the meantime, can I look at apartments available in the area from this office?", + "original_text": "Please. And in the meantime, can I look at apartments available in the area from this office?", + "start_time": 20.395710352007995, + "end_time": 25.80595978511457, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_4_A.wav", + "silence_duration": 0.3698197499549172, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, here is a catalog that is put out every year with locations that meet campus requirements for As.", + "original_text": "Yes, here is a catalog that is put out every year with locations that meet campus requirements for As.", + "start_time": 26.208798445935862, + "end_time": 31.28235853663881, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_5_B.wav", + "silence_duration": 0.4028386608212933, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Who do I talk to if I want to see some of them?", + "original_text": "Who do I talk to if I want to see some of them?", + "start_time": 31.843648941888254, + "end_time": 34.316574111956285, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_6_A.wav", + "silence_duration": 0.561290405249445, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The individual landlord's numbers are next to each entry. You can call them with any questions you may have. Oh, and about the waiting list, I forgot to mention—", + "original_text": "The individual landlord's numbers are next to each entry. You can call them with any questions you may have. Oh, and about the waiting list, I forgot to mention—", + "start_time": 34.618347262820734, + "end_time": 42.35059216077992, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_7_B.wav", + "silence_duration": 0.30177315086445133, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Right, about the waiting list, how long is the wait usually?", + "original_text": "Right, about the waiting list, how long is the wait usually?", + "start_time": 42.94037419161896, + "end_time": 46.27243768368245, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--465/temp/line_8_A.wav", + "silence_duration": 0.5897820308390398, + "is_interrupted": false + } + ] + }, + "DialogSum--val--466": { + "original_text": "A: I was just about to go to bed when the telephone rang last night. \nB: Who was it? \nA: Kate. She said she was too excited to [interrupt] sleep because she had just come back from a date and couldn't stop talking about how perfect everything was - from the restaurant they went to, to the way he looked at her all evening. \nB: Too excited? Let me guess—was it about her new boyfriend? \nA: Yes, exactly! But I haven't told you what we were talking about last night. \nB: So, what did she say this time? \nA: Well, she was going on and on about how amazing he is, and how she couldn't sleep because of it. \nB: She never cares about others. \nA: It's true. But now I'm curious, how did you know about her new boyfriend? \nB: I was also interrupted by her last week because of such a thing.", + "cleaned_text": "A: I was just about to go to bed when the telephone rang last night. \nB: Who was it? \nA:Kate. She said she was too excited to sleep because she had just come back from a date and couldn't stop talking about how perfect everything was - from the restaurant they went to, to the way he looked at her all evening.\nB: Too excited? Let me guess—was it about her new boyfriend? \nA: Yes, exactly! But I haven't told you what we were talking about last night. \nB: So, what did she say this time? \nA: Well, she was going on and on about how amazing he is, and how she couldn't sleep because of it. \nB: She never cares about others. \nA: It's true. But now I'm curious, how did you know about her new boyfriend? \nB: I was also interrupted by her last week because of such a thing.", + "total_duration": 42.59945578231292, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I was just about to go to bed when the telephone rang last night.", + "original_text": "I was just about to go to bed when the telephone rang last night.", + "start_time": 0, + "end_time": 3.9938321995464854, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Who was it?", + "original_text": "Who was it?", + "start_time": 4.560634619887178, + "end_time": 5.234013304694434, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_1_B.wav", + "silence_duration": 0.5668024203406932, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Kate. She said she was too excited to", + "original_text": "Kate. She said she was too excited to [interrupt] sleep because she had just come back from a date and couldn't stop talking about how perfect everything was - from the restaurant they went to, to the way he looked at her all evening.", + "start_time": 5.589476334534674, + "end_time": 18.081811935441703, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_2_A.wav", + "silence_duration": 0.35546302984024003, + "is_interrupted": true, + "text_after_interrupt": "sleep because she had just come back from a date and couldn't stop talking about how perfect everything was - from the restaurant they went to, to the way he looked at her all evening." + }, + { + "speaker": "B", + "text": "Too excited? Let me guess—was it about her new boyfriend?", + "original_text": "Too excited? Let me guess—was it about her new boyfriend?", + "start_time": 8.108841413899754, + "end_time": 10.906845949047145, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_3_B.wav", + "silence_duration": 0.5716004333231512, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, exactly! But I haven't told you what we were talking about last night.", + "original_text": "Yes, exactly! But I haven't told you what we were talking about last night.", + "start_time": 18.562312206817627, + "end_time": 23.39206277371105, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_4_A.wav", + "silence_duration": 0.4805002713759233, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "So, what did she say this time?", + "original_text": "So, what did she say this time?", + "start_time": 23.777726678614624, + "end_time": 25.36829357203866, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_5_B.wav", + "silence_duration": 0.3856639049035727, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, she was going on and on about how amazing he is, and how she couldn't sleep because of it.", + "original_text": "Well, she was going on and on about how amazing he is, and how she couldn't sleep because of it.", + "start_time": 25.674388426122302, + "end_time": 31.51420702022661, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_6_A.wav", + "silence_duration": 0.3060948540836425, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "She never cares about others.", + "original_text": "She never cares about others.", + "start_time": 31.895147900326684, + "end_time": 33.3347850885353, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_7_B.wav", + "silence_duration": 0.380940880100073, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's true. But now I'm curious, how did you know about her new boyfriend?", + "original_text": "It's true. But now I'm curious, how did you know about her new boyfriend?", + "start_time": 33.71083136852373, + "end_time": 38.70312161795683, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_8_A.wav", + "silence_duration": 0.3760462799884283, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was also interrupted by her last week because of such a thing.", + "original_text": "I was also interrupted by her last week because of such a thing.", + "start_time": 39.302261624462815, + "end_time": 42.59949518455352, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--466/temp/line_9_B.wav", + "silence_duration": 0.5991400065059869, + "is_interrupted": false + } + ] + }, + "DialogSum--val--468": { + "original_text": "A: There are so many record players here. That is hard to choose one that suits our needs and preferences. \nB: Sorry to interrupt, but do you think we should prioritize sound quality or space-saving features? \nA: Good point. I'd rather get one with separated speakers. They give a clear sound. \nB: Yes, but we shouldn't get anything too big. Remember it has to fit in with our living room furniture. \nA: That's right. Now this one looks alright? It's a detached or do you prefer this one? It's [interrupt] compact and has integrated speakers, which might save us some space while still delivering decent audio quality for our vinyl collection. \nB: Oh, I didn't catch which one you were talking about. Were you asking about the Sony model? \nA: Yes, the Sony one. Let's have the salesmen for a demonstration.", + "cleaned_text": "A: There are so many record players here. That is hard to choose one that suits our needs and preferences. \nB: Sorry to interrupt, but do you think we should prioritize sound quality or space-saving features? \nA: Good point. I'd rather get one with separated speakers. They give a clear sound. \nB: Yes, but we shouldn't get anything too big. Remember it has to fit in with our living room furniture. \nA:That's right. Now this one looks alright? It's a detached or do you prefer this one? It's compact and has integrated speakers, which might save us some space while still delivering decent audio quality for our vinyl collection.\nB: Oh, I didn't catch which one you were talking about. Were you asking about the Sony model? \nA: Yes, the Sony one. Let's have the salesmen for a demonstration.", + "total_duration": 41.2065306122449, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "There are so many record players here. That is hard to choose one that suits our needs and preferences.", + "original_text": "There are so many record players here. That is hard to choose one that suits our needs and preferences.", + "start_time": 0, + "end_time": 5.979138321995465, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but do you think we should prioritize sound quality or space-saving features?", + "original_text": "Sorry to interrupt, but do you think we should prioritize sound quality or space-saving features?", + "start_time": 6.356508961459599, + "end_time": 11.395239120189757, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/temp/line_1_B.wav", + "silence_duration": 0.37737063946413396, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Good point. I'd rather get one with separated speakers. They give a clear sound.", + "original_text": "Good point. I'd rather get one with separated speakers. They give a clear sound.", + "start_time": 11.786616717348135, + "end_time": 17.162036218481923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/temp/line_2_A.wav", + "silence_duration": 0.39137759715837833, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, but we shouldn't get anything too big. Remember it has to fit in with our living room furniture.", + "original_text": "Yes, but we shouldn't get anything too big. Remember it has to fit in with our living room furniture.", + "start_time": 17.5024623534414, + "end_time": 22.494752602874506, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/temp/line_3_B.wav", + "silence_duration": 0.3404261349594742, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's right. Now this one looks alright? It's a detached or do you prefer this one? It's", + "original_text": "That's right. Now this one looks alright? It's a detached or do you prefer this one? It's [interrupt] compact and has integrated speakers, which might save us some space while still delivering decent audio quality for our vinyl collection.", + "start_time": 22.886874315548422, + "end_time": 36.78401717269128, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/temp/line_4_A.wav", + "silence_duration": 0.39212171267391494, + "is_interrupted": true, + "text_after_interrupt": "compact and has integrated speakers, which might save us some space while still delivering decent audio quality for our vinyl collection." + }, + { + "speaker": "B", + "text": "Oh, I didn't catch which one you were talking about. Were you asking about the Sony model?", + "original_text": "Oh, I didn't catch which one you were talking about. Were you asking about the Sony model?", + "start_time": 28.657033045707152, + "end_time": 32.766965018496265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/temp/line_5_B.wav", + "silence_duration": 0.47244277947204194, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, the Sony one. Let's have the salesmen for a demonstration.", + "original_text": "Yes, the Sony one. Let's have the salesmen for a demonstration.", + "start_time": 37.131449944459874, + "end_time": 41.2065519852762, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--468/temp/line_6_A.wav", + "silence_duration": 0.34743277176859455, + "is_interrupted": false + } + ] + }, + "DialogSum--val--469": { + "original_text": "A: You are married to a foreigner, huh? So what's it like? \nB: Well, the first year of our marriage, we had great difficulty getting along. The things that are important to me are not important to [interrupt] him, and it took us a while to understand each other's priorities, especially when it came to family traditions, financial planning, and even simple daily routines like meal times. \nA: I totally get that. Cultural differences can really make things challenging. How did you manage to work through those conflicts? \nB: We had a lot of discussions and really tried to understand each other's perspectives. And now we have a two-year-old boy. We're very happy that he's healthy and smart. \nA: Oh, so he's half Chinese and half American. That's unusual. What languages does he speak, then? \nB: Right now he speaks mostly Chinese, and he can say a few English words. But he will [interrupt] likely become more fluent in both languages as he grows older, especially since we plan to expose him to both cultures actively through bilingual education, frequent travel, and maintaining close relationships with relatives from both sides. \nA: I was just curious, what does he look like? Can people tell he's mixed? \nB: Yes, people surely can. He's whiter than the Chinese kids, and his hair is a little blonde. My husband says his eyes are very Chinese though. And about the languages, I was going to say that he will eventually learn more English as he grows up.", + "cleaned_text": "A: You are married to a foreigner, huh? So what's it like? \nB:Well, the first year of our marriage, we had great difficulty getting along. The things that are important to me are not important to him, and it took us a while to understand each other's priorities, especially when it came to family traditions, financial planning, and even simple daily routines like meal times.\nA: I totally get that. Cultural differences can really make things challenging. How did you manage to work through those conflicts? \nB: We had a lot of discussions and really tried to understand each other's perspectives. And now we have a two-year-old boy. We're very happy that he's healthy and smart. \nA: Oh, so he's half Chinese and half American. That's unusual. What languages does he speak, then? \nB:Right now he speaks mostly Chinese, and he can say a few English words. But he will likely become more fluent in both languages as he grows older, especially since we plan to expose him to both cultures actively through bilingual education, frequent travel, and maintaining close relationships with relatives from both sides.\nA: I was just curious, what does he look like? Can people tell he's mixed? \nB: Yes, people surely can. He's whiter than the Chinese kids, and his hair is a little blonde. My husband says his eyes are very Chinese though. And about the languages, I was going to say that he will eventually learn more English as he grows up.", + "total_duration": 65.70857142857143, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You are married to a foreigner, huh? So what's it like?", + "original_text": "You are married to a foreigner, huh? So what's it like?", + "start_time": 0, + "end_time": 3.3901133786848074, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, the first year of our marriage, we had great difficulty getting along. The things that are important to me are not important to", + "original_text": "Well, the first year of our marriage, we had great difficulty getting along. The things that are important to me are not important to [interrupt] him, and it took us a while to understand each other's priorities, especially when it came to family traditions, financial planning, and even simple daily routines like meal times.", + "start_time": 3.7196076206943514, + "end_time": 19.671716464231768, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_1_B.wav", + "silence_duration": 0.3294942420095441, + "is_interrupted": true, + "text_after_interrupt": "him, and it took us a while to understand each other's priorities, especially when it came to family traditions, financial planning, and even simple daily routines like meal times." + }, + { + "speaker": "A", + "text": "I totally get that. Cultural differences can really make things challenging. How did you manage to work through those conflicts?", + "original_text": "I totally get that. Cultural differences can really make things challenging. How did you manage to work through those conflicts?", + "start_time": 10.59271419665807, + "end_time": 18.162419412077572, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_2_A.wav", + "silence_duration": 0.5071274551848958, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We had a lot of discussions and really tried to understand each other's perspectives. And now we have a two-year-old boy. We're very happy that he's healthy and smart.", + "original_text": "We had a lot of discussions and really tried to understand each other's perspectives. And now we have a two-year-old boy. We're very happy that he's healthy and smart.", + "start_time": 20.094879403413024, + "end_time": 27.385945163050213, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_3_B.wav", + "silence_duration": 0.4231629391812578, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, so he's half Chinese and half American. That's unusual. What languages does he speak, then?", + "original_text": "Oh, so he's half Chinese and half American. That's unusual. What languages does he speak, then?", + "start_time": 27.857378040917006, + "end_time": 34.34735536518004, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_4_A.wav", + "silence_duration": 0.4714328778667928, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Right now he speaks mostly Chinese, and he can say a few English words. But he will", + "original_text": "Right now he speaks mostly Chinese, and he can say a few English words. But he will [interrupt] likely become more fluent in both languages as he grows older, especially since we plan to expose him to both cultures actively through bilingual education, frequent travel, and maintaining close relationships with relatives from both sides.", + "start_time": 34.73746751484201, + "end_time": 51.96667386404836, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_5_B.wav", + "silence_duration": 0.39011214966196966, + "is_interrupted": true, + "text_after_interrupt": "likely become more fluent in both languages as he grows older, especially since we plan to expose him to both cultures actively through bilingual education, frequent travel, and maintaining close relationships with relatives from both sides." + }, + { + "speaker": "A", + "text": "I was just curious, what does he look like? Can people tell he's mixed?", + "original_text": "I was just curious, what does he look like? Can people tell he's mixed?", + "start_time": 47.81769830360165, + "end_time": 53.00735816754723, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_6_A.wav", + "silence_duration": 0.3704796479478507, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, people surely can. He's whiter than the Chinese kids, and his hair is a little blonde. My husband says his eyes are very Chinese though. And about the languages, I was going to say that he will eventually learn more English as he grows up.", + "original_text": "Yes, people surely can. He's whiter than the Chinese kids, and his hair is a little blonde. My husband says his eyes are very Chinese though. And about the languages, I was going to say that he will eventually learn more English as he grows up.", + "start_time": 53.30915083623905, + "end_time": 65.70860661855197, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--469/temp/line_7_B.wav", + "silence_duration": 0.30179266869181487, + "is_interrupted": false + } + ] + }, + "DialogSum--val--470": { + "original_text": "A: When were you born may I ask? \nB: On 20th May 1963. \nA: Do you know what it was according to the lunar calendar? \nB: 27th day of the fourth month. By the way, could you tell me when the film will [interrupt] start so that I can plan my day accordingly and make sure I arrive early enough to get good seats? \nA: Oh, speaking of the film, I just remembered I might need to reschedule my plans. What time does it start again? \nB: It will begin at five thirty. \nA: Right, thanks. But you were saying something about the lunar calendar date—what was the rest of that? \nB: I was just asking when the film will begin. Anyway, I am frigid I can't be there on time. \nA: You can see it tomorrow. \nB: I don't want to miss it today. \nA: See you.", + "cleaned_text": "A: When were you born may I ask? \nB: On 20th May 1963. \nA: Do you know what it was according to the lunar calendar? \nB:27th day of the fourth month. By the way, could you tell me when the film will start so that I can plan my day accordingly and make sure I arrive early enough to get good seats?\nA: Oh, speaking of the film, I just remembered I might need to reschedule my plans. What time does it start again? \nB: It will begin at five thirty. \nA: Right, thanks. But you were saying something about the lunar calendar date—what was the rest of that? \nB: I was just asking when the film will begin. Anyway, I am frigid I can't be there on time. \nA: You can see it tomorrow. \nB: I don't want to miss it today. \nA: See you.", + "total_duration": 38.58458049886622, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "When were you born may I ask?", + "original_text": "When were you born may I ask?", + "start_time": 0, + "end_time": 1.799546485260771, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "On 20th May 1963.", + "original_text": "On 20th May 1963.", + "start_time": 2.2178109873092757, + "end_time": 4.690736157377303, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_1_B.wav", + "silence_duration": 0.4182645020485048, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Do you know what it was according to the lunar calendar?", + "original_text": "Do you know what it was according to the lunar calendar?", + "start_time": 5.121213873007361, + "end_time": 7.779898680263596, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_2_A.wav", + "silence_duration": 0.4304777156300572, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "27th day of the fourth month. By the way, could you tell me when the film will", + "original_text": "27th day of the fourth month. By the way, could you tell me when the film will [interrupt] start so that I can plan my day accordingly and make sure I arrive early enough to get good seats?", + "start_time": 8.096585750806652, + "end_time": 17.732866929944976, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_3_B.wav", + "silence_duration": 0.3166870705430559, + "is_interrupted": true, + "text_after_interrupt": "start so that I can plan my day accordingly and make sure I arrive early enough to get good seats?" + }, + { + "speaker": "A", + "text": "Oh, speaking of the film, I just remembered I might need to reschedule my plans. What time does it start again?", + "original_text": "Oh, speaking of the film, I just remembered I might need to reschedule my plans. What time does it start again?", + "start_time": 12.914726340375813, + "end_time": 19.39309368731459, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_4_A.wav", + "silence_duration": 0.3626453910701799, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It will begin at five thirty.", + "original_text": "It will begin at five thirty.", + "start_time": 19.958289836387177, + "end_time": 21.35148711529874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_5_B.wav", + "silence_duration": 0.5651961490725883, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Right, thanks. But you were saying something about the lunar calendar date—what was the rest of that?", + "original_text": "Right, thanks. But you were saying something about the lunar calendar date—what was the rest of that?", + "start_time": 21.7463564595847, + "end_time": 27.51651518974343, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_6_A.wav", + "silence_duration": 0.3948693442859577, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was just asking when the film will begin. Anyway, I am frigid I can't be there on time.", + "original_text": "I was just asking when the film will begin. Anyway, I am frigid I can't be there on time.", + "start_time": 28.082048618560357, + "end_time": 33.51551800631546, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_7_B.wav", + "silence_duration": 0.5655334288169258, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You can see it tomorrow.", + "original_text": "You can see it tomorrow.", + "start_time": 33.94610844317022, + "end_time": 35.397355608703094, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_8_A.wav", + "silence_duration": 0.43059043685475495, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't want to miss it today.", + "original_text": "I don't want to miss it today.", + "start_time": 35.77579216627454, + "end_time": 37.28508921842874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_9_B.wav", + "silence_duration": 0.37843655757145045, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "See you.", + "original_text": "See you.", + "start_time": 37.74868121708301, + "end_time": 38.58459958442995, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--470/temp/line_10_A.wav", + "silence_duration": 0.46359199865427003, + "is_interrupted": false + } + ] + }, + "DialogSum--val--471": { + "original_text": "A: Harry, do you like the opera? \nB: No, not really. \nA: Why is that? It is called real [interrupt] art, you know, and it has influenced so many other forms of music and theater throughout history, with its complex compositions and dramatic storytelling that continues to inspire modern performances. \nB: Sorry to jump in, but when you say \"real art,\" do you mean in terms of its historical significance or the skill involved? \nA: Both, actually. Opera has a rich history and requires immense talent. But you mentioned it gets on your nerves because of the language barrier. Could you elaborate on that? \nB: Well, it's very expensive and they're usually singing in another language. That kind of gets on my nerves.", + "cleaned_text": "A: Harry, do you like the opera? \nB: No, not really. \nA:Why is that? It is called real art, you know, and it has influenced so many other forms of music and theater throughout history, with its complex compositions and dramatic storytelling that continues to inspire modern performances.\nB: Sorry to jump in, but when you say \"real art,\" do you mean in terms of its historical significance or the skill involved? \nA: Both, actually. Opera has a rich history and requires immense talent. But you mentioned it gets on your nerves because of the language barrier. Could you elaborate on that? \nB: Well, it's very expensive and they're usually singing in another language. That kind of gets on my nerves.", + "total_duration": 35.19074829931973, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Harry, do you like the opera?", + "original_text": "Harry, do you like the opera?", + "start_time": 0, + "end_time": 2.1130158730158732, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, not really.", + "original_text": "No, not really.", + "start_time": 2.414993338108506, + "end_time": 3.4482813199679168, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/temp/line_1_B.wav", + "silence_duration": 0.3019774650926327, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why is that? It is called real", + "original_text": "Why is that? It is called real [interrupt] art, you know, and it has influenced so many other forms of music and theater throughout history, with its complex compositions and dramatic storytelling that continues to inspire modern performances.", + "start_time": 4.044512417545801, + "end_time": 18.696303800765754, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/temp/line_2_A.wav", + "silence_duration": 0.5962310975778837, + "is_interrupted": true, + "text_after_interrupt": "art, you know, and it has influenced so many other forms of music and theater throughout history, with its complex compositions and dramatic storytelling that continues to inspire modern performances." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but when you say \"real art,\" do you mean in terms of its historical significance or the skill involved?", + "original_text": "Sorry to jump in, but when you say \"real art,\" do you mean in terms of its historical significance or the skill involved?", + "start_time": 6.436167746343987, + "end_time": 12.833265252012922, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/temp/line_3_B.wav", + "silence_duration": 0.4367288793190609, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Both, actually. Opera has a rich history and requires immense talent. But you mentioned it gets on your nerves because of the language barrier. Could you elaborate on that?", + "original_text": "Both, actually. Opera has a rich history and requires immense talent. But you mentioned it gets on your nerves because of the language barrier. Could you elaborate on that?", + "start_time": 19.284551880007452, + "end_time": 29.594211743953032, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/temp/line_4_A.wav", + "silence_duration": 0.5882480792416964, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, it's very expensive and they're usually singing in another language. That kind of gets on my nerves.", + "original_text": "Well, it's very expensive and they're usually singing in another language. That kind of gets on my nerves.", + "start_time": 30.09400611200821, + "end_time": 35.19078615735968, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--471/temp/line_5_B.wav", + "silence_duration": 0.4997943680551771, + "is_interrupted": false + } + ] + }, + "DialogSum--val--473": { + "original_text": "A: Mary, do you remember when we met? \nB: I won't ever forget it! I was sitting in the cafeteria all by myself. . . \nA: And I came up and asked to [interrupt] sit with you because you looked like you could use some company and I had been wanting to make new friends since transferring to the school that semester. \nB: Sorry, just curious, what made you come over to me in the first place? \nA: I noticed you seemed a bit lonely, and I thought we might have something in common. But I was going to ask if you remember what you were about to say before I interrupted. \nB: Oh, right! I was going to say, you asked to sit by me, and that really made my day. \nA: It seems like it was just yesterday.", + "cleaned_text": "A: Mary, do you remember when we met? \nB: I won't ever forget it! I was sitting in the cafeteria all by myself. . . \nA:And I came up and asked to sit with you because you looked like you could use some company and I had been wanting to make new friends since transferring to the school that semester.\nB: Sorry, just curious, what made you come over to me in the first place? \nA: I noticed you seemed a bit lonely, and I thought we might have something in common. But I was going to ask if you remember what you were about to say before I interrupted. \nB: Oh, right! I was going to say, you asked to sit by me, and that really made my day. \nA: It seems like it was just yesterday.", + "total_duration": 34.6740589569161, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Mary, do you remember when we met?", + "original_text": "Mary, do you remember when we met?", + "start_time": 0, + "end_time": 2.589024943310658, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I won't ever forget it! I was sitting in the cafeteria all by myself. . .", + "original_text": "I won't ever forget it! I was sitting in the cafeteria all by myself. . .", + "start_time": 3.060776960741249, + "end_time": 6.671479908587054, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/temp/line_1_B.wav", + "silence_duration": 0.47175201743059103, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And I came up and asked to", + "original_text": "And I came up and asked to [interrupt] sit with you because you looked like you could use some company and I had been wanting to make new friends since transferring to the school that semester.", + "start_time": 7.223590813317077, + "end_time": 17.74223026909939, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/temp/line_2_A.wav", + "silence_duration": 0.5521109047300232, + "is_interrupted": true, + "text_after_interrupt": "sit with you because you looked like you could use some company and I had been wanting to make new friends since transferring to the school that semester." + }, + { + "speaker": "B", + "text": "Sorry, just curious, what made you come over to me in the first place?", + "original_text": "Sorry, just curious, what made you come over to me in the first place?", + "start_time": 9.081187185199164, + "end_time": 12.680280155720705, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/temp/line_3_B.wav", + "silence_duration": 0.5670568319400652, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I noticed you seemed a bit lonely, and I thought we might have something in common. But I was going to ask if you remember what you were about to say before I interrupted.", + "original_text": "I noticed you seemed a bit lonely, and I thought we might have something in common. But I was going to ask if you remember what you were about to say before I interrupted.", + "start_time": 18.12528149013225, + "end_time": 27.599022986730887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/temp/line_4_A.wav", + "silence_duration": 0.38305122103285855, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right! I was going to say, you asked to sit by me, and that really made my day.", + "original_text": "Oh, right! I was going to say, you asked to sit by me, and that really made my day.", + "start_time": 28.073152007925934, + "end_time": 32.125034094093735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/temp/line_5_B.wav", + "silence_duration": 0.47412902119504774, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It seems like it was just yesterday.", + "original_text": "It seems like it was just yesterday.", + "start_time": 32.67715745695563, + "end_time": 34.67407355672887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--473/temp/line_6_A.wav", + "silence_duration": 0.5521233628618949, + "is_interrupted": false + } + ] + }, + "DialogSum--val--475": { + "original_text": "A: Excuse me. May I see that laptop for a moment? \nB: Sure. You mean this one? \nA: No, the one on the left. Yes, that's the one. . . . Thank you. \nB: It's a state-of-the-art piece of equipment, sir. With a gigantic 16.1 USGA TFT screen, 2.8 Ghz mobile processor, generous 512 MB RAM, removable 80 GB hard drive, convenient CD-RW / DVD combo drive, stunning fast graphics board with 64 MB DDR DRAM, dual battery capability, integrated Fast Ethernet card, IEEE 1394 digital interface and eight USB ports, it has all the power of a desktop computer packed into an ultra-slim [interrupt] design with military-grade durability and spill-resistant keyboard, making it perfect for professionals who need reliability in demanding work environments.\nA: Sorry to cut in, but I just want to clarify—does it come with any pre-installed software or do I need to purchase that separately? \nB: It does come with some essential software pre-installed, like a basic operating system and productivity suite. Now, as I was saying, this ultra-slim notebook really offers the power of a desktop computer. The regular price is $2980.00, but until December the 31st it's on sale for just $2,699.00. \nA: That's a good discount. By the way, you mentioned earlier about the dual battery capability—how long does the battery last on a single charge?", + "cleaned_text": "A: Excuse me. May I see that laptop for a moment? \nB: Sure. You mean this one? \nA: No, the one on the left. Yes, that's the one. . . . Thank you. \nB:It's a state-of-the-art piece of equipment, sir. With a gigantic 16.1 USGA TFT screen, 2.8 Ghz mobile processor, generous 512 MB RAM, removable 80 GB hard drive, convenient CD-RW / DVD combo drive, stunning fast graphics board with 64 MB DDR DRAM, dual battery capability, integrated Fast Ethernet card, IEEE 1394 digital interface and eight USB ports, it has all the power of a desktop computer packed into an ultra-slim design with military-grade durability and spill-resistant keyboard, making it perfect for professionals who need reliability in demanding work environments.\nA: Sorry to cut in, but I just want to clarify—does it come with any pre-installed software or do I need to purchase that separately? \nB: It does come with some essential software pre-installed, like a basic operating system and productivity suite. Now, as I was saying, this ultra-slim notebook really offers the power of a desktop computer. The regular price is $2980.00, but until December the 31st it's on sale for just $2,699.00. \nA: That's a good discount. By the way, you mentioned earlier about the dual battery capability—how long does the battery last on a single charge?", + "total_duration": 89.2372335600907, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me. May I see that laptop for a moment?", + "original_text": "Excuse me. May I see that laptop for a moment?", + "start_time": 0, + "end_time": 3.250793650793651, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure. You mean this one?", + "original_text": "Sure. You mean this one?", + "start_time": 3.721487826378153, + "end_time": 4.97536537739856, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/temp/line_1_B.wav", + "silence_duration": 0.470694175584502, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, the one on the left. Yes, that's the one. . . . Thank you.", + "original_text": "No, the one on the left. Yes, that's the one. . . . Thank you.", + "start_time": 5.545010639140361, + "end_time": 10.096121750251472, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/temp/line_2_A.wav", + "silence_duration": 0.5696452617418, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's a state-of-the-art piece of equipment, sir. With a gigantic 16.1 USGA TFT screen, 2.8 Ghz mobile processor, generous 512 MB RAM, removable 80 GB hard drive, convenient CD-RW / DVD combo drive, stunning fast graphics board with 64 MB DDR DRAM, dual battery capability, integrated Fast Ethernet card, IEEE 1394 digital interface and eight USB ports, it has all the power of a desktop computer packed into an ultra-slim", + "original_text": "It's a state-of-the-art piece of equipment, sir. With a gigantic 16.1 USGA TFT screen, 2.8 Ghz mobile processor, generous 512 MB RAM, removable 80 GB hard drive, convenient CD-RW / DVD combo drive, stunning fast graphics board with 64 MB DDR DRAM, dual battery capability, integrated Fast Ethernet card, IEEE 1394 digital interface and eight USB ports, it has all the power of a desktop computer packed into an ultra-slim [interrupt] design with military-grade durability and spill-resistant keyboard, making it perfect for professionals who need reliability in demanding work environments.", + "start_time": 10.503241032619457, + "end_time": 61.354941712891566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/temp/line_3_B.wav", + "silence_duration": 0.4071192823679849, + "is_interrupted": true, + "text_after_interrupt": "design with military-grade durability and spill-resistant keyboard, making it perfect for professionals who need reliability in demanding work environments." + }, + { + "speaker": "A", + "text": "Sorry to cut in, but I just want to clarify—does it come with any pre-installed software or do I need to purchase that separately?", + "original_text": "Sorry to cut in, but I just want to clarify—does it come with any pre-installed software or do I need to purchase that separately?", + "start_time": 38.55294624803896, + "end_time": 46.66832039769882, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/temp/line_4_A.wav", + "silence_duration": 0.3666874611057658, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It does come with some essential software pre-installed, like a basic operating system and productivity suite. Now, as I was saying, this ultra-slim notebook really offers the power of a desktop computer. The regular price is $2980.00, but until December the 31st it's on sale for just $2,699.00.", + "original_text": "It does come with some essential software pre-installed, like a basic operating system and productivity suite. Now, as I was saying, this ultra-slim notebook really offers the power of a desktop computer. The regular price is $2980.00, but until December the 31st it's on sale for just $2,699.00.", + "start_time": 61.73139174948025, + "end_time": 80.82980444789295, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/temp/line_5_B.wav", + "silence_duration": 0.37645003658868903, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a good discount. By the way, you mentioned earlier about the dual battery capability—how long does the battery last on a single charge?", + "original_text": "That's a good discount. By the way, you mentioned earlier about the dual battery capability—how long does the battery last on a single charge?", + "start_time": 81.36568340695945, + "end_time": 89.23724803280979, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--475/temp/line_6_A.wav", + "silence_duration": 0.5358789590664892, + "is_interrupted": false + } + ] + }, + "DialogSum--val--476": { + "original_text": "A: Good morning. I'm thinking about buying some new furniture for my living room. Could you help me?\nB: Certainly. As you can see, we have several three-piece suites on sale. Feel free to sit down and test how comfortable they are.\nA: I came to your store yesterday and have come back today to make a final decision. I think I like the black leather suite. It's on sale, isn't it? I was also wondering about the warranty period for this set.\nB: Sorry to interrupt, but before you decide, have you considered how the black leather might affect the overall ambiance of your living room, especially if you're thinking about changing the lighting as well?\nA: That's a good point. I was actually going to ask about lighting next. But yes, the black leather suite is on sale, right?\nB: Yes. The price has been reduced by 50%. It's a real bargain.\nA: I'll take it. I also need to improve the lighting in my living room. Do you have any suggestions?\nB: Those floor lamps are very nice and you can vary the brightness according to whether you're reading or watching [interrupt] TV or entertaining guests, plus they feature energy-efficient LED bulbs that can last for years while providing excellent illumination throughout your spacious living area.\nA: Oh, I forgot to mention earlier, my living room is quite large, about 40 square meters. Do you think one floor lamp would be enough?\nB: I'd suggest you buy two. That allows you to change the brightness of the room better.", + "cleaned_text": "A: Good morning. I'm thinking about buying some new furniture for my living room. Could you help me?\nB: Certainly. As you can see, we have several three-piece suites on sale. Feel free to sit down and test how comfortable they are.\nA: I came to your store yesterday and have come back today to make a final decision. I think I like the black leather suite. It's on sale, isn't it? I was also wondering about the warranty period for this set.\nB: Sorry to interrupt, but before you decide, have you considered how the black leather might affect the overall ambiance of your living room, especially if you're thinking about changing the lighting as well?\nA: That's a good point. I was actually going to ask about lighting next. But yes, the black leather suite is on sale, right?\nB: Yes. The price has been reduced by 50%. It's a real bargain.\nA: I'll take it. I also need to improve the lighting in my living room. Do you have any suggestions?\nB:Those floor lamps are very nice and you can vary the brightness according to whether you're reading or watching TV or entertaining guests, plus they feature energy-efficient LED bulbs that can last for years while providing excellent illumination throughout your spacious living area.\nA: Oh, I forgot to mention earlier, my living room is quite large, about 40 square meters. Do you think one floor lamp would be enough?\nB: I'd suggest you buy two. That allows you to change the brightness of the room better.", + "total_duration": 73.86526077097506, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Good morning. I'm thinking about buying some new furniture for my living room. Could you help me?", + "original_text": "Good morning. I'm thinking about buying some new furniture for my living room. Could you help me?", + "start_time": 0, + "end_time": 4.957460317460318, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Certainly. As you can see, we have several three-piece suites on sale. Feel free to sit down and test how comfortable they are.", + "original_text": "Certainly. As you can see, we have several three-piece suites on sale. Feel free to sit down and test how comfortable they are.", + "start_time": 5.442865627655214, + "end_time": 12.095382634457936, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_1_B.wav", + "silence_duration": 0.4854053101948961, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I came to your store yesterday and have come back today to make a final decision. I think I like the black leather suite. It's on sale, isn't it? I was also wondering about the warranty period for this set.", + "original_text": "I came to your store yesterday and have come back today to make a final decision. I think I like the black leather suite. It's on sale, isn't it? I was also wondering about the warranty period for this set.", + "start_time": 12.465760191471338, + "end_time": 25.42249488534889, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_2_A.wav", + "silence_duration": 0.3703775570134023, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sorry to interrupt, but before you decide, have you considered how the black leather might affect the overall ambiance of your living room, especially if you're thinking about changing the lighting as well?", + "original_text": "Sorry to interrupt, but before you decide, have you considered how the black leather might affect the overall ambiance of your living room, especially if you're thinking about changing the lighting as well?", + "start_time": 25.985870915055834, + "end_time": 35.81952170870663, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_3_B.wav", + "silence_duration": 0.5633760297069461, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a good point. I was actually going to ask about lighting next. But yes, the black leather suite is on sale, right?", + "original_text": "That's a good point. I was actually going to ask about lighting next. But yes, the black leather suite is on sale, right?", + "start_time": 36.22057444048956, + "end_time": 43.650959928017905, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_4_A.wav", + "silence_duration": 0.40105273178292616, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. The price has been reduced by 50%. It's a real bargain.", + "original_text": "Yes. The price has been reduced by 50%. It's a real bargain.", + "start_time": 43.971272293239586, + "end_time": 48.127644175325756, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_5_B.wav", + "silence_duration": 0.320312365221681, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'll take it. I also need to improve the lighting in my living room. Do you have any suggestions?", + "original_text": "I'll take it. I also need to improve the lighting in my living room. Do you have any suggestions?", + "start_time": 48.53255911448995, + "end_time": 54.88321671086183, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_6_A.wav", + "silence_duration": 0.4049149391641916, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Those floor lamps are very nice and you can vary the brightness according to whether you're reading or watching", + "original_text": "Those floor lamps are very nice and you can vary the brightness according to whether you're reading or watching [interrupt] TV or entertaining guests, plus they feature energy-efficient LED bulbs that can last for years while providing excellent illumination throughout your spacious living area.", + "start_time": 55.35296680028475, + "end_time": 69.2501096574276, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_7_B.wav", + "silence_duration": 0.46975008942291785, + "is_interrupted": true, + "text_after_interrupt": "TV or entertaining guests, plus they feature energy-efficient LED bulbs that can last for years while providing excellent illumination throughout your spacious living area." + }, + { + "speaker": "A", + "text": "Oh, I forgot to mention earlier, my living room is quite large, about 40 square meters. Do you think one floor lamp would be enough?", + "original_text": "Oh, I forgot to mention earlier, my living room is quite large, about 40 square meters. Do you think one floor lamp would be enough?", + "start_time": 60.043397639287015, + "end_time": 67.71759265062488, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_8_A.wav", + "silence_duration": 0.4668533926013093, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd suggest you buy two. That allows you to change the brightness of the room better.", + "original_text": "I'd suggest you buy two. That allows you to change the brightness of the room better.", + "start_time": 69.59282425152993, + "end_time": 73.86529590685873, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--476/temp/line_9_B.wav", + "silence_duration": 0.34271459410232563, + "is_interrupted": false + } + ] + }, + "DialogSum--val--477": { + "original_text": "A: Can you help me with my timesheet? \nB: Sure! I can help you. Do you know where the timesheets are [interrupt] kept in the office? They should be in the filing cabinet near the break room, organized alphabetically by department. \nA: No, I don't know where to find one. \nB: Oh, they're usually kept on the shelf over there. Once you get one, you first put your name on it. OK? \nA: Yes, I can do that. \nB: Now you have to fill in the hours in the blanks and total the hours for the week. Do you know how to use military [interrupt] time to record your hours? It's actually quite simple once you get used to it, and it helps avoid any confusion between AM and PM hours. \nA: No, I don't know what that is. \nB: OK, so we just start counting hours at midnight and record it. Show all minutes as a dot and then write how many minutes. OK? \nA: Yes, I understand how to do this. \nB: After you total your hours, make sure you sign it and turn it in to your supervisor. \nA: Wait, you mentioned something about military time earlier. Can you explain that again? \nB: Sure! Military time is a 24-hour clock system. For example, 1 PM is 1300, and 11 PM is 2300. You just write the hours in that format. \nA: Got it, thanks! \nB: That was easy! Good luck and let me know if you need any help later on.", + "cleaned_text": "A: Can you help me with my timesheet? \nB:Sure! I can help you. Do you know where the timesheets are kept in the office? They should be in the filing cabinet near the break room, organized alphabetically by department.\nA: No, I don't know where to find one. \nB: Oh, they're usually kept on the shelf over there. Once you get one, you first put your name on it. OK? \nA: Yes, I can do that. \nB:Now you have to fill in the hours in the blanks and total the hours for the week. Do you know how to use military time to record your hours? It's actually quite simple once you get used to it, and it helps avoid any confusion between AM and PM hours.\nA: No, I don't know what that is. \nB: OK, so we just start counting hours at midnight and record it. Show all minutes as a dot and then write how many minutes. OK? \nA: Yes, I understand how to do this. \nB: After you total your hours, make sure you sign it and turn it in to your supervisor. \nA: Wait, you mentioned something about military time earlier. Can you explain that again? \nB: Sure! Military time is a 24-hour clock system. For example, 1 PM is 1300, and 11 PM is 2300. You just write the hours in that format. \nA: Got it, thanks! \nB: That was easy! Good luck and let me know if you need any help later on.", + "total_duration": 67.58657596371881, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Can you help me with my timesheet?", + "original_text": "Can you help me with my timesheet?", + "start_time": 0, + "end_time": 1.8343764172335602, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure! I can help you. Do you know where the timesheets are", + "original_text": "Sure! I can help you. Do you know where the timesheets are [interrupt] kept in the office? They should be in the filing cabinet near the break room, organized alphabetically by department.", + "start_time": 2.215356625357183, + "end_time": 10.6906400720692, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_1_B.wav", + "silence_duration": 0.3809802081236228, + "is_interrupted": true, + "text_after_interrupt": "kept in the office? They should be in the filing cabinet near the break room, organized alphabetically by department." + }, + { + "speaker": "A", + "text": "No, I don't know where to find one.", + "original_text": "No, I don't know where to find one.", + "start_time": 5.129460933747206, + "end_time": 7.068327146899133, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_2_A.wav", + "silence_duration": 0.5771620500240346, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, they're usually kept on the shelf over there. Once you get one, you first put your name on it. OK?", + "original_text": "Oh, they're usually kept on the shelf over there. Once you get one, you first put your name on it. OK?", + "start_time": 11.121360596756924, + "end_time": 15.858231345056243, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_3_B.wav", + "silence_duration": 0.43072052468772265, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I can do that.", + "original_text": "Yes, I can do that.", + "start_time": 16.310650764498746, + "end_time": 17.727067998058835, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_4_A.wav", + "silence_duration": 0.4524194194425031, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Now you have to fill in the hours in the blanks and total the hours for the week. Do you know how to use military", + "original_text": "Now you have to fill in the hours in the blanks and total the hours for the week. Do you know how to use military [interrupt] time to record your hours? It's actually quite simple once you get used to it, and it helps avoid any confusion between AM and PM hours.", + "start_time": 18.2383083411821, + "end_time": 30.8351337380075, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_5_B.wav", + "silence_duration": 0.5112403431232667, + "is_interrupted": true, + "text_after_interrupt": "time to record your hours? It's actually quite simple once you get used to it, and it helps avoid any confusion between AM and PM hours." + }, + { + "speaker": "A", + "text": "No, I don't know what that is.", + "original_text": "No, I don't know what that is.", + "start_time": 26.75757797656433, + "end_time": 28.766104053661838, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_6_A.wav", + "silence_duration": 0.45848417121503476, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK, so we just start counting hours at midnight and record it. Show all minutes as a dot and then write how many minutes. OK?", + "original_text": "OK, so we just start counting hours at midnight and record it. Show all minutes as a dot and then write how many minutes. OK?", + "start_time": 31.23280021674981, + "end_time": 37.96658706482237, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_7_B.wav", + "silence_duration": 0.39766647874230854, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, I understand how to do this.", + "original_text": "Yes, I understand how to do this.", + "start_time": 38.55586620799031, + "end_time": 40.634052149033394, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_8_A.wav", + "silence_duration": 0.5892791431679443, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "After you total your hours, make sure you sign it and turn it in to your supervisor.", + "original_text": "After you total your hours, make sure you sign it and turn it in to your supervisor.", + "start_time": 41.14334568746766, + "end_time": 45.63640691195745, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_9_B.wav", + "silence_duration": 0.5092935384342642, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, you mentioned something about military time earlier. Can you explain that again?", + "original_text": "Wait, you mentioned something about military time earlier. Can you explain that again?", + "start_time": 46.09087088732267, + "end_time": 51.129601046052834, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_10_A.wav", + "silence_duration": 0.4544639753652193, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Sure! Military time is a 24-hour clock system. For example, 1 PM is 1300, and 11 PM is 2300. You just write the hours in that format.", + "original_text": "Sure! Military time is a 24-hour clock system. For example, 1 PM is 1300, and 11 PM is 2300. You just write the hours in that format.", + "start_time": 51.690944942088656, + "end_time": 61.965774874061445, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_11_B.wav", + "silence_duration": 0.5613438960358247, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it, thanks!", + "original_text": "Got it, thanks!", + "start_time": 62.322015574866015, + "end_time": 63.355303556725424, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_12_A.wav", + "silence_duration": 0.35624070080456854, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That was easy! Good luck and let me know if you need any help later on.", + "original_text": "That was easy! Good luck and let me know if you need any help later on.", + "start_time": 63.76691421476105, + "end_time": 67.58659675444359, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--477/temp/line_13_B.wav", + "silence_duration": 0.41161065803563046, + "is_interrupted": false + } + ] + }, + "DialogSum--val--478": { + "original_text": "A: What did you say your stop was? \nB: Fifth Avenue. \nA: Oh, then you should have [interrupt] gotten off at the last stop because the train doesn't actually go any further in this direction and now you'll have to take the return trip back to Fifth Avenue. \nB: Wait, are you sure? I thought the stop after Fifth Avenue was still within the same area. \nA: No, Fifth Avenue was the stop before this one. You should have gotten off there. \nB: I should have? So, does that mean I need to go back a stop?", + "cleaned_text": "A: What did you say your stop was? \nB: Fifth Avenue. \nA:Oh, then you should have gotten off at the last stop because the train doesn't actually go any further in this direction and now you'll have to take the return trip back to Fifth Avenue.\nB: Wait, are you sure? I thought the stop after Fifth Avenue was still within the same area. \nA: No, Fifth Avenue was the stop before this one. You should have gotten off there. \nB: I should have? So, does that mean I need to go back a stop?", + "total_duration": 22.054285714285715, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What did you say your stop was?", + "original_text": "What did you say your stop was?", + "start_time": 0, + "end_time": 1.9156462585034013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fifth Avenue.", + "original_text": "Fifth Avenue.", + "start_time": 2.2613902989423686, + "end_time": 3.1901884848834117, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/temp/line_1_B.wav", + "silence_duration": 0.3457440404389673, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, then you should have", + "original_text": "Oh, then you should have [interrupt] gotten off at the last stop because the train doesn't actually go any further in this direction and now you'll have to take the return trip back to Fifth Avenue.", + "start_time": 3.582936645853659, + "end_time": 13.393367484855926, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/temp/line_2_A.wav", + "silence_duration": 0.3927481609702474, + "is_interrupted": true, + "text_after_interrupt": "gotten off at the last stop because the train doesn't actually go any further in this direction and now you'll have to take the return trip back to Fifth Avenue." + }, + { + "speaker": "B", + "text": "Wait, are you sure? I thought the stop after Fifth Avenue was still within the same area.", + "original_text": "Wait, are you sure? I thought the stop after Fifth Avenue was still within the same area.", + "start_time": 5.38248313111443, + "end_time": 10.072913970116698, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/temp/line_3_B.wav", + "silence_duration": 0.49017571221545353, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "No, Fifth Avenue was the stop before this one. You should have gotten off there.", + "original_text": "No, Fifth Avenue was the stop before this one. You should have gotten off there.", + "start_time": 13.756466799234682, + "end_time": 18.330797864994317, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/temp/line_4_A.wav", + "silence_duration": 0.3630993143787554, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I should have? So, does that mean I need to go back a stop?", + "original_text": "I should have? So, does that mean I need to go back a stop?", + "start_time": 18.884777785603138, + "end_time": 22.054301595126947, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--478/temp/line_5_B.wav", + "silence_duration": 0.5539799206088218, + "is_interrupted": false + } + ] + }, + "DialogSum--val--479": { + "original_text": "A: You two are so health-conscious! \nB: Well, we try! Here, I just made some carrot juice. Would you like a [interrupt] glass? It's really refreshing and packed with vitamins A, C, and K, plus it has antioxidants that help with skin health and immune system support. \nA: Oh, absolutely! Before you know it, I'll be heading off to the mountains to stand on my head! \nB: You don't have to go to the mountains! I stand on my head during my yoga routine every morning! But wait, I didn't finish offering you the carrot juice, would you still like to try some? It might give you the energy boost you need for that headstand! \nA: Yes, please! Thanks for the carrot juice, Mrs. Schmidt. I've got to run to class! \nB: Have a good day at school! See you tonight!", + "cleaned_text": "A: You two are so health-conscious! \nB:Well, we try! Here, I just made some carrot juice. Would you like a glass? It's really refreshing and packed with vitamins A, C, and K, plus it has antioxidants that help with skin health and immune system support.\nA: Oh, absolutely! Before you know it, I'll be heading off to the mountains to stand on my head! \nB: You don't have to go to the mountains! I stand on my head during my yoga routine every morning! But wait, I didn't finish offering you the carrot juice, would you still like to try some? It might give you the energy boost you need for that headstand! \nA: Yes, please! Thanks for the carrot juice, Mrs. Schmidt. I've got to run to class! \nB: Have a good day at school! See you tonight!", + "total_duration": 34.33043083900227, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You two are so health-conscious!", + "original_text": "You two are so health-conscious!", + "start_time": 0, + "end_time": 2.0317460317460316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, we try! Here, I just made some carrot juice. Would you like a", + "original_text": "Well, we try! Here, I just made some carrot juice. Would you like a [interrupt] glass? It's really refreshing and packed with vitamins A, C, and K, plus it has antioxidants that help with skin health and immune system support.", + "start_time": 2.390092280212159, + "end_time": 13.663380262071568, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/temp/line_1_B.wav", + "silence_duration": 0.3583462484661271, + "is_interrupted": true, + "text_after_interrupt": "glass? It's really refreshing and packed with vitamins A, C, and K, plus it has antioxidants that help with skin health and immune system support." + }, + { + "speaker": "A", + "text": "Oh, absolutely! Before you know it, I'll be heading off to the mountains to stand on my head!", + "original_text": "Oh, absolutely! Before you know it, I'll be heading off to the mountains to stand on my head!", + "start_time": 6.685783890189484, + "end_time": 11.515534457082907, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/temp/line_2_A.wav", + "silence_duration": 0.33484422170434086, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "You don't have to go to the mountains! I stand on my head during my yoga routine every morning! But wait, I didn't finish offering you the carrot juice, would you still like to try some? It might give you the energy boost you need for that headstand!", + "original_text": "You don't have to go to the mountains! I stand on my head during my yoga routine every morning! But wait, I didn't finish offering you the carrot juice, would you still like to try some? It might give you the energy boost you need for that headstand!", + "start_time": 14.16701078875022, + "end_time": 25.8582579542831, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/temp/line_3_B.wav", + "silence_duration": 0.5036305266786514, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Yes, please! Thanks for the carrot juice, Mrs. Schmidt. I've got to run to class!", + "original_text": "Yes, please! Thanks for the carrot juice, Mrs. Schmidt. I've got to run to class!", + "start_time": 26.355203454537776, + "end_time": 31.475203454537777, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/temp/line_4_A.wav", + "silence_duration": 0.49694550025467366, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Have a good day at school! See you tonight!", + "original_text": "Have a good day at school! See you tonight!", + "start_time": 32.03166163367386, + "end_time": 34.330437143877944, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--479/temp/line_5_B.wav", + "silence_duration": 0.5564581791360876, + "is_interrupted": false + } + ] + }, + "DialogSum--val--480": { + "original_text": "A: Did your meal meet with your approval? \nB: Our meal was absolutely perfect! \nA: How about a dessert to top off that wonderful meal? \nB: Dessert sounds perfect, but I would like to split something with my [interrupt] partner. We're both trying to watch our calories a bit, so sharing would be ideal, and we'd love to hear your recommendations for the best sharing-sized desserts on the menu. \nA: Sorry to jump in, but before you decide, I wanted to mention that tonight's dessert list includes a few special items—chocolate mousse cake, homemade fresh strawberry shortcake, and a spicy rum apple crisp. \nB: Oh, those sound amazing! I think that the apple crisp would be wonderful. \nA: One dessert will serve two, so would you like to split a second one? \nB: We would also like a piece of chocolate mousse cake. Could you bring us four dessert forks, please? \nA: How about some coffee and perhaps a digestif to go with your desserts? \nB: Actually, we're all tea drinkers. Please bring us four teas. \nA: Got it. I'll prepare your desserts and have someone bring you your drinks right away. \nB: The hot drinks first would be great. Thanks!", + "cleaned_text": "A: Did your meal meet with your approval? \nB: Our meal was absolutely perfect! \nA: How about a dessert to top off that wonderful meal? \nB:Dessert sounds perfect, but I would like to split something with my partner. We're both trying to watch our calories a bit, so sharing would be ideal, and we'd love to hear your recommendations for the best sharing-sized desserts on the menu.\nA: Sorry to jump in, but before you decide, I wanted to mention that tonight's dessert list includes a few special items—chocolate mousse cake, homemade fresh strawberry shortcake, and a spicy rum apple crisp. \nB: Oh, those sound amazing! I think that the apple crisp would be wonderful. \nA: One dessert will serve two, so would you like to split a second one? \nB: We would also like a piece of chocolate mousse cake. Could you bring us four dessert forks, please? \nA: How about some coffee and perhaps a digestif to go with your desserts? \nB: Actually, we're all tea drinkers. Please bring us four teas. \nA: Got it. I'll prepare your desserts and have someone bring you your drinks right away. \nB: The hot drinks first would be great. Thanks!", + "total_duration": 55.26285714285714, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Did your meal meet with your approval?", + "original_text": "Did your meal meet with your approval?", + "start_time": 0, + "end_time": 1.9388662131519274, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Our meal was absolutely perfect!", + "original_text": "Our meal was absolutely perfect!", + "start_time": 2.239609135528154, + "end_time": 3.969495756843347, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_1_B.wav", + "silence_duration": 0.30074292237622696, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about a dessert to top off that wonderful meal?", + "original_text": "How about a dessert to top off that wonderful meal?", + "start_time": 4.461090707820608, + "end_time": 7.201045356346685, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_2_A.wav", + "silence_duration": 0.491594950977261, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Dessert sounds perfect, but I would like to split something with my", + "original_text": "Dessert sounds perfect, but I would like to split something with my [interrupt] partner. We're both trying to watch our calories a bit, so sharing would be ideal, and we'd love to hear your recommendations for the best sharing-sized desserts on the menu.", + "start_time": 7.523312409337443, + "end_time": 18.959140073736535, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_3_B.wav", + "silence_duration": 0.3222670529907575, + "is_interrupted": true, + "text_after_interrupt": "partner. We're both trying to watch our calories a bit, so sharing would be ideal, and we'd love to hear your recommendations for the best sharing-sized desserts on the menu." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but before you decide, I wanted to mention that tonight's dessert list includes a few special items—chocolate mousse cake, homemade fresh strawberry shortcake, and a spicy rum apple crisp.", + "original_text": "Sorry to jump in, but before you decide, I wanted to mention that tonight's dessert list includes a few special items—chocolate mousse cake, homemade fresh strawberry shortcake, and a spicy rum apple crisp.", + "start_time": 11.134015357183248, + "end_time": 24.113970005709326, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_4_A.wav", + "silence_duration": 0.4519786597625066, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, those sound amazing! I think that the apple crisp would be wonderful.", + "original_text": "Oh, those sound amazing! I think that the apple crisp would be wonderful.", + "start_time": 24.636939201260713, + "end_time": 28.932630811238038, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_5_B.wav", + "silence_duration": 0.5229691955513873, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "One dessert will serve two, so would you like to split a second one?", + "original_text": "One dessert will serve two, so would you like to split a second one?", + "start_time": 29.39697867758939, + "end_time": 33.646230378269664, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_6_A.wav", + "silence_duration": 0.46434786635135294, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "We would also like a piece of chocolate mousse cake. Could you bring us four dessert forks, please?", + "original_text": "We would also like a piece of chocolate mousse cake. Could you bring us four dessert forks, please?", + "start_time": 33.996994919059844, + "end_time": 38.32751646100996, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_7_B.wav", + "silence_duration": 0.3507645407901837, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How about some coffee and perhaps a digestif to go with your desserts?", + "original_text": "How about some coffee and perhaps a digestif to go with your desserts?", + "start_time": 38.720741510981874, + "end_time": 43.19058278082314, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_8_A.wav", + "silence_duration": 0.39322504997191693, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Actually, we're all tea drinkers. Please bring us four teas.", + "original_text": "Actually, we're all tea drinkers. Please bring us four teas.", + "start_time": 43.49754491122872, + "end_time": 47.015368040480425, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_9_B.wav", + "silence_duration": 0.3069621304055787, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. I'll prepare your desserts and have someone bring you your drinks right away.", + "original_text": "Got it. I'll prepare your desserts and have someone bring you your drinks right away.", + "start_time": 47.60338376954628, + "end_time": 52.1196649486846, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_10_A.wav", + "silence_duration": 0.5880157290658508, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The hot drinks first would be great. Thanks!", + "original_text": "The hot drinks first would be great. Thanks!", + "start_time": 52.46486920704763, + "end_time": 55.26287374219502, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--480/temp/line_11_B.wav", + "silence_duration": 0.34520425836302726, + "is_interrupted": false + } + ] + }, + "DialogSum--val--482": { + "original_text": "A: Okay well listen, here is my business card with my mobile number. If any other questions spring to mind don't hesitate to contact me. Of course you can also call Miss Childs [interrupt] if you need any immediate assistance or have any follow-up questions regarding the position or the hiring process, as she's our HR coordinator and handles all candidate communications.\nB: Oh, I just realized, I wanted to ask—when can I expect to hear from you?\nA: We are finishing the shortlist interviews tomorrow, so we will certainly have a decision made by early next week. Miss Childs will call you to discuss more on Monday or Tuesday. How does that sound?\nB: That sounds perfect. Thank you very much for taking the time to speak to me Mr. Parsons. Also, you were about to say something about Miss Childs earlier?\nA: Ah yes, I was just mentioning that you can also call Miss Childs if you have any questions.\nB: Got it. The pleasure's all mine, Rebecca.\nA: I hope to hear from you very soon.", + "cleaned_text": "A:Okay well listen, here is my business card with my mobile number. If any other questions spring to mind don't hesitate to contact me. Of course you can also call Miss Childs if you need any immediate assistance or have any follow-up questions regarding the position or the hiring process, as she's our HR coordinator and handles all candidate communications.\nB: Oh, I just realized, I wanted to ask—when can I expect to hear from you?\nA: We are finishing the shortlist interviews tomorrow, so we will certainly have a decision made by early next week. Miss Childs will call you to discuss more on Monday or Tuesday. How does that sound?\nB: That sounds perfect. Thank you very much for taking the time to speak to me Mr. Parsons. Also, you were about to say something about Miss Childs earlier?\nA: Ah yes, I was just mentioning that you can also call Miss Childs if you have any questions.\nB: Got it. The pleasure's all mine, Rebecca.\nA: I hope to hear from you very soon.", + "total_duration": 52.55052154195011, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Okay well listen, here is my business card with my mobile number. If any other questions spring to mind don't hesitate to contact me. Of course you can also call Miss Childs", + "original_text": "Okay well listen, here is my business card with my mobile number. If any other questions spring to mind don't hesitate to contact me. Of course you can also call Miss Childs [interrupt] if you need any immediate assistance or have any follow-up questions regarding the position or the hiring process, as she's our HR coordinator and handles all candidate communications.", + "start_time": 0, + "end_time": 21.037278911564627, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "if you need any immediate assistance or have any follow-up questions regarding the position or the hiring process, as she's our HR coordinator and handles all candidate communications." + }, + { + "speaker": "B", + "text": "Oh, I just realized, I wanted to ask—when can I expect to hear from you?", + "original_text": "Oh, I just realized, I wanted to ask—when can I expect to hear from you?", + "start_time": 10.89015873015873, + "end_time": 14.663401360544217, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/temp/line_1_B.wav", + "silence_duration": 0.37442408647760195, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We are finishing the shortlist interviews tomorrow, so we will certainly have a decision made by early next week. Miss Childs will call you to discuss more on Monday or Tuesday. How does that sound?", + "original_text": "We are finishing the shortlist interviews tomorrow, so we will certainly have a decision made by early next week. Miss Childs will call you to discuss more on Monday or Tuesday. How does that sound?", + "start_time": 21.42505675802718, + "end_time": 33.44138328863942, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/temp/line_2_A.wav", + "silence_duration": 0.38777784646255076, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds perfect. Thank you very much for taking the time to speak to me Mr. Parsons. Also, you were about to say something about Miss Childs earlier?", + "original_text": "That sounds perfect. Thank you very much for taking the time to speak to me Mr. Parsons. Also, you were about to say something about Miss Childs earlier?", + "start_time": 33.931555791873734, + "end_time": 41.57092087123881, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/temp/line_3_B.wav", + "silence_duration": 0.49017250323431105, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Ah yes, I was just mentioning that you can also call Miss Childs if you have any questions.", + "original_text": "Ah yes, I was just mentioning that you can also call Miss Childs if you have any questions.", + "start_time": 42.034145061214886, + "end_time": 47.24702487980899, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/temp/line_4_A.wav", + "silence_duration": 0.4632241899760762, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Got it. The pleasure's all mine, Rebecca.", + "original_text": "Got it. The pleasure's all mine, Rebecca.", + "start_time": 47.829031419868805, + "end_time": 50.00009717950599, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/temp/line_5_B.wav", + "silence_duration": 0.5820065400598148, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I hope to hear from you very soon.", + "original_text": "I hope to hear from you very soon.", + "start_time": 50.60007233167396, + "end_time": 52.550548522150144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--482/temp/line_6_A.wav", + "silence_duration": 0.5999751521679648, + "is_interrupted": false + } + ] + }, + "DialogSum--val--483": { + "original_text": "A: Welcome, young man. No offence, but I haven't seen you here before. \nB: Of course, this is my first time here. My Mom has a membership here. Here is the card. \nA: Okay then. You are the younger customer here [interrupt] but it's great to see young people interested in fitness and taking initiative to improve their health at such an early age. \nB: It's not so wise that you do not explore the children's market. \nA: It's the marketing's fault, I suppose. What do you want to do? \nB: Well, I want to become just like Bruce Lee. What should I do? \nA: That's a long way to go, I'm afraid. First of all, you gotta [interrupt] build a strong foundation with basic exercises and proper nutrition, focusing on developing both your physical strength and mental discipline which were hallmarks of Bruce Lee's training philosophy. \nB: I am still young. And I'm growing every minute. \nA: Sure. Then what about trying the treadmill or the skipping rope. \nB: I love running. Anything else? \nA: Please change your clothes first! \nB: I'm perfect with my clothes. And I do not have anything else with me. By the way, you were saying something about what I need to do first to become like Bruce Lee?", + "cleaned_text": "A: Welcome, young man. No offence, but I haven't seen you here before. \nB: Of course, this is my first time here. My Mom has a membership here. Here is the card. \nA:Okay then. You are the younger customer here but it's great to see young people interested in fitness and taking initiative to improve their health at such an early age.\nB: It's not so wise that you do not explore the children's market. \nA: It's the marketing's fault, I suppose. What do you want to do? \nB: Well, I want to become just like Bruce Lee. What should I do? \nA:That's a long way to go, I'm afraid. First of all, you gotta build a strong foundation with basic exercises and proper nutrition, focusing on developing both your physical strength and mental discipline which were hallmarks of Bruce Lee's training philosophy.\nB: I am still young. And I'm growing every minute. \nA: Sure. Then what about trying the treadmill or the skipping rope. \nB: I love running. Anything else? \nA: Please change your clothes first! \nB: I'm perfect with my clothes. And I do not have anything else with me. By the way, you were saying something about what I need to do first to become like Bruce Lee?", + "total_duration": 62.01596371882086, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Welcome, young man. No offence, but I haven't seen you here before.", + "original_text": "Welcome, young man. No offence, but I haven't seen you here before.", + "start_time": 0, + "end_time": 4.330521541950113, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Of course, this is my first time here. My Mom has a membership here. Here is the card.", + "original_text": "Of course, this is my first time here. My Mom has a membership here. Here is the card.", + "start_time": 4.71805844731017, + "end_time": 9.547809014203594, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_1_B.wav", + "silence_duration": 0.3875369053600566, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Okay then. You are the younger customer here", + "original_text": "Okay then. You are the younger customer here [interrupt] but it's great to see young people interested in fitness and taking initiative to improve their health at such an early age.", + "start_time": 9.903355450394674, + "end_time": 19.8531060172881, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_2_A.wav", + "silence_duration": 0.35554643619108045, + "is_interrupted": true, + "text_after_interrupt": "but it's great to see young people interested in fitness and taking initiative to improve their health at such an early age." + }, + { + "speaker": "B", + "text": "It's not so wise that you do not explore the children's market.", + "original_text": "It's not so wise that you do not explore the children's market.", + "start_time": 12.875509645406012, + "end_time": 15.952153636335717, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_3_B.wav", + "silence_duration": 0.585039872833221, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "It's the marketing's fault, I suppose. What do you want to do?", + "original_text": "It's the marketing's fault, I suppose. What do you want to do?", + "start_time": 20.3949675709455, + "end_time": 24.24948004260083, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_4_A.wav", + "silence_duration": 0.5418615536574029, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I want to become just like Bruce Lee. What should I do?", + "original_text": "Well, I want to become just like Bruce Lee. What should I do?", + "start_time": 24.847491393794147, + "end_time": 28.318874613748797, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_5_B.wav", + "silence_duration": 0.5980113511933163, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "That's a long way to go, I'm afraid. First of all, you gotta", + "original_text": "That's a long way to go, I'm afraid. First of all, you gotta [interrupt] build a strong foundation with basic exercises and proper nutrition, focusing on developing both your physical strength and mental discipline which were hallmarks of Bruce Lee's training philosophy.", + "start_time": 28.859923009644458, + "end_time": 45.438970628692076, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_6_A.wav", + "silence_duration": 0.5410483958956595, + "is_interrupted": true, + "text_after_interrupt": "build a strong foundation with basic exercises and proper nutrition, focusing on developing both your physical strength and mental discipline which were hallmarks of Bruce Lee's training philosophy." + }, + { + "speaker": "B", + "text": "I am still young. And I'm growing every minute.", + "original_text": "I am still young. And I'm growing every minute.", + "start_time": 36.17766394175628, + "end_time": 38.47643945196036, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_7_B.wav", + "silence_duration": 0.5867679674392132, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Sure. Then what about trying the treadmill or the skipping rope.", + "original_text": "Sure. Then what about trying the treadmill or the skipping rope.", + "start_time": 45.78293453307616, + "end_time": 49.55617716346165, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_8_A.wav", + "silence_duration": 0.3439639043840848, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I love running. Anything else?", + "original_text": "I love running. Anything else?", + "start_time": 50.03683232783219, + "end_time": 51.56934933463491, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_9_B.wav", + "silence_duration": 0.48065516437053935, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Please change your clothes first!", + "original_text": "Please change your clothes first!", + "start_time": 51.97742578725696, + "end_time": 53.75375231786921, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_10_A.wav", + "silence_duration": 0.4080764526220545, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm perfect with my clothes. And I do not have anything else with me. By the way, you were saying something about what I need to do first to become like Bruce Lee?", + "original_text": "I'm perfect with my clothes. And I do not have anything else with me. By the way, you were saying something about what I need to do first to become like Bruce Lee?", + "start_time": 54.225711052366854, + "end_time": 62.01600583694735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--483/temp/line_11_B.wav", + "silence_duration": 0.47195873449764825, + "is_interrupted": false + } + ] + }, + "DialogSum--val--484": { + "original_text": "A: Hello, this is Susan speaking. Is Mr. Brown in, please? \nB: Yes, speaking. \nA: Hi, Mr. Brown. Your son Ted missed the school trip this morning. Do you know why? \nB: Yes. He got up a bit late this morning. He missed the school bus. \nA: Why did he get up late? Didn't he have a [interrupt] good night's sleep last night and follow his usual bedtime routine properly? \nB: Oh, about that, the clock didn't work this morning. I worked overtime till midnight at home last night, so I got up late, too. It was already nine o'clock when I woke him up. \nA: I see. But why did he wake up at such a late hour? Did he stay up late last night? \nB: Oh, right, I didn't mention—he didn't go to bed until 11:00 pm. \nA: Why didn't you ask him to go to bed early? \nB: He's a 'night owl'. He can't fall asleep before 11:00 pm. \nA: You should really change his sleeping habits. Otherwise, it will happen again. \nB: I will. Thank you for calling, Susan.", + "cleaned_text": "A: Hello, this is Susan speaking. Is Mr. Brown in, please? \nB: Yes, speaking. \nA: Hi, Mr. Brown. Your son Ted missed the school trip this morning. Do you know why? \nB: Yes. He got up a bit late this morning. He missed the school bus. \nA:Why did he get up late? Didn't he have a good night's sleep last night and follow his usual bedtime routine properly?\nB: Oh, about that, the clock didn't work this morning. I worked overtime till midnight at home last night, so I got up late, too. It was already nine o'clock when I woke him up. \nA: I see. But why did he wake up at such a late hour? Did he stay up late last night? \nB: Oh, right, I didn't mention—he didn't go to bed until 11:00 pm. \nA: Why didn't you ask him to go to bed early? \nB: He's a 'night owl'. He can't fall asleep before 11:00 pm. \nA: You should really change his sleeping habits. Otherwise, it will happen again. \nB: I will. Thank you for calling, Susan.", + "total_duration": 51.753696145124714, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, this is Susan speaking. Is Mr. Brown in, please?", + "original_text": "Hello, this is Susan speaking. Is Mr. Brown in, please?", + "start_time": 0, + "end_time": 4.31891156462585, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, speaking.", + "original_text": "Yes, speaking.", + "start_time": 4.7955508493546946, + "end_time": 5.794008899241316, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_1_B.wav", + "silence_duration": 0.4766392847288443, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Hi, Mr. Brown. Your son Ted missed the school trip this morning. Do you know why?", + "original_text": "Hi, Mr. Brown. Your son Ted missed the school trip this morning. Do you know why?", + "start_time": 6.268685865395341, + "end_time": 12.027234618229809, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_2_A.wav", + "silence_duration": 0.4746769661540251, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes. He got up a bit late this morning. He missed the school bus.", + "original_text": "Yes. He got up a bit late this morning. He missed the school bus.", + "start_time": 12.53471513061622, + "end_time": 15.588139166897399, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_3_B.wav", + "silence_duration": 0.5074805123864125, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why did he get up late? Didn't he have a", + "original_text": "Why did he get up late? Didn't he have a [interrupt] good night's sleep last night and follow his usual bedtime routine properly?", + "start_time": 16.111928628418514, + "end_time": 22.78766558986976, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_4_A.wav", + "silence_duration": 0.5237894615211164, + "is_interrupted": true, + "text_after_interrupt": "good night's sleep last night and follow his usual bedtime routine properly?" + }, + { + "speaker": "B", + "text": "Oh, about that, the clock didn't work this morning. I worked overtime till midnight at home last night, so I got up late, too. It was already nine o'clock when I woke him up.", + "original_text": "Oh, about that, the clock didn't work this morning. I worked overtime till midnight at home last night, so I got up late, too. It was already nine o'clock when I woke him up.", + "start_time": 18.88671320891738, + "end_time": 27.605806179438922, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_5_B.wav", + "silence_duration": 0.33010000879486, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I see. But why did he wake up at such a late hour? Did he stay up late last night?", + "original_text": "I see. But why did he wake up at such a late hour? Did he stay up late last night?", + "start_time": 27.94130790873697, + "end_time": 34.03654600397506, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_6_A.wav", + "silence_duration": 0.3355017292980488, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, right, I didn't mention—he didn't go to bed until 11:00 pm.", + "original_text": "Oh, right, I didn't mention—he didn't go to bed until 11:00 pm.", + "start_time": 34.58461872420235, + "end_time": 38.13727178542684, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_7_B.wav", + "silence_duration": 0.5480727202272859, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Why didn't you ask him to go to bed early?", + "original_text": "Why didn't you ask him to go to bed early?", + "start_time": 38.52685717210479, + "end_time": 40.82563268230887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_8_A.wav", + "silence_duration": 0.3895853866779512, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "He's a 'night owl'. He can't fall asleep before 11:00 pm.", + "original_text": "He's a 'night owl'. He can't fall asleep before 11:00 pm.", + "start_time": 41.16533848056216, + "end_time": 44.63672170051681, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_9_B.wav", + "silence_duration": 0.33970579825329367, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "You should really change his sleeping habits. Otherwise, it will happen again.", + "original_text": "You should really change his sleeping habits. Otherwise, it will happen again.", + "start_time": 44.95138246794343, + "end_time": 49.502493579054544, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_10_A.wav", + "silence_duration": 0.31466076742662125, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I will. Thank you for calling, Susan.", + "original_text": "I will. Thank you for calling, Susan.", + "start_time": 49.97741032246438, + "end_time": 51.753736853076624, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--484/temp/line_11_B.wav", + "silence_duration": 0.4749167434098326, + "is_interrupted": false + } + ] + }, + "DialogSum--val--486": { + "original_text": "A: You can just skip that. I'll put in the room number for you [interrupt] after I confirm your check-in details and ensure all the necessary paperwork is properly completed for your stay with us.\nB: Oh, I just remembered—do you have any recommendations for nearby restaurants? I might want to grab something to eat later.\nA: Absolutely, I can suggest a few great places nearby. But let me finish filling in the room number for you first. So, as I was saying, you can skip that part, and I'll take care of it.\nB: Here you are. I think I've filled in everything correctly.\nA: Let me see...name, address, nationality, forwarding address, passport number, place of issue, signature and date of departure. Oh, here, sir. You forgot to put in the date of your departure. Here let me fill it in for you. You are leaving on...?\nB: October 24th.", + "cleaned_text": "A:You can just skip that. I'll put in the room number for you after I confirm your check-in details and ensure all the necessary paperwork is properly completed for your stay with us.\nB: Oh, I just remembered—do you have any recommendations for nearby restaurants? I might want to grab something to eat later.\nA: Absolutely, I can suggest a few great places nearby. But let me finish filling in the room number for you first. So, as I was saying, you can skip that part, and I'll take care of it.\nB: Here you are. I think I've filled in everything correctly.\nA: Let me see...name, address, nationality, forwarding address, passport number, place of issue, signature and date of departure. Oh, here, sir. You forgot to put in the date of your departure. Here let me fill it in for you. You are leaving on...?\nB: October 24th.", + "total_duration": 43.40875283446712, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You can just skip that. I'll put in the room number for you", + "original_text": "You can just skip that. I'll put in the room number for you [interrupt] after I confirm your check-in details and ensure all the necessary paperwork is properly completed for your stay with us.", + "start_time": 0, + "end_time": 9.752380952380953, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "after I confirm your check-in details and ensure all the necessary paperwork is properly completed for your stay with us." + }, + { + "speaker": "B", + "text": "Oh, I just remembered—do you have any recommendations for nearby restaurants? I might want to grab something to eat later.", + "original_text": "Oh, I just remembered—do you have any recommendations for nearby restaurants? I might want to grab something to eat later.", + "start_time": 3.030204081632653, + "end_time": 9.044172335600907, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/temp/line_1_B.wav", + "silence_duration": 0.30147415892979523, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Absolutely, I can suggest a few great places nearby. But let me finish filling in the room number for you first. So, as I was saying, you can skip that part, and I'll take care of it.", + "original_text": "Absolutely, I can suggest a few great places nearby. But let me finish filling in the room number for you first. So, as I was saying, you can skip that part, and I'll take care of it.", + "start_time": 10.347296606936862, + "end_time": 21.45804490625659, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/temp/line_2_A.wav", + "silence_duration": 0.5949156545559076, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Here you are. I think I've filled in everything correctly.", + "original_text": "Here you are. I think I've filled in everything correctly.", + "start_time": 21.867359898072166, + "end_time": 24.816294138434976, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/temp/line_3_B.wav", + "silence_duration": 0.40931499181557607, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Let me see...name, address, nationality, forwarding address, passport number, place of issue, signature and date of departure. Oh, here, sir. You forgot to put in the date of your departure. Here let me fill it in for you. You are leaving on...?", + "original_text": "Let me see...name, address, nationality, forwarding address, passport number, place of issue, signature and date of departure. Oh, here, sir. You forgot to put in the date of your departure. Here let me fill it in for you. You are leaving on...?", + "start_time": 25.13387034259135, + "end_time": 41.387838596559604, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/temp/line_4_A.wav", + "silence_duration": 0.3175762041563746, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "October 24th.", + "original_text": "October 24th.", + "start_time": 41.8762733175437, + "end_time": 43.40879032434642, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--486/temp/line_5_B.wav", + "silence_duration": 0.48843472098409363, + "is_interrupted": false + } + ] + }, + "DialogSum--val--487": { + "original_text": "A: Pardon me. Are you familiar with this neighborhood? \nB: Well, I should be. I've lived here all my life. What are you looking [interrupt] for specifically? Maybe I can point you in the right direction or even walk you there if it's not too far. \nA: Sorry to jump in, but I'm actually looking for the Post Office. \nB: The nearest one is about a mile away. \nA: Oh. Well, I guess I could send a letter. \nB: There's a mailbox up the street. Have you already got a stamp on that [interrupt] letter or do you need to purchase one? I know the post office sells them but there's also a convenience store nearby that might have stamps. \nA: Yes, but I need to register it. Could you tell me how to walk to the post office from here? \nB: Go up this street until you get to the main street. Then turn right and walk about four blocks or so. \nA: Thank you for your help. \nB: The post office entrance is inside a building complex with some other offices. \nA: Oh, you mentioned the mailbox earlier—where exactly is it, just in case I change my mind? \nB: It's just up the street, on the right side. But if you still want to go to the post office, there's an American flag out front and a sign: The U.S. Post Office. \nA: Got it. Thanks again!", + "cleaned_text": "A: Pardon me. Are you familiar with this neighborhood? \nB:Well, I should be. I've lived here all my life. What are you looking for specifically? Maybe I can point you in the right direction or even walk you there if it's not too far.\nA: Sorry to jump in, but I'm actually looking for the Post Office. \nB: The nearest one is about a mile away. \nA: Oh. Well, I guess I could send a letter. \nB:There's a mailbox up the street. Have you already got a stamp on that letter or do you need to purchase one? I know the post office sells them but there's also a convenience store nearby that might have stamps.\nA: Yes, but I need to register it. Could you tell me how to walk to the post office from here? \nB: Go up this street until you get to the main street. Then turn right and walk about four blocks or so. \nA: Thank you for your help. \nB: The post office entrance is inside a building complex with some other offices. \nA: Oh, you mentioned the mailbox earlier—where exactly is it, just in case I change my mind? \nB: It's just up the street, on the right side. But if you still want to go to the post office, there's an American flag out front and a sign: The U.S. Post Office. \nA: Got it. Thanks again!", + "total_duration": 59.07065759637188, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Pardon me. Are you familiar with this neighborhood?", + "original_text": "Pardon me. Are you familiar with this neighborhood?", + "start_time": 0, + "end_time": 2.4961451247165534, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Well, I should be. I've lived here all my life. What are you looking", + "original_text": "Well, I should be. I've lived here all my life. What are you looking [interrupt] for specifically? Maybe I can point you in the right direction or even walk you there if it's not too far.", + "start_time": 2.9463157523238572, + "end_time": 12.060147951870341, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_1_B.wav", + "silence_duration": 0.45017062760730386, + "is_interrupted": true, + "text_after_interrupt": "for specifically? Maybe I can point you in the right direction or even walk you there if it's not too far." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I'm actually looking for the Post Office.", + "original_text": "Sorry to jump in, but I'm actually looking for the Post Office.", + "start_time": 6.220329357766034, + "end_time": 10.040011897448574, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_2_A.wav", + "silence_duration": 0.3256448457378757, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The nearest one is about a mile away.", + "original_text": "The nearest one is about a mile away.", + "start_time": 12.650825372473996, + "end_time": 14.589691585625923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_3_B.wav", + "silence_duration": 0.5906774206036546, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh. Well, I guess I could send a letter.", + "original_text": "Oh. Well, I guess I could send a letter.", + "start_time": 15.034373252727386, + "end_time": 17.34475874025573, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_4_A.wav", + "silence_duration": 0.4446816671014633, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "There's a mailbox up the street. Have you already got a stamp on that", + "original_text": "There's a mailbox up the street. Have you already got a stamp on that [interrupt] letter or do you need to purchase one? I know the post office sells them but there's also a convenience store nearby that might have stamps.", + "start_time": 17.818220138494375, + "end_time": 28.56905914076195, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_5_B.wav", + "silence_duration": 0.47346139823864447, + "is_interrupted": true, + "text_after_interrupt": "letter or do you need to purchase one? I know the post office sells them but there's also a convenience store nearby that might have stamps." + }, + { + "speaker": "A", + "text": "Yes, but I need to register it. Could you tell me how to walk to the post office from here?", + "original_text": "Yes, but I need to register it. Could you tell me how to walk to the post office from here?", + "start_time": 25.805343057396033, + "end_time": 30.98339294401735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_6_A.wav", + "silence_duration": 0.3865370872246584, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Go up this street until you get to the main street. Then turn right and walk about four blocks or so.", + "original_text": "Go up this street until you get to the main street. Then turn right and walk about four blocks or so.", + "start_time": 31.28755311513258, + "end_time": 36.47721297907816, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_7_B.wav", + "silence_duration": 0.30416017111523347, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Thank you for your help.", + "original_text": "Thank you for your help.", + "start_time": 36.95676807730588, + "end_time": 38.187425673677765, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_8_A.wav", + "silence_duration": 0.4795550982277187, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The post office entrance is inside a building complex with some other offices.", + "original_text": "The post office entrance is inside a building complex with some other offices.", + "start_time": 38.527851937979335, + "end_time": 42.417194341607455, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_9_B.wav", + "silence_duration": 0.34042626430156936, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, you mentioned the mailbox earlier—where exactly is it, just in case I change my mind?", + "original_text": "Oh, you mentioned the mailbox earlier—where exactly is it, just in case I change my mind?", + "start_time": 42.88223763553414, + "end_time": 48.4550267511804, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_10_A.wav", + "silence_duration": 0.4650432939266838, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's just up the street, on the right side. But if you still want to go to the post office, there's an American flag out front and a sign: The U.S. Post Office.", + "original_text": "It's just up the street, on the right side. But if you still want to go to the post office, there's an American flag out front and a sign: The U.S. Post Office.", + "start_time": 48.90248282020074, + "end_time": 57.31971638029144, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_11_B.wav", + "silence_duration": 0.44745606902033774, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. Thanks again!", + "original_text": "Got it. Thanks again!", + "start_time": 57.71231395456912, + "end_time": 59.070681301507896, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--487/temp/line_12_A.wav", + "silence_duration": 0.3925975742776793, + "is_interrupted": false + } + ] + }, + "DialogSum--val--490": { + "original_text": "A: What's going on between you and Charlie? Did you have a fight or [interrupt] did something happen that made things worse recently, like maybe he borrowed something without asking or left a huge mess in the kitchen again? \nB: No, but I can't stand him anymore. He is the worst roommate I've ever had. He never cleans up after himself and he is always listening to loud music when I try to get some sleep. \nA: Wait, he's always listening to loud music? That must be really frustrating. Have you tried talking to him about this? \nB: I've tried, but it didn't work. Maybe you can talk to him. After all, you are his good friend. By the way, I didn't finish explaining—it's not just the music, it's also the fact that he never cleans up after himself, and it's really starting to affect my mood every day.", + "cleaned_text": "A:What's going on between you and Charlie? Did you have a fight or did something happen that made things worse recently, like maybe he borrowed something without asking or left a huge mess in the kitchen again?\nB: No, but I can't stand him anymore. He is the worst roommate I've ever had. He never cleans up after himself and he is always listening to loud music when I try to get some sleep. \nA: Wait, he's always listening to loud music? That must be really frustrating. Have you tried talking to him about this? \nB: I've tried, but it didn't work. Maybe you can talk to him. After all, you are his good friend. By the way, I didn't finish explaining—it's not just the music, it's also the fact that he never cleans up after himself, and it's really starting to affect my mood every day.", + "total_duration": 35.022222222222226, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--490/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--490/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--490/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What's going on between you and Charlie? Did you have a fight or", + "original_text": "What's going on between you and Charlie? Did you have a fight or [interrupt] did something happen that made things worse recently, like maybe he borrowed something without asking or left a huge mess in the kitchen again?", + "start_time": 0, + "end_time": 11.853786848072563, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--490/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "did something happen that made things worse recently, like maybe he borrowed something without asking or left a huge mess in the kitchen again?" + }, + { + "speaker": "B", + "text": "No, but I can't stand him anymore. He is the worst roommate I've ever had. He never cleans up after himself and he is always listening to loud music when I try to get some sleep.", + "original_text": "No, but I can't stand him anymore. He is the worst roommate I've ever had. He never cleans up after himself and he is always listening to loud music when I try to get some sleep.", + "start_time": 4.493061224489796, + "end_time": 13.084444444444443, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--490/temp/line_1_B.wav", + "silence_duration": 0.35009783171474607, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wait, he's always listening to loud music? That must be really frustrating. Have you tried talking to him about this?", + "original_text": "Wait, he's always listening to loud music? That must be really frustrating. Have you tried talking to him about this?", + "start_time": 13.447687185143748, + "end_time": 20.738752944780934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--490/temp/line_2_A.wav", + "silence_duration": 0.36324274069930484, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I've tried, but it didn't work. Maybe you can talk to him. After all, you are his good friend. By the way, I didn't finish explaining—it's not just the music, it's also the fact that he never cleans up after himself, and it's really starting to affect my mood every day.", + "original_text": "I've tried, but it didn't work. Maybe you can talk to him. After all, you are his good friend. By the way, I didn't finish explaining—it's not just the music, it's also the fact that he never cleans up after himself, and it's really starting to affect my mood every day.", + "start_time": 21.264443548989547, + "end_time": 35.02226667824125, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--490/temp/line_3_B.wav", + "silence_duration": 0.5256906042086146, + "is_interrupted": false + } + ] + }, + "DialogSum--val--491": { + "original_text": "A: Tom, I married Julia last month. Have you already [interrupt] told anyone else about it? We wanted to keep it a small, private ceremony with just our closest family and friends present, but I'm worried the news might have spread further than intended. \nB: Wait, you got married? That's huge news! How did I not know about this? \nA: Indeed, we got married too soon. \nB: Congratulations. But have you heard the proverb that if one gets married too hurriedly one may [interrupt] regret it later when the initial excitement fades and the realities of daily married life set in? I'm not saying that's the case for you, but it's something people say. \nA: I know what you're getting at, but I truly believe that marriage comes by destiny. I knew I would marry Julia when I met her for the first time. \nB: How's your married life? \nA: We're happy together now. \nB: I have to say you're a well-matched couple. But you didn't finish earlier—what were you going to say about getting married too hurriedly?", + "cleaned_text": "A:Tom, I married Julia last month. Have you already told anyone else about it? We wanted to keep it a small, private ceremony with just our closest family and friends present, but I'm worried the news might have spread further than intended.\nB: Wait, you got married? That's huge news! How did I not know about this? \nA: Indeed, we got married too soon. \nB:Congratulations. But have you heard the proverb that if one gets married too hurriedly one may regret it later when the initial excitement fades and the realities of daily married life set in? I'm not saying that's the case for you, but it's something people say.\nA: I know what you're getting at, but I truly believe that marriage comes by destiny. I knew I would marry Julia when I met her for the first time. \nB: How's your married life? \nA: We're happy together now. \nB: I have to say you're a well-matched couple. But you didn't finish earlier—what were you going to say about getting married too hurriedly?", + "total_duration": 45.75274376417234, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Tom, I married Julia last month. Have you already", + "original_text": "Tom, I married Julia last month. Have you already [interrupt] told anyone else about it? We wanted to keep it a small, private ceremony with just our closest family and friends present, but I'm worried the news might have spread further than intended.", + "start_time": 0, + "end_time": 14.315102040816326, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "told anyone else about it? We wanted to keep it a small, private ceremony with just our closest family and friends present, but I'm worried the news might have spread further than intended." + }, + { + "speaker": "B", + "text": "Wait, you got married? That's huge news! How did I not know about this?", + "original_text": "Wait, you got married? That's huge news! How did I not know about this?", + "start_time": 3.575873015873016, + "end_time": 8.034104308390022, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_1_B.wav", + "silence_duration": 0.47111936527154286, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Indeed, we got married too soon.", + "original_text": "Indeed, we got married too soon.", + "start_time": 14.741360770411847, + "end_time": 16.90081655272477, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_2_A.wav", + "silence_duration": 0.42625872959552, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Congratulations. But have you heard the proverb that if one gets married too hurriedly one may", + "original_text": "Congratulations. But have you heard the proverb that if one gets married too hurriedly one may [interrupt] regret it later when the initial excitement fades and the realities of daily married life set in? I'm not saying that's the case for you, but it's something people say.", + "start_time": 17.493507912673632, + "end_time": 29.98584351358066, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_3_B.wav", + "silence_duration": 0.5926913599488615, + "is_interrupted": true, + "text_after_interrupt": "regret it later when the initial excitement fades and the realities of daily married life set in? I'm not saying that's the case for you, but it's something people say." + }, + { + "speaker": "A", + "text": "I know what you're getting at, but I truly believe that marriage comes by destiny. I knew I would marry Julia when I met her for the first time.", + "original_text": "I know what you're getting at, but I truly believe that marriage comes by destiny. I knew I would marry Julia when I met her for the first time.", + "start_time": 27.23336488306424, + "end_time": 35.464838805966735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_4_A.wav", + "silence_duration": 0.40768807420834613, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "How's your married life?", + "original_text": "How's your married life?", + "start_time": 36.05444126228077, + "end_time": 37.1457791307615, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_5_B.wav", + "silence_duration": 0.5896024563140343, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "We're happy together now.", + "original_text": "We're happy together now.", + "start_time": 37.452148779379975, + "end_time": 39.06593562745254, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_6_A.wav", + "silence_duration": 0.3063696486184793, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I have to say you're a well-matched couple. But you didn't finish earlier—what were you going to say about getting married too hurriedly?", + "original_text": "I have to say you're a well-matched couple. But you didn't finish earlier—what were you going to say about getting married too hurriedly?", + "start_time": 39.62270140133835, + "end_time": 45.75276942854923, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--491/temp/line_7_B.wav", + "silence_duration": 0.5567657738858065, + "is_interrupted": false + } + ] + }, + "DialogSum--val--492": { + "original_text": "A: It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through a remote control. It's also located near the sea, so he can park his boats next to his house. It's absolutely [interrupt] stunning, with every detail meticulously designed to showcase luxury and technology, from the automated climate control systems to the voice-activated lighting that adjusts based on the time of day and your personal preferences.\nB: Sorry to jump in, but you mentioned the rooms are hooked up to computers. Do you know what kind of technology he uses? Like, is it something custom-made or available to the public?\nA: I'm not entirely sure, but I think it's a mix of custom-made systems and advanced smart home technology that's not widely available yet. But back to what I was saying, the house is absolutely amazing!\nB: Would you want to live there?\nA: I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens, and probably an au pair or two to take care of the children. It's just too big of a place to [interrupt] maintain without a full-time staff, and I prefer a simpler lifestyle with more manageable spaces that don't require constant upkeep and supervision.\nB: So, what would your dream home be like then? Something smaller, I assume?", + "cleaned_text": "A:It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through a remote control. It's also located near the sea, so he can park his boats next to his house. It's absolutely stunning, with every detail meticulously designed to showcase luxury and technology, from the automated climate control systems to the voice-activated lighting that adjusts based on the time of day and your personal preferences.\nB: Sorry to jump in, but you mentioned the rooms are hooked up to computers. Do you know what kind of technology he uses? Like, is it something custom-made or available to the public?\nA: I'm not entirely sure, but I think it's a mix of custom-made systems and advanced smart home technology that's not widely available yet. But back to what I was saying, the house is absolutely amazing!\nB: Would you want to live there?\nA:I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens, and probably an au pair or two to take care of the children. It's just too big of a place to maintain without a full-time staff, and I prefer a simpler lifestyle with more manageable spaces that don't require constant upkeep and supervision.\nB: So, what would your dream home be like then? Something smaller, I assume?", + "total_duration": 78.53215419501134, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through a remote control. It's also located near the sea, so he can park his boats next to his house. It's absolutely", + "original_text": "It's got its own library, theatre, swimming pool, and a guest house. The house itself has about ten different rooms that are all hooked up to computers so you can get things done in each room through a remote control. It's also located near the sea, so he can park his boats next to his house. It's absolutely [interrupt] stunning, with every detail meticulously designed to showcase luxury and technology, from the automated climate control systems to the voice-activated lighting that adjusts based on the time of day and your personal preferences.", + "start_time": 0, + "end_time": 32.80979591836735, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": true, + "text_after_interrupt": "stunning, with every detail meticulously designed to showcase luxury and technology, from the automated climate control systems to the voice-activated lighting that adjusts based on the time of day and your personal preferences." + }, + { + "speaker": "B", + "text": "Sorry to jump in, but you mentioned the rooms are hooked up to computers. Do you know what kind of technology he uses? Like, is it something custom-made or available to the public?", + "original_text": "Sorry to jump in, but you mentioned the rooms are hooked up to computers. Do you know what kind of technology he uses? Like, is it something custom-made or available to the public?", + "start_time": 18.819773242630387, + "end_time": 27.956825396825398, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/temp/line_1_B.wav", + "silence_duration": 0.4625566965002403, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I'm not entirely sure, but I think it's a mix of custom-made systems and advanced smart home technology that's not widely available yet. But back to what I was saying, the house is absolutely amazing!", + "original_text": "I'm not entirely sure, but I think it's a mix of custom-made systems and advanced smart home technology that's not widely available yet. But back to what I was saying, the house is absolutely amazing!", + "start_time": 33.1717715571727, + "end_time": 46.163336183023034, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/temp/line_2_A.wav", + "silence_duration": 0.36197563880534606, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Would you want to live there?", + "original_text": "Would you want to live there?", + "start_time": 46.60089280768081, + "end_time": 47.7967204720799, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/temp/line_3_B.wav", + "silence_duration": 0.43755662465777434, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens, and probably an au pair or two to take care of the children. It's just too big of a place to", + "original_text": "I think his house is fantastic, but I wouldn't want to live there. You would have to hire one or two people to clean all the rooms in the house, plus a few people to take care of the gardens, and probably an au pair or two to take care of the children. It's just too big of a place to [interrupt] maintain without a full-time staff, and I prefer a simpler lifestyle with more manageable spaces that don't require constant upkeep and supervision.", + "start_time": 48.273736757404826, + "end_time": 72.88688868484246, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/temp/line_4_A.wav", + "silence_duration": 0.4770162853249268, + "is_interrupted": true, + "text_after_interrupt": "maintain without a full-time staff, and I prefer a simpler lifestyle with more manageable spaces that don't require constant upkeep and supervision." + }, + { + "speaker": "B", + "text": "So, what would your dream home be like then? Something smaller, I assume?", + "original_text": "So, what would your dream home be like then? Something smaller, I assume?", + "start_time": 74.61962221877624, + "end_time": 78.53218457705289, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--492/temp/line_5_B.wav", + "silence_duration": 0.5866637113056765, + "is_interrupted": false + } + ] + }, + "DialogSum--val--493": { + "original_text": "A: What can I do for you, sir? \nB: What have you got this morning? \nA: Fruit juice, cakes and refreshments, and [interrupt] some freshly baked pastries as well, including croissants, danishes, and muffins that were prepared just an hour ago with premium ingredients. \nB: Could you tell me more about the fruit juices? I'm particularly interested in something fresh. \nA: Certainly! We have fresh orange juice, apple juice, and tomato juice. \nB: I'd like to have a glass of tomato juice, please. \nA: Any cereal, sir? \nB: Yes, a dish of cream of wheat. \nA: And eggs? \nB: Yes, bacon and eggs with buttered toast. I like my bacon very [interrupt] well done, almost crispy, with just a slight hint of smokiness and none of that chewy fat remaining. \nA: Sorry, did you say you wanted your bacon crispy? \nB: Yes, very crisp. \nA: How do you want your eggs? \nB: Fried, please. \nA: Anything more, sir? \nB: No, that's enough. Thank you.", + "cleaned_text": "A: What can I do for you, sir? \nB: What have you got this morning? \nA:Fruit juice, cakes and refreshments, and some freshly baked pastries as well, including croissants, danishes, and muffins that were prepared just an hour ago with premium ingredients.\nB: Could you tell me more about the fruit juices? I'm particularly interested in something fresh. \nA: Certainly! We have fresh orange juice, apple juice, and tomato juice. \nB: I'd like to have a glass of tomato juice, please. \nA: Any cereal, sir? \nB: Yes, a dish of cream of wheat. \nA: And eggs? \nB:Yes, bacon and eggs with buttered toast. I like my bacon very well done, almost crispy, with just a slight hint of smokiness and none of that chewy fat remaining.\nA: Sorry, did you say you wanted your bacon crispy? \nB: Yes, very crisp. \nA: How do you want your eggs? \nB: Fried, please. \nA: Anything more, sir? \nB: No, that's enough. Thank you.", + "total_duration": 50.599818594104306, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "What can I do for you, sir?", + "original_text": "What can I do for you, sir?", + "start_time": 0, + "end_time": 1.6370068027210884, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What have you got this morning?", + "original_text": "What have you got this morning?", + "start_time": 2.0042535353854936, + "end_time": 3.339400927675743, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_1_B.wav", + "silence_duration": 0.36724673266440533, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Fruit juice, cakes and refreshments, and", + "original_text": "Fruit juice, cakes and refreshments, and [interrupt] some freshly baked pastries as well, including croissants, danishes, and muffins that were prepared just an hour ago with premium ingredients.", + "start_time": 3.7865020910070997, + "end_time": 15.535799143161293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_2_A.wav", + "silence_duration": 0.447101163331357, + "is_interrupted": true, + "text_after_interrupt": "some freshly baked pastries as well, including croissants, danishes, and muffins that were prepared just an hour ago with premium ingredients." + }, + { + "speaker": "B", + "text": "Could you tell me more about the fruit juices? I'm particularly interested in something fresh.", + "original_text": "Could you tell me more about the fruit juices? I'm particularly interested in something fresh.", + "start_time": 7.780334290553585, + "end_time": 12.911944267877848, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_3_B.wav", + "silence_duration": 0.5983930086413294, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Certainly! We have fresh orange juice, apple juice, and tomato juice.", + "original_text": "Certainly! We have fresh orange juice, apple juice, and tomato juice.", + "start_time": 15.932937482441648, + "end_time": 20.36794882031013, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_4_A.wav", + "silence_duration": 0.3971383392803558, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'd like to have a glass of tomato juice, please.", + "original_text": "I'd like to have a glass of tomato juice, please.", + "start_time": 20.83790682390352, + "end_time": 23.032192538189236, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_5_B.wav", + "silence_duration": 0.4699580035933911, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Any cereal, sir?", + "original_text": "Any cereal, sir?", + "start_time": 23.57953367806896, + "end_time": 24.914681070359208, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_6_A.wav", + "silence_duration": 0.5473411398797215, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, a dish of cream of wheat.", + "original_text": "Yes, a dish of cream of wheat.", + "start_time": 25.220781310589736, + "end_time": 26.892618045283612, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_7_B.wav", + "silence_duration": 0.30610024023052623, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "And eggs?", + "original_text": "And eggs?", + "start_time": 27.45337244195652, + "end_time": 28.40539058254609, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_8_A.wav", + "silence_duration": 0.560754396672908, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, bacon and eggs with buttered toast. I like my bacon very", + "original_text": "Yes, bacon and eggs with buttered toast. I like my bacon very [interrupt] well done, almost crispy, with just a slight hint of smokiness and none of that chewy fat remaining.", + "start_time": 28.821160211948104, + "end_time": 38.770910778841525, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_9_B.wav", + "silence_duration": 0.41576962940201556, + "is_interrupted": true, + "text_after_interrupt": "well done, almost crispy, with just a slight hint of smokiness and none of that chewy fat remaining." + }, + { + "speaker": "A", + "text": "Sorry, did you say you wanted your bacon crispy?", + "original_text": "Sorry, did you say you wanted your bacon crispy?", + "start_time": 38.1828873144122, + "end_time": 41.13182155477501, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_10_A.wav", + "silence_duration": 0.5475838515095279, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes, very crisp.", + "original_text": "Yes, very crisp.", + "start_time": 41.64100554615113, + "end_time": 42.929713029144324, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_11_B.wav", + "silence_duration": 0.5091839913761185, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "How do you want your eggs?", + "original_text": "How do you want your eggs?", + "start_time": 43.4687447796166, + "end_time": 44.96643185444653, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_12_A.wav", + "silence_duration": 0.5390317504722758, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Fried, please.", + "original_text": "Fried, please.", + "start_time": 45.39925289484476, + "end_time": 46.40932092205564, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_13_B.wav", + "silence_duration": 0.4328210403982261, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Anything more, sir?", + "original_text": "Anything more, sir?", + "start_time": 46.741637352844016, + "end_time": 47.995514903864425, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_14_A.wav", + "silence_duration": 0.3323164307883709, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, that's enough. Thank you.", + "original_text": "No, that's enough. Thank you.", + "start_time": 48.591327747804925, + "end_time": 50.59985382490243, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--493/temp/line_15_B.wav", + "silence_duration": 0.5958128439405017, + "is_interrupted": false + } + ] + }, + "DialogSum--val--494": { + "original_text": "A: Excuse me, is there a table for 8 right now? \nB: Let me see... I am sorry the tables you want are [interrupt] currently occupied by another large party who's just finishing their desserts, but they should be free in about 15 minutes if you'd like to wait in our lounge area. \nA: Oh, before I forget, are there any tables near the window available? \nB: The tables by the window are booked for the evening, but as I was saying, the tables you want are booked as well though we can certainly accommodate you shortly. \nA: Well, since there are some small square tables, could we put two tables together? \nB: No problem, sir. Let me help you with that right away and I'll have our staff prepare the combined table with fresh linens and settings for your party.", + "cleaned_text": "A: Excuse me, is there a table for 8 right now? \nB:Let me see... I am sorry the tables you want are currently occupied by another large party who's just finishing their desserts, but they should be free in about 15 minutes if you'd like to wait in our lounge area.\nA: Oh, before I forget, are there any tables near the window available? \nB: The tables by the window are booked for the evening, but as I was saying, the tables you want are booked as well though we can certainly accommodate you shortly. \nA: Well, since there are some small square tables, could we put two tables together? \nB: No problem, sir. Let me help you with that right away and I'll have our staff prepare the combined table with fresh linens and settings for your party.", + "total_duration": 34.64621315192744, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Excuse me, is there a table for 8 right now?", + "original_text": "Excuse me, is there a table for 8 right now?", + "start_time": 0, + "end_time": 2.8792743764172335, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Let me see... I am sorry the tables you want are", + "original_text": "Let me see... I am sorry the tables you want are [interrupt] currently occupied by another large party who's just finishing their desserts, but they should be free in about 15 minutes if you'd like to wait in our lounge area.", + "start_time": 3.449891058162925, + "end_time": 13.805990831405555, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/temp/line_1_B.wav", + "silence_duration": 0.5706166817456915, + "is_interrupted": true, + "text_after_interrupt": "currently occupied by another large party who's just finishing their desserts, but they should be free in about 15 minutes if you'd like to wait in our lounge area." + }, + { + "speaker": "A", + "text": "Oh, before I forget, are there any tables near the window available?", + "original_text": "Oh, before I forget, are there any tables near the window available?", + "start_time": 6.25950557063458, + "end_time": 10.508757271314852, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/temp/line_2_A.wav", + "silence_duration": 0.3628413431490657, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "The tables by the window are booked for the evening, but as I was saying, the tables you want are booked as well though we can certainly accommodate you shortly.", + "original_text": "The tables by the window are booked for the evening, but as I was saying, the tables you want are booked as well though we can certainly accommodate you shortly.", + "start_time": 14.142763789477055, + "end_time": 21.457049503762768, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/temp/line_3_B.wav", + "silence_duration": 0.33677295807149876, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, since there are some small square tables, could we put two tables together?", + "original_text": "Well, since there are some small square tables, could we put two tables together?", + "start_time": 21.835712135072427, + "end_time": 26.630632769993063, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/temp/line_4_A.wav", + "silence_duration": 0.37866263130966066, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No problem, sir. Let me help you with that right away and I'll have our staff prepare the combined table with fresh linens and settings for your party.", + "original_text": "No problem, sir. Let me help you with that right away and I'll have our staff prepare the combined table with fresh linens and settings for your party.", + "start_time": 27.227448829784546, + "end_time": 34.64622433998863, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--494/temp/line_5_B.wav", + "silence_duration": 0.5968160597914824, + "is_interrupted": false + } + ] + }, + "DialogSum--val--495": { + "original_text": "A: I am totally fed up with my boss. He has crossed the line one too many times with his sexist comments. This time I am really going to report him for sexual harassment.\nB: What happened? Did your boss say something to offend you at [interrupt] the meeting yesterday when he made that comment about how women are \"naturally better at administrative tasks\" while men excel in leadership roles? That was completely inappropriate and unprofessional.\nA: He constantly lets inappropriate things slip out, referring to the women employees as girls or calling us sweetheart or darling. I doubt any of my male colleagues would stand for such treatment.\nB: Don't you think you are overreacting a little? Calling you by nicknames shouldn't [interrupt] be considered harassment unless there's clear evidence of a hostile work environment or repeated patterns of behavior that make you feel uncomfortable and undervalued as a professional.\nA: You're missing the point. It's about respect. He treats us with such a patronizing attitude, as if we are not equal or not as serious as our male co-workers. It's his attitude that needs to be changed, not just his words.\nB: That's what you get for working in a male-dominated field. But wait, you mentioned earlier that your boss said something specific this time—what exactly did he say that crossed the line?", + "cleaned_text": "A: I am totally fed up with my boss. He has crossed the line one too many times with his sexist comments. This time I am really going to report him for sexual harassment.\nB:What happened? Did your boss say something to offend you at the meeting yesterday when he made that comment about how women are \"naturally better at administrative tasks\" while men excel in leadership roles? That was completely inappropriate and unprofessional.\nA: He constantly lets inappropriate things slip out, referring to the women employees as girls or calling us sweetheart or darling. I doubt any of my male colleagues would stand for such treatment.\nB:Don't you think you are overreacting a little? Calling you by nicknames shouldn't be considered harassment unless there's clear evidence of a hostile work environment or repeated patterns of behavior that make you feel uncomfortable and undervalued as a professional.\nA: You're missing the point. It's about respect. He treats us with such a patronizing attitude, as if we are not equal or not as serious as our male co-workers. It's his attitude that needs to be changed, not just his words.\nB: That's what you get for working in a male-dominated field. But wait, you mentioned earlier that your boss said something specific this time—what exactly did he say that crossed the line?", + "total_duration": 66.41836734693878, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I am totally fed up with my boss. He has crossed the line one too many times with his sexist comments. This time I am really going to report him for sexual harassment.", + "original_text": "I am totally fed up with my boss. He has crossed the line one too many times with his sexist comments. This time I am really going to report him for sexual harassment.", + "start_time": 0, + "end_time": 10.448979591836734, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "What happened? Did your boss say something to offend you at", + "original_text": "What happened? Did your boss say something to offend you at [interrupt] the meeting yesterday when he made that comment about how women are \"naturally better at administrative tasks\" while men excel in leadership roles? That was completely inappropriate and unprofessional.", + "start_time": 10.967749322100298, + "end_time": 23.95931394795064, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/temp/line_1_B.wav", + "silence_duration": 0.5187697302635643, + "is_interrupted": true, + "text_after_interrupt": "the meeting yesterday when he made that comment about how women are \"naturally better at administrative tasks\" while men excel in leadership roles? That was completely inappropriate and unprofessional." + }, + { + "speaker": "A", + "text": "He constantly lets inappropriate things slip out, referring to the women employees as girls or calling us sweetheart or darling. I doubt any of my male colleagues would stand for such treatment.", + "original_text": "He constantly lets inappropriate things slip out, referring to the women employees as girls or calling us sweetheart or darling. I doubt any of my male colleagues would stand for such treatment.", + "start_time": 14.044393313030003, + "end_time": 27.05917789352887, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/temp/line_2_A.wav", + "silence_duration": 0.3261048424988487, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Don't you think you are overreacting a little? Calling you by nicknames shouldn't", + "original_text": "Don't you think you are overreacting a little? Calling you by nicknames shouldn't [interrupt] be considered harassment unless there's clear evidence of a hostile work environment or repeated patterns of behavior that make you feel uncomfortable and undervalued as a professional.", + "start_time": 27.648740086393875, + "end_time": 40.96538407732358, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/temp/line_3_B.wav", + "silence_duration": 0.5895621928650059, + "is_interrupted": true, + "text_after_interrupt": "be considered harassment unless there's clear evidence of a hostile work environment or repeated patterns of behavior that make you feel uncomfortable and undervalued as a professional." + }, + { + "speaker": "A", + "text": "You're missing the point. It's about respect. He treats us with such a patronizing attitude, as if we are not equal or not as serious as our male co-workers. It's his attitude that needs to be changed, not just his words.", + "original_text": "You're missing the point. It's about respect. He treats us with such a patronizing attitude, as if we are not equal or not as serious as our male co-workers. It's his attitude that needs to be changed, not just his words.", + "start_time": 41.56639039977649, + "end_time": 55.881492440592815, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/temp/line_4_A.wav", + "silence_duration": 0.3521903637427021, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's what you get for working in a male-dominated field. But wait, you mentioned earlier that your boss said something specific this time—what exactly did he say that crossed the line?", + "original_text": "That's what you get for working in a male-dominated field. But wait, you mentioned earlier that your boss said something specific this time—what exactly did he say that crossed the line?", + "start_time": 56.28289625841075, + "end_time": 66.41840646249238, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--495/temp/line_5_B.wav", + "silence_duration": 0.4014038178179327, + "is_interrupted": false + } + ] + }, + "DialogSum--val--496": { + "original_text": "A: Now that it's the new year, I've decided to turn over a new leaf.\nB: Yeah? You finally decided to wipe the slate [interrupt] clean and start fresh with a completely new perspective on life, embracing all the opportunities that come your way?\nA: Actually, yes! I have a new job, I'm living in a new city, with new friends! This is my opportunity to make some small changes in the way I live my life.\nB: That sounds exciting. So what are you going to do? Take up an art class or something?\nA: Well, first of all, I've decided to stop smoking. It's not that I'm pinching pennies or anything, it's just that I've been smoking since I was sixteen, and I think it's time to prioritize my health and make some positive changes.\nB: That's a big step! But I was curious, you mentioned a new job—what kind of work are you doing now?\nA: Oh, I'm working in marketing now, but about the smoking thing, I just feel like it's time to stop. And there's one last thing—I've decided to come out of the closet.\nB: It's about time! I'm so proud of you for making all these positive changes in your life. This is going to be an amazing year for you!", + "cleaned_text": "A: Now that it's the new year, I've decided to turn over a new leaf.\nB:Yeah? You finally decided to wipe the slate clean and start fresh with a completely new perspective on life, embracing all the opportunities that come your way?\nA: Actually, yes! I have a new job, I'm living in a new city, with new friends! This is my opportunity to make some small changes in the way I live my life.\nB: That sounds exciting. So what are you going to do? Take up an art class or something?\nA: Well, first of all, I've decided to stop smoking. It's not that I'm pinching pennies or anything, it's just that I've been smoking since I was sixteen, and I think it's time to prioritize my health and make some positive changes.\nB: That's a big step! But I was curious, you mentioned a new job—what kind of work are you doing now?\nA: Oh, I'm working in marketing now, but about the smoking thing, I just feel like it's time to stop. And there's one last thing—I've decided to come out of the closet.\nB: It's about time! I'm so proud of you for making all these positive changes in your life. This is going to be an amazing year for you!", + "total_duration": 59.17115646258503, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Now that it's the new year, I've decided to turn over a new leaf.", + "original_text": "Now that it's the new year, I've decided to turn over a new leaf.", + "start_time": 0, + "end_time": 4.0751020408163265, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah? You finally decided to wipe the slate", + "original_text": "Yeah? You finally decided to wipe the slate [interrupt] clean and start fresh with a completely new perspective on life, embracing all the opportunities that come your way?", + "start_time": 4.394830506868141, + "end_time": 13.427392865144785, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_1_B.wav", + "silence_duration": 0.31972846605181465, + "is_interrupted": true, + "text_after_interrupt": "clean and start fresh with a completely new perspective on life, embracing all the opportunities that come your way?" + }, + { + "speaker": "A", + "text": "Actually, yes! I have a new job, I'm living in a new city, with new friends! This is my opportunity to make some small changes in the way I live my life.", + "original_text": "Actually, yes! I have a new job, I'm living in a new city, with new friends! This is my opportunity to make some small changes in the way I live my life.", + "start_time": 7.146395132718482, + "end_time": 16.480816901425964, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_2_A.wav", + "silence_duration": 0.3837116882582351, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That sounds exciting. So what are you going to do? Take up an art class or something?", + "original_text": "That sounds exciting. So what are you going to do? Take up an art class or something?", + "start_time": 16.8035299039952, + "end_time": 20.994731718054158, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_3_B.wav", + "silence_duration": 0.32271300256923924, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, first of all, I've decided to stop smoking. It's not that I'm pinching pennies or anything, it's just that I've been smoking since I was sixteen, and I think it's time to prioritize my health and make some positive changes.", + "original_text": "Well, first of all, I've decided to stop smoking. It's not that I'm pinching pennies or anything, it's just that I've been smoking since I was sixteen, and I think it's time to prioritize my health and make some positive changes.", + "start_time": 21.43206136684784, + "end_time": 35.14344458680249, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_4_A.wav", + "silence_duration": 0.4373296487936809, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "That's a big step! But I was curious, you mentioned a new job—what kind of work are you doing now?", + "original_text": "That's a big step! But I was curious, you mentioned a new job—what kind of work are you doing now?", + "start_time": 35.52887129657819, + "end_time": 40.85785088841492, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_5_B.wav", + "silence_duration": 0.38542670977569937, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, I'm working in marketing now, but about the smoking thing, I just feel like it's time to stop. And there's one last thing—I've decided to come out of the closet.", + "original_text": "Oh, I'm working in marketing now, but about the smoking thing, I just feel like it's time to stop. And there's one last thing—I've decided to come out of the closet.", + "start_time": 41.34970384436403, + "end_time": 51.48521404844566, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_6_A.wav", + "silence_duration": 0.4918529559491087, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It's about time! I'm so proud of you for making all these positive changes in your life. This is going to be an amazing year for you!", + "original_text": "It's about time! I'm so proud of you for making all these positive changes in your life. This is going to be an amazing year for you!", + "start_time": 51.97299979510592, + "end_time": 59.171185736149006, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--496/temp/line_7_B.wav", + "silence_duration": 0.4877857466602612, + "is_interrupted": false + } + ] + }, + "DialogSum--val--497": { + "original_text": "A: You married Joe, didn't you? \nB: Joe? I don't know what you [interrupt] mean by that, we were definitely close but marriage was never something we seriously considered given our different life goals and priorities at the time. \nA: Sorry to jump in, but I just remembered—didn't you mention something about being in love with him? \nB: Oh, I took a shine to him when we met for the first time. But it comes and [interrupt] fades as we got to know each other better, especially when I realized how incompatible we were in terms of values and long-term aspirations. \nA: Wait, so you're saying it wasn't anything serious? What happened after that? \nB: It comes and goes. Feelings are complicated, you know?", + "cleaned_text": "A: You married Joe, didn't you? \nB:Joe? I don't know what you mean by that, we were definitely close but marriage was never something we seriously considered given our different life goals and priorities at the time.\nA: Sorry to jump in, but I just remembered—didn't you mention something about being in love with him? \nB:Oh, I took a shine to him when we met for the first time. But it comes and fades as we got to know each other better, especially when I realized how incompatible we were in terms of values and long-term aspirations.\nA: Wait, so you're saying it wasn't anything serious? What happened after that? \nB: It comes and goes. Feelings are complicated, you know?", + "total_duration": 29.407573696145125, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "You married Joe, didn't you?", + "original_text": "You married Joe, didn't you?", + "start_time": 0, + "end_time": 1.555736961451247, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Joe? I don't know what you", + "original_text": "Joe? I don't know what you [interrupt] mean by that, we were definitely close but marriage was never something we seriously considered given our different life goals and priorities at the time.", + "start_time": 1.8975355297963916, + "end_time": 11.48737679963766, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/temp/line_1_B.wav", + "silence_duration": 0.34179856834514444, + "is_interrupted": true, + "text_after_interrupt": "mean by that, we were definitely close but marriage was never something we seriously considered given our different life goals and priorities at the time." + }, + { + "speaker": "A", + "text": "Sorry to jump in, but I just remembered—didn't you mention something about being in love with him?", + "original_text": "Sorry to jump in, but I just remembered—didn't you mention something about being in love with him?", + "start_time": 3.6506421057601104, + "end_time": 8.979621697596844, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/temp/line_2_A.wav", + "silence_duration": 0.40875431323039413, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, I took a shine to him when we met for the first time. But it comes and", + "original_text": "Oh, I took a shine to him when we met for the first time. But it comes and [interrupt] fades as we got to know each other better, especially when I realized how incompatible we were in terms of values and long-term aspirations.", + "start_time": 11.866219419386148, + "end_time": 22.617058421653724, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/temp/line_3_B.wav", + "silence_duration": 0.3788426197484872, + "is_interrupted": true, + "text_after_interrupt": "fades as we got to know each other better, especially when I realized how incompatible we were in terms of values and long-term aspirations." + }, + { + "speaker": "A", + "text": "Wait, so you're saying it wasn't anything serious? What happened after that?", + "original_text": "Wait, so you're saying it wasn't anything serious? What happened after that?", + "start_time": 21.594874632667658, + "end_time": 26.22725558504861, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/temp/line_4_A.wav", + "silence_duration": 0.3015091571336604, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It comes and goes. Feelings are complicated, you know?", + "original_text": "It comes and goes. Feelings are complicated, you know?", + "start_time": 26.748919416901412, + "end_time": 29.407604224157648, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--497/temp/line_5_B.wav", + "silence_duration": 0.5216638318528031, + "is_interrupted": false + } + ] + }, + "DialogSum--val--498": { + "original_text": "A: How can I help you, ma'am?\nB: I was hoping you could look at my car today. For the past few weeks, it has been making very strange [interrupt] grinding noises that seem to come from the front left wheel area, and it's getting worse especially when I brake hard or go over bumps.\nA: Strange noises? What kind of noises are we talking about?\nB: It sounds as if something is being damaged in the wheels. It only happens when I'm slowing down.\nA: Wow, it sounds like you need new brakes. You'll have to leave the car with us until [interrupt] we can perform a full diagnostic check on all the brake components including pads, rotors and calipers to ensure everything gets fixed properly and safely.\nB: Oh, I was really hoping you'd be able to get it back to me this afternoon. Is there any way to speed up the process?\nA: Unfortunately, we need to order the parts, and we can't get started until they arrive. If I order them now, they'll be here this afternoon or tomorrow morning at the latest.\nB: I see. Well, why don't I just bring my car back in the morning? There is a show I really want to see downtown tonight.", + "cleaned_text": "A: How can I help you, ma'am?\nB:I was hoping you could look at my car today. For the past few weeks, it has been making very strange grinding noises that seem to come from the front left wheel area, and it's getting worse especially when I brake hard or go over bumps.\nA: Strange noises? What kind of noises are we talking about?\nB: It sounds as if something is being damaged in the wheels. It only happens when I'm slowing down.\nA:Wow, it sounds like you need new brakes. You'll have to leave the car with us until we can perform a full diagnostic check on all the brake components including pads, rotors and calipers to ensure everything gets fixed properly and safely.\nB: Oh, I was really hoping you'd be able to get it back to me this afternoon. Is there any way to speed up the process?\nA: Unfortunately, we need to order the parts, and we can't get started until they arrive. If I order them now, they'll be here this afternoon or tomorrow morning at the latest.\nB: I see. Well, why don't I just bring my car back in the morning? There is a show I really want to see downtown tonight.", + "total_duration": 50.77260770975057, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "How can I help you, ma'am?", + "original_text": "How can I help you, ma'am?", + "start_time": 0, + "end_time": 1.4164172335600906, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I was hoping you could look at my car today. For the past few weeks, it has been making very strange", + "original_text": "I was hoping you could look at my car today. For the past few weeks, it has been making very strange [interrupt] grinding noises that seem to come from the front left wheel area, and it's getting worse especially when I brake hard or go over bumps.", + "start_time": 1.8922702261911373, + "end_time": 12.91013870691676, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_1_B.wav", + "silence_duration": 0.4758529926310466, + "is_interrupted": true, + "text_after_interrupt": "grinding noises that seem to come from the front left wheel area, and it's getting worse especially when I brake hard or go over bumps." + }, + { + "speaker": "A", + "text": "Strange noises? What kind of noises are we talking about?", + "original_text": "Strange noises? What kind of noises are we talking about?", + "start_time": 6.605921019841931, + "end_time": 10.634583151361205, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_2_A.wav", + "silence_duration": 0.5825831585417469, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "It sounds as if something is being damaged in the wheels. It only happens when I'm slowing down.", + "original_text": "It sounds as if something is being damaged in the wheels. It only happens when I'm slowing down.", + "start_time": 13.474617399680568, + "end_time": 18.548177490383516, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_3_B.wav", + "silence_duration": 0.5644786927638079, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Wow, it sounds like you need new brakes. You'll have to leave the car with us until", + "original_text": "Wow, it sounds like you need new brakes. You'll have to leave the car with us until [interrupt] we can perform a full diagnostic check on all the brake components including pads, rotors and calipers to ensure everything gets fixed properly and safely.", + "start_time": 18.86374321648034, + "end_time": 32.7608860736232, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_4_A.wav", + "silence_duration": 0.3155657260968236, + "is_interrupted": true, + "text_after_interrupt": "we can perform a full diagnostic check on all the brake components including pads, rotors and calipers to ensure everything gets fixed properly and safely." + }, + { + "speaker": "B", + "text": "Oh, I was really hoping you'd be able to get it back to me this afternoon. Is there any way to speed up the process?", + "original_text": "Oh, I was really hoping you'd be able to get it back to me this afternoon. Is there any way to speed up the process?", + "start_time": 28.54805562616854, + "end_time": 34.480754038866955, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_5_B.wav", + "silence_duration": 0.5796052159779845, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Unfortunately, we need to order the parts, and we can't get started until they arrive. If I order them now, they'll be here this afternoon or tomorrow morning at the latest.", + "original_text": "Unfortunately, we need to order the parts, and we can't get started until they arrive. If I order them now, they'll be here this afternoon or tomorrow morning at the latest.", + "start_time": 34.96033739147897, + "end_time": 44.329589092159246, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_6_A.wav", + "silence_duration": 0.47958335261201734, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I see. Well, why don't I just bring my car back in the morning? There is a show I really want to see downtown tonight.", + "original_text": "I see. Well, why don't I just bring my car back in the morning? There is a show I really want to see downtown tonight.", + "start_time": 44.92120361280741, + "end_time": 50.77263218423598, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--498/temp/line_7_B.wav", + "silence_duration": 0.5916145206481616, + "is_interrupted": false + } + ] + }, + "DialogSum--val--499": { + "original_text": "A: Hello, Amazon's customer service. How can I help you? \nB: Hello, it's the book I got from your website yesterday when I was reading it. I found that one page is missing, page [interrupt] 245, to be exact, and it's right in the middle of an important chapter which makes it impossible to follow the story properly. \nA: Sorry to interrupt, but could you please provide me with your order number so I can assist you further? \nB: Oh, sure. It's B113. Dash 7423935. \nA: OK. Let me check. It's the paper bag night of the Hunter written by RA Salvatore you bought on our web 10 days ago, which is on October thirteenth, right? \nB: Yes. \nA: Well, we might need you to take a photo of the missing part of this book and upload it to the customer service page of our website. And when the problem is confirmed, we will send you a new book in 2 days. \nB: OK. Then what should I do with the old book? Should I send it back to you or donate it to a local library if it's still readable. \nA: Oh, sorry to cut in. You were asking about the old book—no need to return it, sir. You can keep it if you like. Is there anything more I can help you with? \nB: No, thanks.", + "cleaned_text": "A: Hello, Amazon's customer service. How can I help you? \nB:Hello, it's the book I got from your website yesterday when I was reading it. I found that one page is missing, page 245, to be exact, and it's right in the middle of an important chapter which makes it impossible to follow the story properly.\nA: Sorry to interrupt, but could you please provide me with your order number so I can assist you further? \nB: Oh, sure. It's B113. Dash 7423935. \nA: OK. Let me check. It's the paper bag night of the Hunter written by RA Salvatore you bought on our web 10 days ago, which is on October thirteenth, right? \nB: Yes. \nA: Well, we might need you to take a photo of the missing part of this book and upload it to the customer service page of our website. And when the problem is confirmed, we will send you a new book in 2 days. \nB: OK. Then what should I do with the old book? Should I send it back to you or donate it to a local library if it's still readable. \nA: Oh, sorry to cut in. You were asking about the old book—no need to return it, sir. You can keep it if you like. Is there anything more I can help you with? \nB: No, thanks.", + "total_duration": 67.5487074829932, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "Hello, Amazon's customer service. How can I help you?", + "original_text": "Hello, Amazon's customer service. How can I help you?", + "start_time": 0, + "end_time": 3.877732426303855, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Hello, it's the book I got from your website yesterday when I was reading it. I found that one page is missing, page", + "original_text": "Hello, it's the book I got from your website yesterday when I was reading it. I found that one page is missing, page [interrupt] 245, to be exact, and it's right in the middle of an important chapter which makes it impossible to follow the story properly.", + "start_time": 4.36150106530992, + "end_time": 16.714516938325794, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_1_B.wav", + "silence_duration": 0.4837686390060645, + "is_interrupted": true, + "text_after_interrupt": "245, to be exact, and it's right in the middle of an important chapter which makes it impossible to follow the story properly." + }, + { + "speaker": "A", + "text": "Sorry to interrupt, but could you please provide me with your order number so I can assist you further?", + "original_text": "Sorry to interrupt, but could you please provide me with your order number so I can assist you further?", + "start_time": 10.43351920589949, + "end_time": 16.66807702902874, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_2_A.wav", + "silence_duration": 0.3988829385019933, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Oh, sure. It's B113. Dash 7423935.", + "original_text": "Oh, sure. It's B113. Dash 7423935.", + "start_time": 17.2062397588871, + "end_time": 23.905196674986875, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_3_B.wav", + "silence_duration": 0.49172282056130817, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "OK. Let me check. It's the paper bag night of the Hunter written by RA Salvatore you bought on our web 10 days ago, which is on October thirteenth, right?", + "original_text": "OK. Let me check. It's the paper bag night of the Hunter written by RA Salvatore you bought on our web 10 days ago, which is on October thirteenth, right?", + "start_time": 24.311918378948835, + "end_time": 34.83055783473115, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_4_A.wav", + "silence_duration": 0.4067217039619615, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yes.", + "original_text": "Yes.", + "start_time": 35.222841909493404, + "end_time": 35.7569008664095, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_5_B.wav", + "silence_duration": 0.39228407476225274, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Well, we might need you to take a photo of the missing part of this book and upload it to the customer service page of our website. And when the problem is confirmed, we will send you a new book in 2 days.", + "original_text": "Well, we might need you to take a photo of the missing part of this book and upload it to the customer service page of our website. And when the problem is confirmed, we will send you a new book in 2 days.", + "start_time": 36.111905645385384, + "end_time": 48.62746120094094, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_6_A.wav", + "silence_duration": 0.3550047789758819, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "OK. Then what should I do with the old book? Should I send it back to you or donate it to a local library if it's still readable.", + "original_text": "OK. Then what should I do with the old book? Should I send it back to you or donate it to a local library if it's still readable.", + "start_time": 48.97855299408957, + "end_time": 55.573020114270975, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_7_B.wav", + "silence_duration": 0.3510917931486276, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Oh, sorry to cut in. You were asking about the old book—no need to return it, sir. You can keep it if you like. Is there anything more I can help you with?", + "original_text": "Oh, sorry to cut in. You were asking about the old book—no need to return it, sir. You can keep it if you like. Is there anything more I can help you with?", + "start_time": 56.1030846133482, + "end_time": 66.26181477207837, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_8_A.wav", + "silence_duration": 0.5300644990772252, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "No, thanks.", + "original_text": "No, thanks.", + "start_time": 66.770878270297, + "end_time": 67.54874675102263, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--499/temp/line_9_B.wav", + "silence_duration": 0.5090634982186416, + "is_interrupted": false + } + ] + }, + "DialogSum--val--500": { + "original_text": "A: I can't believe it's almost summer.\nB: Yeah, I know. The year went really fast.\nA: What are you going to do this summer vacation?\nB: I'm going to work for a company.\nA: A company? What's that? What do you [interrupt] do there? Are you going to be in an office or will you be working at different locations depending on the catering events?\nB: Oh, it's a catering company. We help at parties. Our company prepares and serves the food, and usually another company provides the music.\nA: I didn't know you could cook.\nB: I don't have to cook. I'm only an assistant.\nA: When do you start?\nB: Tomorrow. We're helping a birthday party. Then a big family get together.\nA: So, what exactly do you [interrupt] do during the event? Do you help with serving or just setting up, and how do you handle any last-minute changes or special requests from the clients?\nB: Before the party starts, I help set everything up. You know, bring the food in and arrange the tables, make sure it looks nice.\nA: Got it. But you mentioned something about another company providing the music—do you also coordinate with them during the event?", + "cleaned_text": "A: I can't believe it's almost summer.\nB: Yeah, I know. The year went really fast.\nA: What are you going to do this summer vacation?\nB: I'm going to work for a company.\nA:A company? What's that? What do you do there? Are you going to be in an office or will you be working at different locations depending on the catering events?\nB: Oh, it's a catering company. We help at parties. Our company prepares and serves the food, and usually another company provides the music.\nA: I didn't know you could cook.\nB: I don't have to cook. I'm only an assistant.\nA: When do you start?\nB: Tomorrow. We're helping a birthday party. Then a big family get together.\nA:So, what exactly do you do during the event? Do you help with serving or just setting up, and how do you handle any last-minute changes or special requests from the clients?\nB: Before the party starts, I help set everything up. You know, bring the food in and arrange the tables, make sure it looks nice.\nA: Got it. But you mentioned something about another company providing the music—do you also coordinate with them during the event?", + "total_duration": 55.401315192743766, + "stereo_audio": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/stereo_dialogue.wav", + "speaker_tracks": { + "A": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/A_track.wav", + "B": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/B_track.wav" + }, + "error_type": "error_after_interrupt", + "segments": [ + { + "speaker": "A", + "text": "I can't believe it's almost summer.", + "original_text": "I can't believe it's almost summer.", + "start_time": 0, + "end_time": 1.8692063492063493, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_0_A.wav", + "silence_duration": 0, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Yeah, I know. The year went really fast.", + "original_text": "Yeah, I know. The year went really fast.", + "start_time": 2.2254987125940455, + "end_time": 4.756473769283388, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_1_B.wav", + "silence_duration": 0.3562923633876961, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "What are you going to do this summer vacation?", + "original_text": "What are you going to do this summer vacation?", + "start_time": 5.173030285748416, + "end_time": 7.344096045385604, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_2_A.wav", + "silence_duration": 0.4165565164650276, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I'm going to work for a company.", + "original_text": "I'm going to work for a company.", + "start_time": 7.675777181859912, + "end_time": 9.208294188662633, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_3_B.wav", + "silence_duration": 0.33168113647430764, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "A company? What's that? What do you", + "original_text": "A company? What's that? What do you [interrupt] do there? Are you going to be in an office or will you be working at different locations depending on the catering events?", + "start_time": 9.791321129161615, + "end_time": 20.08937101578293, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_4_A.wav", + "silence_duration": 0.5830269404989815, + "is_interrupted": true, + "text_after_interrupt": "do there? Are you going to be in an office or will you be working at different locations depending on the catering events?" + }, + { + "speaker": "B", + "text": "Oh, it's a catering company. We help at parties. Our company prepares and serves the food, and usually another company provides the music.", + "original_text": "Oh, it's a catering company. We help at parties. Our company prepares and serves the food, and usually another company provides the music.", + "start_time": 13.227874417143473, + "end_time": 20.797579632562975, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_5_B.wav", + "silence_duration": 0.48091175911131345, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "I didn't know you could cook.", + "original_text": "I didn't know you could cook.", + "start_time": 21.118114251520087, + "end_time": 22.755121054241176, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_6_A.wav", + "silence_duration": 0.3205346189571126, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "I don't have to cook. I'm only an assistant.", + "original_text": "I don't have to cook. I'm only an assistant.", + "start_time": 23.129464707113556, + "end_time": 25.486290103938952, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_7_B.wav", + "silence_duration": 0.37434365287238003, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "When do you start?", + "original_text": "When do you start?", + "start_time": 25.806109940345177, + "end_time": 26.88583783150164, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_8_A.wav", + "silence_duration": 0.3198198364062261, + "is_interrupted": false + }, + { + "speaker": "B", + "text": "Tomorrow. We're helping a birthday party. Then a big family get together.", + "original_text": "Tomorrow. We're helping a birthday party. Then a big family get together.", + "start_time": 27.262827519394623, + "end_time": 31.361149514859477, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_9_B.wav", + "silence_duration": 0.3769896878929826, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "So, what exactly do you", + "original_text": "So, what exactly do you [interrupt] do during the event? Do you help with serving or just setting up, and how do you handle any last-minute changes or special requests from the clients?", + "start_time": 31.929508564749202, + "end_time": 42.146288610100676, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_10_A.wav", + "silence_duration": 0.5683590498897237, + "is_interrupted": true, + "text_after_interrupt": "do during the event? Do you help with serving or just setting up, and how do you handle any last-minute changes or special requests from the clients?" + }, + { + "speaker": "B", + "text": "Before the party starts, I help set everything up. You know, bring the food in and arrange the tables, make sure it looks nice.", + "original_text": "Before the party starts, I help set everything up. You know, bring the food in and arrange the tables, make sure it looks nice.", + "start_time": 41.43456503746846, + "end_time": 47.56463306467934, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_11_B.wav", + "silence_duration": 0.30534572666500404, + "is_interrupted": false + }, + { + "speaker": "A", + "text": "Got it. But you mentioned something about another company providing the music—do you also coordinate with them during the event?", + "original_text": "Got it. But you mentioned something about another company providing the music—do you also coordinate with them during the event?", + "start_time": 48.12187468574204, + "end_time": 55.401330468054965, + "audio_file": "/root/autodl-tmp/output_overlap5s_dialogsum_testVal/processed_processed_2_val_dialogsum_output/DialogSum--val--500/temp/line_12_A.wav", + "silence_duration": 0.557241621062698, + "is_interrupted": false + } + ] + } +} \ No newline at end of file