word-sub / tests /expected /corner_cases /large-v2.efficient_gloria.mp3.words.json
RaeesRSB's picture
Upload 185 files
2cba4ca
{
"text": " Ella, my glorious love. How are you? Oh, I'm okay. I will be. I said she could stay with us tomorrow, just until she feels better. Of course she can. No, this won't be for long. Well, if you can stay as long as you want, my love. I really missed you. I agree.",
"segments": [
{
"id": 0,
"seek": 0,
"start": 0.0,
"end": 4.02,
"text": " Ella, my glorious love.",
"tokens": [
50364,
29261,
11,
452,
24026,
959,
13,
50564
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.477,
"words": [
{
"text": "Ella,",
"start": 0.0,
"end": 1.68,
"confidence": 0.128
},
{
"text": "my",
"start": 1.92,
"end": 2.1,
"confidence": 0.733
},
{
"text": "glorious",
"start": 2.1,
"end": 3.36,
"confidence": 0.625
},
{
"text": "love.",
"start": 3.36,
"end": 4.02,
"confidence": 0.883
}
]
},
{
"id": 1,
"seek": 0,
"start": 5.46,
"end": 6.24,
"text": " How are you?",
"tokens": [
50564,
1012,
366,
291,
30,
50664
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.682,
"words": [
{
"text": "How",
"start": 5.46,
"end": 5.62,
"confidence": 0.454
},
{
"text": "are",
"start": 5.62,
"end": 6.02,
"confidence": 0.893
},
{
"text": "you?",
"start": 6.02,
"end": 6.24,
"confidence": 0.783
}
]
},
{
"id": 2,
"seek": 0,
"start": 6.32,
"end": 9.12,
"text": " Oh, I'm okay. I will be.",
"tokens": [
50664,
876,
11,
286,
478,
1392,
13,
286,
486,
312,
13,
50814
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.73,
"words": [
{
"text": "Oh,",
"start": 6.32,
"end": 6.66,
"confidence": 0.479
},
{
"text": "I'm",
"start": 6.74,
"end": 7.02,
"confidence": 0.971
},
{
"text": "okay.",
"start": 7.02,
"end": 7.7,
"confidence": 0.476
},
{
"text": "I",
"start": 8.14,
"end": 8.56,
"confidence": 0.714
},
{
"text": "will",
"start": 8.56,
"end": 8.82,
"confidence": 0.795
},
{
"text": "be.",
"start": 8.82,
"end": 9.12,
"confidence": 0.906
}
]
},
{
"id": 3,
"seek": 0,
"start": 9.32,
"end": 11.42,
"text": " I said she could stay with us tomorrow, just until she feels better.",
"tokens": [
50814,
286,
848,
750,
727,
1754,
365,
505,
4153,
11,
445,
1826,
750,
3417,
1101,
13,
50914
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.723,
"words": [
{
"text": "I",
"start": 9.32,
"end": 9.48,
"confidence": 0.878
},
{
"text": "said",
"start": 9.48,
"end": 9.62,
"confidence": 0.862
},
{
"text": "she",
"start": 9.62,
"end": 9.76,
"confidence": 0.762
},
{
"text": "could",
"start": 9.76,
"end": 9.88,
"confidence": 0.801
},
{
"text": "stay",
"start": 9.88,
"end": 10.08,
"confidence": 0.921
},
{
"text": "with",
"start": 10.08,
"end": 10.22,
"confidence": 0.812
},
{
"text": "us",
"start": 10.22,
"end": 10.36,
"confidence": 0.848
},
{
"text": "tomorrow,",
"start": 10.36,
"end": 10.56,
"confidence": 0.515
},
{
"text": "just",
"start": 10.74,
"end": 10.76,
"confidence": 0.433
},
{
"text": "until",
"start": 10.76,
"end": 10.86,
"confidence": 0.439
},
{
"text": "she",
"start": 10.86,
"end": 10.98,
"confidence": 0.809
},
{
"text": "feels",
"start": 10.98,
"end": 11.16,
"confidence": 0.777
},
{
"text": "better.",
"start": 11.16,
"end": 11.42,
"confidence": 0.822
}
]
},
{
"id": 4,
"seek": 0,
"start": 11.9,
"end": 13.06,
"text": " Of course she can.",
"tokens": [
50914,
2720,
1164,
750,
393,
13,
51014
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.761,
"words": [
{
"text": "Of",
"start": 11.9,
"end": 12.16,
"confidence": 0.562
},
{
"text": "course",
"start": 12.16,
"end": 12.54,
"confidence": 0.875
},
{
"text": "she",
"start": 12.54,
"end": 12.8,
"confidence": 0.758
},
{
"text": "can.",
"start": 12.8,
"end": 13.06,
"confidence": 0.899
}
]
},
{
"id": 5,
"seek": 0,
"start": 13.7,
"end": 15.2,
"text": " No, this won't be for long.",
"tokens": [
51014,
883,
11,
341,
1582,
380,
312,
337,
938,
13,
51114
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.774,
"words": [
{
"text": "No,",
"start": 13.7,
"end": 13.72,
"confidence": 0.381
},
{
"text": "this",
"start": 13.92,
"end": 14.26,
"confidence": 0.702
},
{
"text": "won't",
"start": 14.26,
"end": 14.54,
"confidence": 0.943
},
{
"text": "be",
"start": 14.54,
"end": 14.68,
"confidence": 0.898
},
{
"text": "for",
"start": 14.68,
"end": 14.86,
"confidence": 0.891
},
{
"text": "long.",
"start": 14.86,
"end": 15.2,
"confidence": 0.877
}
]
},
{
"id": 6,
"seek": 0,
"start": 15.3,
"end": 17.48,
"text": " Well, if you can stay as long as you want, my love.",
"tokens": [
51114,
1042,
11,
498,
291,
393,
1754,
382,
938,
382,
291,
528,
11,
452,
959,
13,
51214
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.836,
"words": [
{
"text": "Well,",
"start": 15.3,
"end": 15.46,
"confidence": 0.647
},
{
"text": "if",
"start": 15.52,
"end": 15.6,
"confidence": 0.615
},
{
"text": "you",
"start": 15.6,
"end": 15.68,
"confidence": 0.896
},
{
"text": "can",
"start": 15.68,
"end": 15.82,
"confidence": 0.851
},
{
"text": "stay",
"start": 15.82,
"end": 16.04,
"confidence": 0.924
},
{
"text": "as",
"start": 16.04,
"end": 16.2,
"confidence": 0.885
},
{
"text": "long",
"start": 16.2,
"end": 16.32,
"confidence": 0.883
},
{
"text": "as",
"start": 16.32,
"end": 16.48,
"confidence": 0.907
},
{
"text": "you",
"start": 16.48,
"end": 16.58,
"confidence": 0.899
},
{
"text": "want,",
"start": 16.58,
"end": 16.76,
"confidence": 0.81
},
{
"text": "my",
"start": 16.9,
"end": 17.02,
"confidence": 0.901
},
{
"text": "love.",
"start": 17.02,
"end": 17.48,
"confidence": 0.896
}
]
},
{
"id": 7,
"seek": 0,
"start": 17.66,
"end": 18.96,
"text": " I really missed you.",
"tokens": [
51214,
286,
534,
6721,
291,
13,
51314
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.479,
"words": [
{
"text": "I",
"start": 17.66,
"end": 17.86,
"confidence": 0.252
},
{
"text": "really",
"start": 17.86,
"end": 18.22,
"confidence": 0.447
},
{
"text": "missed",
"start": 18.22,
"end": 18.7,
"confidence": 0.653
},
{
"text": "you.",
"start": 18.7,
"end": 18.96,
"confidence": 0.717
}
]
},
{
"id": 8,
"seek": 0,
"start": 19.58,
"end": 20.6,
"text": " I agree.",
"tokens": [
51314,
286,
3986,
13,
51414
],
"temperature": 0.0,
"avg_logprob": -0.36081909347366503,
"compression_ratio": 1.446927374301676,
"no_speech_prob": 0.244294673204422,
"confidence": 0.421,
"words": [
{
"text": "I",
"start": 19.58,
"end": 20.4,
"confidence": 0.403
},
{
"text": "agree.",
"start": 20.4,
"end": 20.6,
"confidence": 0.439
}
]
}
],
"language": "en"
}