word-sub / tests /expected /corner_cases.cpu /accurate.tiny_apollo11.mp3.words.json
RaeesRSB's picture
Upload 185 files
2cba4ca
{
"text": " I'm all around my business and we gotta eat recommendations for you on your door to the VA We have 18A's I'm all around my business and I'm all around my business and I'm all around my business I got a little bit of a problem with that, and you want to have the advice down My goal is to reach these things, not to reach out to them and they're out of the bag And I can't see anything else, I don't want to hear anything else I'm at the least, I'm not making the tag I can't see anything else Yeah, I'm taking a heavy out of the bag We're on the highway, we're on the highway, we're on the highway We're on the highway, we're on the highway We want to hear that, this is the case, we know we can't get that much of our business So I guess we'll be somewhere in our place, but it's not over Okay, it's not over, it's not over, it's not over",
"segments": [
{
"id": 0,
"seek": 0,
"start": 0.6,
"end": 5.28,
"text": " I'm all around my business and we gotta eat recommendations for you on your door to the VA",
"tokens": [
286,
478,
439,
926,
452,
1606,
293,
321,
3428,
1862,
10434,
337,
291,
322,
428,
2853,
281,
264,
18527
],
"temperature": 0.0,
"avg_logprob": -0.4247800021701389,
"compression_ratio": 6.281818181818182,
"no_speech_prob": 0.3518604338169098,
"confidence": 0.27,
"words": [
{
"text": "I'm",
"start": 0.6,
"end": 0.74,
"confidence": 0.168
},
{
"text": "all",
"start": 0.74,
"end": 1.02,
"confidence": 0.083
},
{
"text": "around",
"start": 1.02,
"end": 1.24,
"confidence": 0.103
},
{
"text": "my",
"start": 1.24,
"end": 1.42,
"confidence": 0.129
},
{
"text": "business",
"start": 1.42,
"end": 1.62,
"confidence": 0.339
},
{
"text": "and",
"start": 1.62,
"end": 1.9,
"confidence": 0.613
},
{
"text": "we",
"start": 1.9,
"end": 1.98,
"confidence": 0.938
},
{
"text": "gotta",
"start": 1.98,
"end": 2.16,
"confidence": 0.402
},
{
"text": "eat",
"start": 2.16,
"end": 2.38,
"confidence": 0.246
},
{
"text": "recommendations",
"start": 2.38,
"end": 2.84,
"confidence": 0.111
},
{
"text": "for",
"start": 2.84,
"end": 3.48,
"confidence": 0.236
},
{
"text": "you",
"start": 3.48,
"end": 3.62,
"confidence": 0.95
},
{
"text": "on",
"start": 3.62,
"end": 3.82,
"confidence": 0.774
},
{
"text": "your",
"start": 3.82,
"end": 4.36,
"confidence": 0.598
},
{
"text": "door",
"start": 4.36,
"end": 4.62,
"confidence": 0.113
},
{
"text": "to",
"start": 4.62,
"end": 4.84,
"confidence": 0.194
},
{
"text": "the",
"start": 4.84,
"end": 4.9,
"confidence": 0.457
},
{
"text": "VA",
"start": 4.9,
"end": 5.28,
"confidence": 0.23
}
]
},
{
"id": 1,
"seek": 0,
"start": 5.28,
"end": 6.82,
"text": " We have 18A's",
"tokens": [
492,
362,
2443,
32,
311
],
"temperature": 0.0,
"avg_logprob": -0.4247800021701389,
"compression_ratio": 6.281818181818182,
"no_speech_prob": 0.3518604338169098,
"confidence": 0.189,
"words": [
{
"text": "We",
"start": 5.28,
"end": 5.6,
"confidence": 0.056
},
{
"text": "have",
"start": 5.6,
"end": 5.72,
"confidence": 0.61
},
{
"text": "18A's",
"start": 5.72,
"end": 6.82,
"confidence": 0.191
}
]
},
{
"id": 2,
"seek": 700,
"start": 7.02,
"end": 24.14,
"text": " I'm all around my business and I'm all around my business and I'm all around my business",
"tokens": [
286,
478,
439,
926,
452,
1606,
293,
286,
478,
439,
926,
452,
1606,
293,
286,
478,
439,
926,
452,
1606
],
"temperature": 0.0,
"avg_logprob": -0.8006511529286703,
"compression_ratio": 2.1463414634146343,
"no_speech_prob": 0.1812065988779068,
"confidence": 0.476,
"words": [
{
"text": "I'm",
"start": 7.02,
"end": 11.1,
"confidence": 0.124
},
{
"text": "all",
"start": 11.1,
"end": 13.62,
"confidence": 0.143
},
{
"text": "around",
"start": 13.62,
"end": 13.66,
"confidence": 0.517
},
{
"text": "my",
"start": 13.66,
"end": 13.7,
"confidence": 0.294
},
{
"text": "business",
"start": 13.7,
"end": 13.74,
"confidence": 0.931
},
{
"text": "and",
"start": 13.74,
"end": 14.08,
"confidence": 0.249
},
{
"text": "I'm",
"start": 14.08,
"end": 14.48,
"confidence": 0.379
},
{
"text": "all",
"start": 14.48,
"end": 14.68,
"confidence": 0.368
},
{
"text": "around",
"start": 14.68,
"end": 14.72,
"confidence": 0.892
},
{
"text": "my",
"start": 14.72,
"end": 14.76,
"confidence": 0.743
},
{
"text": "business",
"start": 14.76,
"end": 14.8,
"confidence": 0.981
},
{
"text": "and",
"start": 14.8,
"end": 15.04,
"confidence": 0.391
},
{
"text": "I'm",
"start": 15.04,
"end": 16.06,
"confidence": 0.861
},
{
"text": "all",
"start": 16.06,
"end": 16.12,
"confidence": 0.674
},
{
"text": "around",
"start": 16.12,
"end": 16.8,
"confidence": 0.932
},
{
"text": "my",
"start": 16.8,
"end": 21.82,
"confidence": 0.765
},
{
"text": "business",
"start": 21.82,
"end": 24.14,
"confidence": 0.977
}
]
},
{
"id": 3,
"seek": 3100,
"start": 31.24,
"end": 36.52,
"text": " I got a little bit of a problem with that, and you want to have the advice down",
"tokens": [
286,
658,
257,
707,
857,
295,
257,
1154,
365,
300,
11,
293,
291,
528,
281,
362,
264,
5192,
760
],
"temperature": 0.0,
"avg_logprob": -1.0431414517489346,
"compression_ratio": 1.8074866310160427,
"no_speech_prob": 0.09527108818292618,
"confidence": 0.336,
"words": [
{
"text": "I",
"start": 31.24,
"end": 31.66,
"confidence": 0.447
},
{
"text": "got",
"start": 31.66,
"end": 31.96,
"confidence": 0.219
},
{
"text": "a",
"start": 31.96,
"end": 33.32,
"confidence": 0.159
},
{
"text": "little",
"start": 33.32,
"end": 33.52,
"confidence": 0.104
},
{
"text": "bit",
"start": 33.52,
"end": 33.74,
"confidence": 0.919
},
{
"text": "of",
"start": 33.74,
"end": 33.86,
"confidence": 0.903
},
{
"text": "a",
"start": 33.86,
"end": 33.94,
"confidence": 0.347
},
{
"text": "problem",
"start": 33.94,
"end": 34.12,
"confidence": 0.226
},
{
"text": "with",
"start": 34.12,
"end": 34.38,
"confidence": 0.395
},
{
"text": "that,",
"start": 34.38,
"end": 34.52,
"confidence": 0.175
},
{
"text": "and",
"start": 34.52,
"end": 34.58,
"confidence": 0.331
},
{
"text": "you",
"start": 34.58,
"end": 34.7,
"confidence": 0.511
},
{
"text": "want",
"start": 34.7,
"end": 35.0,
"confidence": 0.533
},
{
"text": "to",
"start": 35.0,
"end": 35.06,
"confidence": 0.568
},
{
"text": "have",
"start": 35.06,
"end": 35.36,
"confidence": 0.857
},
{
"text": "the",
"start": 35.36,
"end": 35.52,
"confidence": 0.519
},
{
"text": "advice",
"start": 35.52,
"end": 35.88,
"confidence": 0.077
},
{
"text": "down",
"start": 35.88,
"end": 36.52,
"confidence": 0.231
}
]
},
{
"id": 4,
"seek": 3100,
"start": 37.68,
"end": 41.92,
"text": " My goal is to reach these things, not to reach out to them and they're out of the bag",
"tokens": [
1222,
3387,
307,
281,
2524,
613,
721,
11,
406,
281,
2524,
484,
281,
552,
293,
436,
434,
484,
295,
264,
3411
],
"temperature": 0.0,
"avg_logprob": -1.0431414517489346,
"compression_ratio": 1.8074866310160427,
"no_speech_prob": 0.09527108818292618,
"confidence": 0.312,
"words": [
{
"text": "My",
"start": 37.68,
"end": 38.04,
"confidence": 0.443
},
{
"text": "goal",
"start": 38.04,
"end": 38.14,
"confidence": 0.106
},
{
"text": "is",
"start": 38.14,
"end": 38.34,
"confidence": 0.697
},
{
"text": "to",
"start": 38.34,
"end": 38.68,
"confidence": 0.952
},
{
"text": "reach",
"start": 38.68,
"end": 38.84,
"confidence": 0.185
},
{
"text": "these",
"start": 38.84,
"end": 39.12,
"confidence": 0.19
},
{
"text": "things,",
"start": 39.12,
"end": 39.62,
"confidence": 0.06
},
{
"text": "not",
"start": 39.62,
"end": 40.1,
"confidence": 0.865
},
{
"text": "to",
"start": 40.1,
"end": 40.22,
"confidence": 0.13
},
{
"text": "reach",
"start": 40.22,
"end": 40.36,
"confidence": 0.433
},
{
"text": "out",
"start": 40.36,
"end": 40.58,
"confidence": 0.376
},
{
"text": "to",
"start": 40.58,
"end": 40.72,
"confidence": 0.771
},
{
"text": "them",
"start": 40.72,
"end": 40.84,
"confidence": 0.296
},
{
"text": "and",
"start": 40.84,
"end": 40.88,
"confidence": 0.254
},
{
"text": "they're",
"start": 40.88,
"end": 41.1,
"confidence": 0.244
},
{
"text": "out",
"start": 41.1,
"end": 41.34,
"confidence": 0.162
},
{
"text": "of",
"start": 41.34,
"end": 41.58,
"confidence": 0.722
},
{
"text": "the",
"start": 41.58,
"end": 41.68,
"confidence": 0.562
},
{
"text": "bag",
"start": 41.68,
"end": 41.92,
"confidence": 0.277
}
]
},
{
"id": 5,
"seek": 3100,
"start": 43.52,
"end": 47.08,
"text": " And I can't see anything else, I don't want to hear anything else",
"tokens": [
400,
286,
393,
380,
536,
1340,
1646,
11,
286,
500,
380,
528,
281,
1568,
1340,
1646
],
"temperature": 0.0,
"avg_logprob": -1.0431414517489346,
"compression_ratio": 1.8074866310160427,
"no_speech_prob": 0.09527108818292618,
"confidence": 0.326,
"words": [
{
"text": "And",
"start": 43.52,
"end": 43.56,
"confidence": 0.363
},
{
"text": "I",
"start": 43.56,
"end": 44.12,
"confidence": 0.396
},
{
"text": "can't",
"start": 44.12,
"end": 44.9,
"confidence": 0.248
},
{
"text": "see",
"start": 44.9,
"end": 45.08,
"confidence": 0.22
},
{
"text": "anything",
"start": 45.08,
"end": 45.64,
"confidence": 0.254
},
{
"text": "else,",
"start": 45.64,
"end": 45.68,
"confidence": 0.295
},
{
"text": "I",
"start": 45.68,
"end": 46.4,
"confidence": 0.191
},
{
"text": "don't",
"start": 46.4,
"end": 46.56,
"confidence": 0.615
},
{
"text": "want",
"start": 46.56,
"end": 46.6,
"confidence": 0.269
},
{
"text": "to",
"start": 46.6,
"end": 46.64,
"confidence": 0.744
},
{
"text": "hear",
"start": 46.64,
"end": 46.76,
"confidence": 0.262
},
{
"text": "anything",
"start": 46.76,
"end": 46.88,
"confidence": 0.287
},
{
"text": "else",
"start": 46.88,
"end": 47.08,
"confidence": 0.311
}
]
},
{
"id": 6,
"seek": 3100,
"start": 48.24,
"end": 49.68,
"text": " I'm at the least, I'm not making the tag",
"tokens": [
286,
478,
412,
264,
1935,
11,
286,
478,
406,
1455,
264,
6162
],
"temperature": 0.0,
"avg_logprob": -1.0431414517489346,
"compression_ratio": 1.8074866310160427,
"no_speech_prob": 0.09527108818292618,
"confidence": 0.379,
"words": [
{
"text": "I'm",
"start": 48.24,
"end": 48.48,
"confidence": 0.231
},
{
"text": "at",
"start": 48.48,
"end": 48.52,
"confidence": 0.206
},
{
"text": "the",
"start": 48.52,
"end": 48.68,
"confidence": 0.811
},
{
"text": "least,",
"start": 48.68,
"end": 48.94,
"confidence": 0.235
},
{
"text": "I'm",
"start": 48.94,
"end": 49.0,
"confidence": 0.424
},
{
"text": "not",
"start": 49.0,
"end": 49.12,
"confidence": 0.938
},
{
"text": "making",
"start": 49.12,
"end": 49.26,
"confidence": 0.293
},
{
"text": "the",
"start": 49.26,
"end": 49.44,
"confidence": 0.747
},
{
"text": "tag",
"start": 49.44,
"end": 49.68,
"confidence": 0.298
}
]
},
{
"id": 7,
"seek": 3100,
"start": 51.46,
"end": 52.88,
"text": " I can't see anything else",
"tokens": [
286,
393,
380,
536,
1340,
1646
],
"temperature": 0.0,
"avg_logprob": -1.0431414517489346,
"compression_ratio": 1.8074866310160427,
"no_speech_prob": 0.09527108818292618,
"confidence": 0.412,
"words": [
{
"text": "I",
"start": 51.46,
"end": 51.5,
"confidence": 0.173
},
{
"text": "can't",
"start": 51.5,
"end": 51.86,
"confidence": 0.374
},
{
"text": "see",
"start": 51.86,
"end": 52.2,
"confidence": 0.34
},
{
"text": "anything",
"start": 52.2,
"end": 52.5,
"confidence": 0.915
},
{
"text": "else",
"start": 52.5,
"end": 52.88,
"confidence": 0.653
}
]
},
{
"id": 8,
"seek": 3100,
"start": 53.16,
"end": 54.7,
"text": " Yeah, I'm taking a heavy out of the bag",
"tokens": [
865,
11,
286,
478,
1940,
257,
4676,
484,
295,
264,
3411
],
"temperature": 0.0,
"avg_logprob": -1.0431414517489346,
"compression_ratio": 1.8074866310160427,
"no_speech_prob": 0.09527108818292618,
"confidence": 0.28,
"words": [
{
"text": "Yeah,",
"start": 53.16,
"end": 53.38,
"confidence": 0.569
},
{
"text": "I'm",
"start": 53.38,
"end": 53.46,
"confidence": 0.59
},
{
"text": "taking",
"start": 53.46,
"end": 53.64,
"confidence": 0.881
},
{
"text": "a",
"start": 53.64,
"end": 53.76,
"confidence": 0.177
},
{
"text": "heavy",
"start": 53.76,
"end": 54.04,
"confidence": 0.1
},
{
"text": "out",
"start": 54.04,
"end": 54.28,
"confidence": 0.073
},
{
"text": "of",
"start": 54.28,
"end": 54.42,
"confidence": 0.948
},
{
"text": "the",
"start": 54.42,
"end": 54.6,
"confidence": 0.168
},
{
"text": "bag",
"start": 54.6,
"end": 54.7,
"confidence": 0.084
}
]
},
{
"id": 9,
"seek": 5600,
"start": 56.46,
"end": 59.78,
"text": " We're on the highway, we're on the highway, we're on the highway",
"tokens": [
492,
434,
322,
264,
17205,
11,
321,
434,
322,
264,
17205,
11,
321,
434,
322,
264,
17205
],
"temperature": 0.0,
"avg_logprob": -0.750541016295716,
"compression_ratio": 1.901840490797546,
"no_speech_prob": 0.01289769820868969,
"confidence": 0.498,
"words": [
{
"text": "We're",
"start": 56.46,
"end": 56.94,
"confidence": 0.281
},
{
"text": "on",
"start": 56.94,
"end": 57.18,
"confidence": 0.116
},
{
"text": "the",
"start": 57.18,
"end": 57.26,
"confidence": 0.261
},
{
"text": "highway,",
"start": 57.26,
"end": 57.78,
"confidence": 0.129
},
{
"text": "we're",
"start": 57.78,
"end": 58.32,
"confidence": 0.604
},
{
"text": "on",
"start": 58.32,
"end": 58.44,
"confidence": 0.813
},
{
"text": "the",
"start": 58.44,
"end": 58.74,
"confidence": 0.861
},
{
"text": "highway,",
"start": 58.74,
"end": 58.94,
"confidence": 0.925
},
{
"text": "we're",
"start": 58.94,
"end": 58.98,
"confidence": 0.742
},
{
"text": "on",
"start": 58.98,
"end": 59.02,
"confidence": 0.82
},
{
"text": "the",
"start": 59.02,
"end": 59.18,
"confidence": 0.937
},
{
"text": "highway",
"start": 59.18,
"end": 59.78,
"confidence": 0.948
}
]
},
{
"id": 10,
"seek": 5600,
"start": 60.52,
"end": 66.02,
"text": " We're on the highway, we're on the highway",
"tokens": [
492,
434,
322,
264,
17205,
11,
321,
434,
322,
264,
17205
],
"temperature": 0.0,
"avg_logprob": -0.750541016295716,
"compression_ratio": 1.901840490797546,
"no_speech_prob": 0.01289769820868969,
"confidence": 0.785,
"words": [
{
"text": "We're",
"start": 60.52,
"end": 60.66,
"confidence": 0.62
},
{
"text": "on",
"start": 60.66,
"end": 60.84,
"confidence": 0.437
},
{
"text": "the",
"start": 60.84,
"end": 60.88,
"confidence": 0.94
},
{
"text": "highway,",
"start": 60.88,
"end": 61.16,
"confidence": 0.977
},
{
"text": "we're",
"start": 61.16,
"end": 63.48,
"confidence": 0.865
},
{
"text": "on",
"start": 63.48,
"end": 63.62,
"confidence": 0.911
},
{
"text": "the",
"start": 63.62,
"end": 63.7,
"confidence": 0.892
},
{
"text": "highway",
"start": 63.7,
"end": 66.02,
"confidence": 0.945
}
]
},
{
"id": 11,
"seek": 5600,
"start": 66.02,
"end": 69.04,
"text": " We want to hear that, this is the case, we know we can't get that much of our business",
"tokens": [
492,
528,
281,
1568,
300,
11,
341,
307,
264,
1389,
11,
321,
458,
321,
393,
380,
483,
300,
709,
295,
527,
1606
],
"temperature": 0.0,
"avg_logprob": -0.750541016295716,
"compression_ratio": 1.901840490797546,
"no_speech_prob": 0.01289769820868969,
"confidence": 0.371,
"words": [
{
"text": "We",
"start": 66.02,
"end": 66.06,
"confidence": 0.369
},
{
"text": "want",
"start": 66.06,
"end": 66.1,
"confidence": 0.335
},
{
"text": "to",
"start": 66.1,
"end": 66.14,
"confidence": 0.662
},
{
"text": "hear",
"start": 66.14,
"end": 66.18,
"confidence": 0.323
},
{
"text": "that,",
"start": 66.18,
"end": 66.22,
"confidence": 0.878
},
{
"text": "this",
"start": 66.22,
"end": 66.26,
"confidence": 0.265
},
{
"text": "is",
"start": 66.26,
"end": 66.3,
"confidence": 0.806
},
{
"text": "the",
"start": 66.3,
"end": 66.34,
"confidence": 0.286
},
{
"text": "case,",
"start": 66.34,
"end": 66.38,
"confidence": 0.195
},
{
"text": "we",
"start": 66.38,
"end": 66.92,
"confidence": 0.423
},
{
"text": "know",
"start": 66.92,
"end": 66.96,
"confidence": 0.736
},
{
"text": "we",
"start": 66.96,
"end": 67.06,
"confidence": 0.814
},
{
"text": "can't",
"start": 67.06,
"end": 67.3,
"confidence": 0.339
},
{
"text": "get",
"start": 67.3,
"end": 67.4,
"confidence": 0.219
},
{
"text": "that",
"start": 67.4,
"end": 67.64,
"confidence": 0.209
},
{
"text": "much",
"start": 67.64,
"end": 68.46,
"confidence": 0.213
},
{
"text": "of",
"start": 68.46,
"end": 68.7,
"confidence": 0.59
},
{
"text": "our",
"start": 68.7,
"end": 68.74,
"confidence": 0.679
},
{
"text": "business",
"start": 68.74,
"end": 69.04,
"confidence": 0.077
}
]
},
{
"id": 12,
"seek": 5600,
"start": 69.04,
"end": 72.64,
"text": " So I guess we'll be somewhere in our place, but it's not over",
"tokens": [
407,
286,
2041,
321,
603,
312,
4079,
294,
527,
1081,
11,
457,
309,
311,
406,
670
],
"temperature": 0.0,
"avg_logprob": -0.750541016295716,
"compression_ratio": 1.901840490797546,
"no_speech_prob": 0.01289769820868969,
"confidence": 0.435,
"words": [
{
"text": "So",
"start": 69.04,
"end": 70.38,
"confidence": 0.736
},
{
"text": "I",
"start": 70.38,
"end": 70.52,
"confidence": 0.675
},
{
"text": "guess",
"start": 70.52,
"end": 70.68,
"confidence": 0.721
},
{
"text": "we'll",
"start": 70.68,
"end": 71.04,
"confidence": 0.462
},
{
"text": "be",
"start": 71.04,
"end": 71.22,
"confidence": 0.27
},
{
"text": "somewhere",
"start": 71.22,
"end": 71.36,
"confidence": 0.369
},
{
"text": "in",
"start": 71.36,
"end": 71.4,
"confidence": 0.107
},
{
"text": "our",
"start": 71.4,
"end": 71.5,
"confidence": 0.192
},
{
"text": "place,",
"start": 71.5,
"end": 71.92,
"confidence": 0.38
},
{
"text": "but",
"start": 71.92,
"end": 72.14,
"confidence": 0.431
},
{
"text": "it's",
"start": 72.14,
"end": 72.36,
"confidence": 0.939
},
{
"text": "not",
"start": 72.36,
"end": 72.4,
"confidence": 0.552
},
{
"text": "over",
"start": 72.4,
"end": 72.64,
"confidence": 0.308
}
]
},
{
"id": 13,
"seek": 7400,
"start": 74.02,
"end": 78.4,
"text": " Okay, it's not over, it's not over, it's not over",
"tokens": [
50364,
1033,
11,
309,
311,
406,
670,
11,
309,
311,
406,
670,
11,
309,
311,
406,
670,
51164
],
"temperature": 0.0,
"avg_logprob": -0.405017099882427,
"compression_ratio": 1.6896551724137931,
"no_speech_prob": 0.01679050177335739,
"confidence": 0.705,
"words": [
{
"text": "Okay,",
"start": 74.02,
"end": 75.9,
"confidence": 0.147
},
{
"text": "it's",
"start": 75.9,
"end": 76.16,
"confidence": 0.589
},
{
"text": "not",
"start": 76.16,
"end": 76.22,
"confidence": 0.956
},
{
"text": "over,",
"start": 76.22,
"end": 76.76,
"confidence": 0.89
},
{
"text": "it's",
"start": 76.76,
"end": 77.08,
"confidence": 0.647
},
{
"text": "not",
"start": 77.08,
"end": 77.18,
"confidence": 0.897
},
{
"text": "over,",
"start": 77.18,
"end": 77.36,
"confidence": 0.962
},
{
"text": "it's",
"start": 77.36,
"end": 77.86,
"confidence": 0.869
},
{
"text": "not",
"start": 77.86,
"end": 78.26,
"confidence": 0.955
},
{
"text": "over",
"start": 78.26,
"end": 78.4,
"confidence": 0.934
}
]
}
],
"language": "en"
}