ecker committed on
Commit
a669b9a
1 Parent(s): f12f07a

added: SH2 James dataset

Browse files
Files changed (35) hide show
  1. finetunes/james-sunderland/dataset/lxgbsm_00000.wav +3 -0
  2. finetunes/james-sunderland/dataset/lxgbsm_00001.wav +3 -0
  3. finetunes/james-sunderland/dataset/lxgbsm_00002.wav +3 -0
  4. finetunes/james-sunderland/dataset/lxgbsm_00003.wav +3 -0
  5. finetunes/james-sunderland/dataset/lxgbsm_00004.wav +3 -0
  6. finetunes/james-sunderland/dataset/lxgbsm_00005.wav +3 -0
  7. finetunes/james-sunderland/dataset/lxgbsm_00006.wav +3 -0
  8. finetunes/james-sunderland/dataset/lxgbsm_00007.wav +3 -0
  9. finetunes/james-sunderland/dataset/lxgbsm_00008.wav +3 -0
  10. finetunes/james-sunderland/dataset/lxgbsm_00009.wav +3 -0
  11. finetunes/james-sunderland/dataset/lxgbsm_00010.wav +3 -0
  12. finetunes/james-sunderland/dataset/lxgbsm_00011.wav +3 -0
  13. finetunes/james-sunderland/dataset/train.txt +32 -0
  14. finetunes/james-sunderland/dataset/train.yaml +147 -0
  15. finetunes/james-sunderland/dataset/whisper.json +1066 -0
  16. finetunes/james-sunderland/dataset/ynoeld_00000.wav +3 -0
  17. finetunes/james-sunderland/dataset/ynoeld_00001.wav +3 -0
  18. finetunes/james-sunderland/dataset/ynoeld_00002.wav +3 -0
  19. finetunes/james-sunderland/dataset/ynoeld_00003.wav +3 -0
  20. finetunes/james-sunderland/dataset/ynoeld_00004.wav +3 -0
  21. finetunes/james-sunderland/dataset/ynoeld_00005.wav +3 -0
  22. finetunes/james-sunderland/dataset/ynoeld_00006.wav +3 -0
  23. finetunes/james-sunderland/dataset/ynoeld_00007.wav +3 -0
  24. finetunes/james-sunderland/dataset/ynoeld_00008.wav +3 -0
  25. finetunes/james-sunderland/dataset/ynoeld_00009.wav +3 -0
  26. finetunes/james-sunderland/dataset/ynoeld_00010.wav +3 -0
  27. finetunes/james-sunderland/dataset/ynoeld_00011.wav +3 -0
  28. finetunes/james-sunderland/dataset/ynoeld_00012.wav +3 -0
  29. finetunes/james-sunderland/dataset/ynoeld_00013.wav +3 -0
  30. finetunes/james-sunderland/dataset/ynoeld_00014.wav +3 -0
  31. finetunes/james-sunderland/dataset/ynoeld_00015.wav +3 -0
  32. finetunes/james-sunderland/dataset/ynoeld_00016.wav +3 -0
  33. finetunes/james-sunderland/dataset/ynoeld_00017.wav +3 -0
  34. finetunes/james-sunderland/dataset/ynoeld_00018.wav +3 -0
  35. finetunes/james-sunderland/dataset/ynoeld_00019.wav +3 -0
finetunes/james-sunderland/dataset/lxgbsm_00000.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cb65d9c3571f12f6a3ff6de1f43a468466fec3328a620bc271e971c816c13cdd
3
+ size 1234880
finetunes/james-sunderland/dataset/lxgbsm_00001.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfc5673c594825be558acb0256c56c5a8808d0eb0e9630183fe2a3e9b85f4e9a
3
+ size 1587680
finetunes/james-sunderland/dataset/lxgbsm_00002.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ee6c2a46fb6289374844e160db4173d9572bf046230819f0bf6f4ce4d6433c26
3
+ size 1587680
finetunes/james-sunderland/dataset/lxgbsm_00003.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f97fb2cf229a4e3849b166e9276d5570237a8eb04b70a96f5e47cc641f24726d
3
+ size 1940480
finetunes/james-sunderland/dataset/lxgbsm_00004.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d33ecb3eb38426364ef3f10fb746c3f52c2dd6eb3188418bb5fdb0559ce4919a
3
+ size 1587680
finetunes/james-sunderland/dataset/lxgbsm_00005.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:02de0317585aab8cd30180587c37680bef4202a11f18605062bf0a85812a9f04
3
+ size 1940480
finetunes/james-sunderland/dataset/lxgbsm_00006.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:583e4417dcafc5dc1b6f55ed5e24f474a5c5513c318e51fd360293c626aea3ec
3
+ size 1587680
finetunes/james-sunderland/dataset/lxgbsm_00007.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2902802b9ad97f5b0fa72e245a598714c2289ea5d8f1b415e928ed6abba774e3
3
+ size 2116880
finetunes/james-sunderland/dataset/lxgbsm_00008.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5c6ee7a8d1cceffb255a5d2c959a7af2ee0f5ba1238f2e9eebf25fdf14068168
3
+ size 1764080
finetunes/james-sunderland/dataset/lxgbsm_00009.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd8228c3b3ffb4304c0c3bf859361f1a3b68bdd7a9277673737321158bf81466
3
+ size 1764080
finetunes/james-sunderland/dataset/lxgbsm_00010.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ce2d9d9a9faaf12c78a9aa70af88664415a00af75bba7f024400ffdf727c04a
3
+ size 1764080
finetunes/james-sunderland/dataset/lxgbsm_00011.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2700fcaf46c9f9b99bdf1a95d135bbe4451962c5f7991ed90a954b2d6e777f10
3
+ size 2646080
finetunes/james-sunderland/dataset/train.txt ADDED
@@ -0,0 +1,32 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ lxgbsm_00000.wav|I'm kind of lost. I'm looking for Silent Hill. Silent Hill? Is this the right way?
2
+ lxgbsm_00001.wav|Well, there's the hotel 2, I guess. There's the hotel 2, I guess. The one on the lake? I wonder if it's still there.
3
+ lxgbsm_00002.wav|You're coming with me? Is it dangerous? I'll be careful. I guess I really don't care if it's dangerous or not.
4
+ lxgbsm_00003.wav|I'm going to town either way. I'm looking for someone. I'm looking for someone. Someone very important to me.
5
+ lxgbsm_00004.wav|I'm looking for Mary. Have you seen her? Without Mary, I just can't go on.
6
+ lxgbsm_00005.wav|I'd do anything if I could be with her again. I'm going to go look for her. I wish I knew. I killed her. Three years ago.
7
+ lxgbsm_00006.wav|Last year. But I got a letter from her. I got a letter from her. How do you know about Mary? You really seem to care about her.
8
+ lxgbsm_00007.wav|Is that why you're here too? You're not Mary. You're really not Mary. You're alive! I thought that thing killed you. Are you hurt bad?
9
+ lxgbsm_00008.wav|Your face, your voice, just your hair and... I was confused. There are all sorts of strange things around here.
10
+ lxgbsm_00009.wav|This is no place for a kid. Eddie told me. Who's Rachel? What's that letter? It's time to end this nightmare.
11
+ lxgbsm_00010.wav|What the hell is it? I didn't come here to play, you know. You liar! Don't be ridiculous. How can you sit there and eat pizza?
12
+ lxgbsm_00011.wav|You! It was you, wasn't it? You're the one who stepped on my hand. I'm done with you. Forget you. Someone very important to me. You're not Mary.
13
+ ynoeld_00000.wav|It's you. It's you. But I don't need you anymore.
14
+ ynoeld_00001.wav|How old are you? Are you still here? Are you okay? What happened to you?
15
+ ynoeld_00002.wav|We met in the apartment building. We met in the apartment building. Sure is quiet here, huh?
16
+ ynoeld_00003.wav|What are you doing, Laura? Aren't you Maria?
17
+ ynoeld_00004.wav|So, you're Maria? You're Maria? What's a little girl like you doing here, anyway?
18
+ ynoeld_00005.wav|I didn't mean to scare you. Are you alone here, Eddie?
19
+ ynoeld_00006.wav|James Sunderland. James. My name's James.
20
+ ynoeld_00007.wav|Eddie? Laura? Laura. Maria? Maria. Mary? Mary? Mary?
21
+ ynoeld_00008.wav|Is that her name? Who is that girl, anyhow?
22
+ ynoeld_00009.wav|Yeah. Yeah. Yes! Okay. That's right.
23
+ ynoeld_00010.wav|Oh, yeah. I understand now. I believe you.
24
+ ynoeld_00011.wav|No. No. No, I... No, you're not.
25
+ ynoeld_00012.wav|Nothing. Oh, nothing. I guess I really don't care.
26
+ ynoeld_00013.wav|I don't know. Sorry.
27
+ ynoeld_00014.wav|What? Do what? Tell me what happened.
28
+ ynoeld_00015.wav|Why can't you just tell me?
29
+ ynoeld_00016.wav|All I want from you is an answer. How do you know about that?
30
+ ynoeld_00017.wav|Is there any other way? Don't you remember?
31
+ ynoeld_00018.wav|Later, okay?
32
+ ynoeld_00019.wav|Stay right there. I'll be there soon. I'll be there soon. Thanks.
finetunes/james-sunderland/dataset/train.yaml ADDED
@@ -0,0 +1,147 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ name: james-finetune
2
+ model: extensibletrainer
3
+ scale: 1
4
+ gpu_ids: [0] # Redundant: the way you launch the training script will set this
5
+ start_step: 0
6
+ checkpointing_enabled: true
7
+ fp16: false
8
+ wandb: false
9
+ use_tb_logger: true
10
+
11
+ datasets:
12
+ train:
13
+ name: james-train
14
+ n_workers: 2
15
+ batch_size: 32
16
+ mode: paired_voice_audio
17
+ path: ./training/james/train.txt
18
+ fetcher_mode: ['lj']
19
+ phase: train
20
+ max_wav_length: 255995
21
+ max_text_length: 200
22
+ sample_rate: 22050
23
+ load_conditioning: True
24
+ num_conditioning_candidates: 2
25
+ conditioning_length: 44000
26
+ use_bpe_tokenizer: True
27
+ tokenizer_vocab: ./models/tortoise/bpe_lowercase_asr_256.json
28
+ load_aligned_codes: False
29
+ val: # I really do not care about validation right now
30
+ name: james-val
31
+ n_workers: 1
32
+ batch_size: 1
33
+ mode: paired_voice_audio
34
+ path: ./training/james/train.txt
35
+ fetcher_mode: ['lj']
36
+ phase: val
37
+ max_wav_length: 255995
38
+ max_text_length: 200
39
+ sample_rate: 22050
40
+ load_conditioning: True
41
+ num_conditioning_candidates: 2
42
+ conditioning_length: 44000
43
+ use_bpe_tokenizer: True
44
+ tokenizer_vocab: ./models/tortoise/bpe_lowercase_asr_256.json
45
+ load_aligned_codes: False
46
+
47
+ steps:
48
+ gpt_train:
49
+ training: gpt
50
+ loss_log_buffer: 500
51
+
52
+ # Generally follows the recipe from the DALLE paper.
53
+ optimizer: adamw # this should be adamw_zero if you're using distributed training
54
+ optimizer_params:
55
+ lr: !!float 0.0001 # originally: 1e-4
56
+ weight_decay: !!float 1e-2
57
+ beta1: 0.9
58
+ beta2: 0.96
59
+ clip_grad_eps: 4
60
+
61
+ injectors:
62
+ paired_to_mel:
63
+ type: torch_mel_spectrogram
64
+ mel_norm_file: ./models/tortoise/clips_mel_norms.pth
65
+ in: wav
66
+ out: paired_mel
67
+ paired_cond_to_mel:
68
+ type: for_each
69
+ subtype: torch_mel_spectrogram
70
+ mel_norm_file: ./models/tortoise/clips_mel_norms.pth
71
+ in: conditioning
72
+ out: paired_conditioning_mel
73
+ to_codes:
74
+ type: discrete_token
75
+ in: paired_mel
76
+ out: paired_mel_codes
77
+ dvae_config: "./models/tortoise/train_diffusion_vocoder_22k_level.yml"
78
+ paired_fwd_text:
79
+ type: generator
80
+ generator: gpt
81
+ in: [paired_conditioning_mel, padded_text, text_lengths, paired_mel_codes, wav_lengths]
82
+ out: [loss_text_ce, loss_mel_ce, logits]
83
+ losses:
84
+ text_ce:
85
+ type: direct
86
+ weight: 0.01
87
+ key: loss_text_ce
88
+ mel_ce:
89
+ type: direct
90
+ weight: 1
91
+ key: loss_mel_ce
92
+
93
+ networks:
94
+ gpt:
95
+ type: generator
96
+ which_model_G: unified_voice2 # None of the unified_voice*.py files exactly match the tortoise inference code: versions 3 and 4 have an "alignment_head" (purpose unclear), and version 2 lacks the types=1 parameter.
97
+ kwargs:
98
+ layers: 30 # originally: 8
99
+ model_dim: 1024 # originally: 512
100
+ heads: 16 # originally: 8
101
+ max_text_tokens: 402 # originally: 120
102
+ max_mel_tokens: 604 # originally: 250
103
+ max_conditioning_inputs: 2 # originally: 1
104
+ mel_length_compression: 1024
105
+ number_text_tokens: 256 # supposed to be 255 for newer unified_voice files
106
+ number_mel_codes: 8194
107
+ start_mel_token: 8192
108
+ stop_mel_token: 8193
109
+ start_text_token: 255
110
+ train_solo_embeddings: False # missing in uv3/4
111
+ use_mel_codes_as_input: True # also missing in uv3/4
112
+ checkpointing: True
113
+ #types: 1 # this is MISSING, but in my analysis 1 is equivalent to not having it.
114
+ #only_alignment_head: False # uv3/4
115
+
116
+ path:
117
+ pretrain_model_gpt: './models/tortoise/autoregressive.pth'
118
+ strict_load: true
119
+ # resume_state: './training/james-finetune//training_state//50.state'
120
+
121
+ train:
122
+ niter: 500
123
+ warmup_iter: -1
124
+ mega_batch_factor: 16
125
+ val_freq: 500
126
+
127
+ ema_enabled: false # I really don't think EMA matters
128
+
129
+ default_lr_scheme: MultiStepLR
130
+ gen_lr_steps: [9, 18, 25, 33] #[50000, 100000, 140000, 180000]
131
+ lr_gamma: 0.5
132
+
133
+ eval:
134
+ output_state: gen
135
+ injectors:
136
+ gen_inj_eval:
137
+ type: generator
138
+ generator: generator
139
+ in: hq
140
+ out: [gen, codebook_commitment_loss]
141
+
142
+ logger:
143
+ print_freq: 5
144
+ save_checkpoint_freq: 25
145
+ visuals: [gen, mel]
146
+ visual_debug_rate: 5
147
+ is_mel_spectrogram: true
finetunes/james-sunderland/dataset/whisper.json ADDED
@@ -0,0 +1,1066 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "lxgbsm.wav": {
3
+ "text": " I'm kind of lost. I'm looking for Silent Hill. Silent Hill? Is this the right way? Well, there's the hotel 2, I guess. There's the hotel 2, I guess. The one on the lake? I wonder if it's still there. You're coming with me? Is it dangerous? I'll be careful. I guess I really don't care if it's dangerous or not. I'm going to town either way. I'm looking for someone. I'm looking for someone. Someone very important to me. I'm looking for Mary. Have you seen her? Without Mary, I just can't go on. I'd do anything if I could be with her again. I'm going to go look for her. I wish I knew. I killed her. Three years ago. Last year. But I got a letter from her. I got a letter from her. How do you know about Mary? You really seem to care about her. Is that why you're here too? You're not Mary. You're really not Mary. You're alive! I thought that thing killed you. Are you hurt bad? Your face, your voice, just your hair and... I was confused. There are all sorts of strange things around here. This is no place for a kid. Eddie told me. Who's Rachel? What's that letter? It's time to end this nightmare. What the hell is it? I didn't come here to play, you know. You liar! Don't be ridiculous. How can you sit there and eat pizza? You! It was you, wasn't it? You're the one who stepped on my hand. I'm done with you. Forget you. Someone very important to me. You're not Mary.",
4
+ "segments": [
5
+ {
6
+ "id": 0,
7
+ "seek": 0,
8
+ "start": 0.0,
9
+ "end": 7.0,
10
+ "text": " I'm kind of lost. I'm looking for Silent Hill. Silent Hill? Is this the right way?",
11
+ "tokens": [
12
+ 314,
13
+ 1101,
14
+ 1611,
15
+ 286,
16
+ 2626,
17
+ 13,
18
+ 314,
19
+ 1101,
20
+ 2045,
21
+ 329,
22
+ 25083,
23
+ 3327,
24
+ 13,
25
+ 25083,
26
+ 3327,
27
+ 30,
28
+ 1148,
29
+ 428,
30
+ 262,
31
+ 826,
32
+ 835,
33
+ 30
34
+ ],
35
+ "temperature": 0.0,
36
+ "avg_logprob": -0.13657650896297988,
37
+ "compression_ratio": 1.6756756756756757,
38
+ "no_speech_prob": 0.0679725632071495
39
+ },
40
+ {
41
+ "id": 1,
42
+ "seek": 0,
43
+ "start": 7.0,
44
+ "end": 16.0,
45
+ "text": " Well, there's the hotel 2, I guess. There's the hotel 2, I guess. The one on the lake? I wonder if it's still there.",
46
+ "tokens": [
47
+ 3894,
48
+ 11,
49
+ 612,
50
+ 338,
51
+ 262,
52
+ 7541,
53
+ 362,
54
+ 11,
55
+ 314,
56
+ 4724,
57
+ 13,
58
+ 1318,
59
+ 338,
60
+ 262,
61
+ 7541,
62
+ 362,
63
+ 11,
64
+ 314,
65
+ 4724,
66
+ 13,
67
+ 383,
68
+ 530,
69
+ 319,
70
+ 262,
71
+ 13546,
72
+ 30,
73
+ 314,
74
+ 4240,
75
+ 611,
76
+ 340,
77
+ 338,
78
+ 991,
79
+ 612,
80
+ 13
81
+ ],
82
+ "temperature": 0.0,
83
+ "avg_logprob": -0.13657650896297988,
84
+ "compression_ratio": 1.6756756756756757,
85
+ "no_speech_prob": 0.0679725632071495
86
+ },
87
+ {
88
+ "id": 2,
89
+ "seek": 0,
90
+ "start": 16.0,
91
+ "end": 25.0,
92
+ "text": " You're coming with me? Is it dangerous? I'll be careful. I guess I really don't care if it's dangerous or not.",
93
+ "tokens": [
94
+ 921,
95
+ 821,
96
+ 2406,
97
+ 351,
98
+ 502,
99
+ 30,
100
+ 1148,
101
+ 340,
102
+ 4923,
103
+ 30,
104
+ 314,
105
+ 1183,
106
+ 307,
107
+ 8161,
108
+ 13,
109
+ 314,
110
+ 4724,
111
+ 314,
112
+ 1107,
113
+ 836,
114
+ 470,
115
+ 1337,
116
+ 611,
117
+ 340,
118
+ 338,
119
+ 4923,
120
+ 393,
121
+ 407,
122
+ 13
123
+ ],
124
+ "temperature": 0.0,
125
+ "avg_logprob": -0.13657650896297988,
126
+ "compression_ratio": 1.6756756756756757,
127
+ "no_speech_prob": 0.0679725632071495
128
+ },
129
+ {
130
+ "id": 3,
131
+ "seek": 2500,
132
+ "start": 25.0,
133
+ "end": 36.0,
134
+ "text": " I'm going to town either way. I'm looking for someone. I'm looking for someone. Someone very important to me.",
135
+ "tokens": [
136
+ 314,
137
+ 1101,
138
+ 1016,
139
+ 284,
140
+ 3240,
141
+ 2035,
142
+ 835,
143
+ 13,
144
+ 314,
145
+ 1101,
146
+ 2045,
147
+ 329,
148
+ 2130,
149
+ 13,
150
+ 314,
151
+ 1101,
152
+ 2045,
153
+ 329,
154
+ 2130,
155
+ 13,
156
+ 17877,
157
+ 845,
158
+ 1593,
159
+ 284,
160
+ 502,
161
+ 13
162
+ ],
163
+ "temperature": 0.0,
164
+ "avg_logprob": -0.07823550926064546,
165
+ "compression_ratio": 1.4959349593495934,
166
+ "no_speech_prob": 3.0241180866141804e-05
167
+ },
168
+ {
169
+ "id": 4,
170
+ "seek": 2500,
171
+ "start": 36.0,
172
+ "end": 45.0,
173
+ "text": " I'm looking for Mary. Have you seen her? Without Mary, I just can't go on.",
174
+ "tokens": [
175
+ 314,
176
+ 1101,
177
+ 2045,
178
+ 329,
179
+ 5335,
180
+ 13,
181
+ 8192,
182
+ 345,
183
+ 1775,
184
+ 607,
185
+ 30,
186
+ 9170,
187
+ 5335,
188
+ 11,
189
+ 314,
190
+ 655,
191
+ 460,
192
+ 470,
193
+ 467,
194
+ 319,
195
+ 13
196
+ ],
197
+ "temperature": 0.0,
198
+ "avg_logprob": -0.07823550926064546,
199
+ "compression_ratio": 1.4959349593495934,
200
+ "no_speech_prob": 3.0241180866141804e-05
201
+ },
202
+ {
203
+ "id": 5,
204
+ "seek": 4500,
205
+ "start": 45.0,
206
+ "end": 56.0,
207
+ "text": " I'd do anything if I could be with her again. I'm going to go look for her. I wish I knew. I killed her. Three years ago.",
208
+ "tokens": [
209
+ 314,
210
+ 1549,
211
+ 466,
212
+ 1997,
213
+ 611,
214
+ 314,
215
+ 714,
216
+ 307,
217
+ 351,
218
+ 607,
219
+ 757,
220
+ 13,
221
+ 314,
222
+ 1101,
223
+ 1016,
224
+ 284,
225
+ 467,
226
+ 804,
227
+ 329,
228
+ 607,
229
+ 13,
230
+ 314,
231
+ 4601,
232
+ 314,
233
+ 2993,
234
+ 13,
235
+ 314,
236
+ 2923,
237
+ 607,
238
+ 13,
239
+ 7683,
240
+ 812,
241
+ 2084,
242
+ 13
243
+ ],
244
+ "temperature": 0.0,
245
+ "avg_logprob": -0.06976071449175272,
246
+ "compression_ratio": 1.5182926829268293,
247
+ "no_speech_prob": 0.00030994918779470026
248
+ },
249
+ {
250
+ "id": 6,
251
+ "seek": 4500,
252
+ "start": 56.0,
253
+ "end": 65.0,
254
+ "text": " Last year. But I got a letter from her. I got a letter from her. How do you know about Mary? You really seem to care about her.",
255
+ "tokens": [
256
+ 4586,
257
+ 614,
258
+ 13,
259
+ 887,
260
+ 314,
261
+ 1392,
262
+ 257,
263
+ 3850,
264
+ 422,
265
+ 607,
266
+ 13,
267
+ 314,
268
+ 1392,
269
+ 257,
270
+ 3850,
271
+ 422,
272
+ 607,
273
+ 13,
274
+ 1374,
275
+ 466,
276
+ 345,
277
+ 760,
278
+ 546,
279
+ 5335,
280
+ 30,
281
+ 921,
282
+ 1107,
283
+ 1283,
284
+ 284,
285
+ 1337,
286
+ 546,
287
+ 607,
288
+ 13
289
+ ],
290
+ "temperature": 0.0,
291
+ "avg_logprob": -0.06976071449175272,
292
+ "compression_ratio": 1.5182926829268293,
293
+ "no_speech_prob": 0.00030994918779470026
294
+ },
295
+ {
296
+ "id": 7,
297
+ "seek": 6500,
298
+ "start": 65.0,
299
+ "end": 77.0,
300
+ "text": " Is that why you're here too? You're not Mary. You're really not Mary. You're alive! I thought that thing killed you. Are you hurt bad?",
301
+ "tokens": [
302
+ 1148,
303
+ 326,
304
+ 1521,
305
+ 345,
306
+ 821,
307
+ 994,
308
+ 1165,
309
+ 30,
310
+ 921,
311
+ 821,
312
+ 407,
313
+ 5335,
314
+ 13,
315
+ 921,
316
+ 821,
317
+ 1107,
318
+ 407,
319
+ 5335,
320
+ 13,
321
+ 921,
322
+ 821,
323
+ 6776,
324
+ 0,
325
+ 314,
326
+ 1807,
327
+ 326,
328
+ 1517,
329
+ 2923,
330
+ 345,
331
+ 13,
332
+ 4231,
333
+ 345,
334
+ 5938,
335
+ 2089,
336
+ 30
337
+ ],
338
+ "temperature": 0.0,
339
+ "avg_logprob": -0.09471903425274474,
340
+ "compression_ratio": 1.50920245398773,
341
+ "no_speech_prob": 0.0003512969706207514
342
+ },
343
+ {
344
+ "id": 8,
345
+ "seek": 6500,
346
+ "start": 77.0,
347
+ "end": 87.0,
348
+ "text": " Your face, your voice, just your hair and... I was confused. There are all sorts of strange things around here.",
349
+ "tokens": [
350
+ 3406,
351
+ 1986,
352
+ 11,
353
+ 534,
354
+ 3809,
355
+ 11,
356
+ 655,
357
+ 534,
358
+ 4190,
359
+ 290,
360
+ 986,
361
+ 314,
362
+ 373,
363
+ 10416,
364
+ 13,
365
+ 1318,
366
+ 389,
367
+ 477,
368
+ 10524,
369
+ 286,
370
+ 6283,
371
+ 1243,
372
+ 1088,
373
+ 994,
374
+ 13
375
+ ],
376
+ "temperature": 0.0,
377
+ "avg_logprob": -0.09471903425274474,
378
+ "compression_ratio": 1.50920245398773,
379
+ "no_speech_prob": 0.0003512969706207514
380
+ },
381
+ {
382
+ "id": 9,
383
+ "seek": 8700,
384
+ "start": 87.0,
385
+ "end": 97.0,
386
+ "text": " This is no place for a kid. Eddie told me. Who's Rachel? What's that letter? It's time to end this nightmare.",
387
+ "tokens": [
388
+ 770,
389
+ 318,
390
+ 645,
391
+ 1295,
392
+ 329,
393
+ 257,
394
+ 5141,
395
+ 13,
396
+ 19478,
397
+ 1297,
398
+ 502,
399
+ 13,
400
+ 5338,
401
+ 338,
402
+ 15984,
403
+ 30,
404
+ 1867,
405
+ 338,
406
+ 326,
407
+ 3850,
408
+ 30,
409
+ 632,
410
+ 338,
411
+ 640,
412
+ 284,
413
+ 886,
414
+ 428,
415
+ 17123,
416
+ 13
417
+ ],
418
+ "temperature": 0.0,
419
+ "avg_logprob": -0.050474664439325745,
420
+ "compression_ratio": 1.4047619047619047,
421
+ "no_speech_prob": 1.406333740305854e-05
422
+ },
423
+ {
424
+ "id": 10,
425
+ "seek": 8700,
426
+ "start": 97.0,
427
+ "end": 107.0,
428
+ "text": " What the hell is it? I didn't come here to play, you know. You liar! Don't be ridiculous. How can you sit there and eat pizza?",
429
+ "tokens": [
430
+ 1867,
431
+ 262,
432
+ 5968,
433
+ 318,
434
+ 340,
435
+ 30,
436
+ 314,
437
+ 1422,
438
+ 470,
439
+ 1282,
440
+ 994,
441
+ 284,
442
+ 711,
443
+ 11,
444
+ 345,
445
+ 760,
446
+ 13,
447
+ 921,
448
+ 31866,
449
+ 0,
450
+ 2094,
451
+ 470,
452
+ 307,
453
+ 11441,
454
+ 13,
455
+ 1374,
456
+ 460,
457
+ 345,
458
+ 1650,
459
+ 612,
460
+ 290,
461
+ 4483,
462
+ 14256,
463
+ 30
464
+ ],
465
+ "temperature": 0.0,
466
+ "avg_logprob": -0.050474664439325745,
467
+ "compression_ratio": 1.4047619047619047,
468
+ "no_speech_prob": 1.406333740305854e-05
469
+ },
470
+ {
471
+ "id": 11,
472
+ "seek": 10700,
473
+ "start": 107.0,
474
+ "end": 122.0,
475
+ "text": " You! It was you, wasn't it? You're the one who stepped on my hand. I'm done with you. Forget you. Someone very important to me. You're not Mary.",
476
+ "tokens": [
477
+ 50363,
478
+ 921,
479
+ 0,
480
+ 632,
481
+ 373,
482
+ 345,
483
+ 11,
484
+ 2492,
485
+ 470,
486
+ 340,
487
+ 30,
488
+ 921,
489
+ 821,
490
+ 262,
491
+ 530,
492
+ 508,
493
+ 10764,
494
+ 319,
495
+ 616,
496
+ 1021,
497
+ 13,
498
+ 314,
499
+ 1101,
500
+ 1760,
501
+ 351,
502
+ 345,
503
+ 13,
504
+ 29624,
505
+ 345,
506
+ 13,
507
+ 17877,
508
+ 845,
509
+ 1593,
510
+ 284,
511
+ 502,
512
+ 13,
513
+ 921,
514
+ 821,
515
+ 407,
516
+ 5335,
517
+ 13,
518
+ 51113
519
+ ],
520
+ "temperature": 0.0,
521
+ "avg_logprob": -0.07767114528389864,
522
+ "compression_ratio": 1.2307692307692308,
523
+ "no_speech_prob": 2.5464909413130954e-05
524
+ }
525
+ ],
526
+ "language": "en"
527
+ },
528
+ "ynoeld.wav": {
529
+ "text": " It's you. It's you. But I don't need you anymore. How old are you? Are you still here? Are you okay? What happened to you? We met in the apartment building. We met in the apartment building. Sure is quiet here, huh? What are you doing, Laura? Aren't you Maria? So, you're Maria? You're Maria? What's a little girl like you doing here, anyway? I didn't mean to scare you. Are you alone here, Eddie? James Sunderland. James. My name's James. Eddie? Laura? Laura. Maria? Maria. Mary? Mary? Mary? Is that her name? Who is that girl, anyhow? Yeah. Yeah. Yes! Okay. That's right. Oh, yeah. I understand now. I believe you. No. No. No, I... No, you're not. Nothing. Oh, nothing. I guess I really don't care. I don't know. Sorry. What? Do what? Tell me what happened. Why can't you just tell me? All I want from you is an answer. How do you know about that? Is there any other way? Don't you remember? Later, okay? Stay right there. I'll be there soon. I'll be there soon. Thanks.",
530
+ "segments": [
531
+ {
532
+ "id": 0,
533
+ "seek": 0,
534
+ "start": 0.0,
535
+ "end": 5.0,
536
+ "text": " It's you. It's you. But I don't need you anymore.",
537
+ "tokens": [
538
+ 632,
539
+ 338,
540
+ 345,
541
+ 13,
542
+ 632,
543
+ 338,
544
+ 345,
545
+ 13,
546
+ 887,
547
+ 314,
548
+ 836,
549
+ 470,
550
+ 761,
551
+ 345,
552
+ 7471,
553
+ 13
554
+ ],
555
+ "temperature": 0.0,
556
+ "avg_logprob": -0.153718864216524,
557
+ "compression_ratio": 1.7720207253886011,
558
+ "no_speech_prob": 0.13705560564994812
559
+ },
560
+ {
561
+ "id": 1,
562
+ "seek": 0,
563
+ "start": 5.0,
564
+ "end": 11.0,
565
+ "text": " How old are you? Are you still here? Are you okay? What happened to you?",
566
+ "tokens": [
567
+ 1374,
568
+ 1468,
569
+ 389,
570
+ 345,
571
+ 30,
572
+ 4231,
573
+ 345,
574
+ 991,
575
+ 994,
576
+ 30,
577
+ 4231,
578
+ 345,
579
+ 8788,
580
+ 30,
581
+ 1867,
582
+ 3022,
583
+ 284,
584
+ 345,
585
+ 30
586
+ ],
587
+ "temperature": 0.0,
588
+ "avg_logprob": -0.153718864216524,
589
+ "compression_ratio": 1.7720207253886011,
590
+ "no_speech_prob": 0.13705560564994812
591
+ },
592
+ {
593
+ "id": 2,
594
+ "seek": 0,
595
+ "start": 11.0,
596
+ "end": 18.0,
597
+ "text": " We met in the apartment building. We met in the apartment building. Sure is quiet here, huh?",
598
+ "tokens": [
599
+ 775,
600
+ 1138,
601
+ 287,
602
+ 262,
603
+ 7962,
604
+ 2615,
605
+ 13,
606
+ 775,
607
+ 1138,
608
+ 287,
609
+ 262,
610
+ 7962,
611
+ 2615,
612
+ 13,
613
+ 10889,
614
+ 318,
615
+ 5897,
616
+ 994,
617
+ 11,
618
+ 24926,
619
+ 30
620
+ ],
621
+ "temperature": 0.0,
622
+ "avg_logprob": -0.153718864216524,
623
+ "compression_ratio": 1.7720207253886011,
624
+ "no_speech_prob": 0.13705560564994812
625
+ },
626
+ {
627
+ "id": 3,
628
+ "seek": 0,
629
+ "start": 18.0,
630
+ "end": 22.0,
631
+ "text": " What are you doing, Laura? Aren't you Maria?",
632
+ "tokens": [
633
+ 1867,
634
+ 389,
635
+ 345,
636
+ 1804,
637
+ 11,
638
+ 16753,
639
+ 30,
640
+ 9843,
641
+ 470,
642
+ 345,
643
+ 14200,
644
+ 30
645
+ ],
646
+ "temperature": 0.0,
647
+ "avg_logprob": -0.153718864216524,
648
+ "compression_ratio": 1.7720207253886011,
649
+ "no_speech_prob": 0.13705560564994812
650
+ },
651
+ {
652
+ "id": 4,
653
+ "seek": 0,
654
+ "start": 22.0,
655
+ "end": 29.0,
656
+ "text": " So, you're Maria? You're Maria? What's a little girl like you doing here, anyway?",
657
+ "tokens": [
658
+ 1406,
659
+ 11,
660
+ 345,
661
+ 821,
662
+ 14200,
663
+ 30,
664
+ 921,
665
+ 821,
666
+ 14200,
667
+ 30,
668
+ 1867,
669
+ 338,
670
+ 257,
671
+ 1310,
672
+ 2576,
673
+ 588,
674
+ 345,
675
+ 1804,
676
+ 994,
677
+ 11,
678
+ 6949,
679
+ 30
680
+ ],
681
+ "temperature": 0.0,
682
+ "avg_logprob": -0.153718864216524,
683
+ "compression_ratio": 1.7720207253886011,
684
+ "no_speech_prob": 0.13705560564994812
685
+ },
686
+ {
687
+ "id": 5,
688
+ "seek": 2900,
689
+ "start": 29.0,
690
+ "end": 33.0,
691
+ "text": " I didn't mean to scare you. Are you alone here, Eddie?",
692
+ "tokens": [
693
+ 314,
694
+ 1422,
695
+ 470,
696
+ 1612,
697
+ 284,
698
+ 19437,
699
+ 345,
700
+ 13,
701
+ 4231,
702
+ 345,
703
+ 3436,
704
+ 994,
705
+ 11,
706
+ 19478,
707
+ 30
708
+ ],
709
+ "temperature": 0.0,
710
+ "avg_logprob": -0.14054276393010065,
711
+ "compression_ratio": 1.5032679738562091,
712
+ "no_speech_prob": 1.9525503375916742e-05
713
+ },
714
+ {
715
+ "id": 6,
716
+ "seek": 2900,
717
+ "start": 33.0,
718
+ "end": 38.0,
719
+ "text": " James Sunderland. James. My name's James.",
720
+ "tokens": [
721
+ 3700,
722
+ 35706,
723
+ 13,
724
+ 3700,
725
+ 13,
726
+ 2011,
727
+ 1438,
728
+ 338,
729
+ 3700,
730
+ 13
731
+ ],
732
+ "temperature": 0.0,
733
+ "avg_logprob": -0.14054276393010065,
734
+ "compression_ratio": 1.5032679738562091,
735
+ "no_speech_prob": 1.9525503375916742e-05
736
+ },
737
+ {
738
+ "id": 7,
739
+ "seek": 2900,
740
+ "start": 38.0,
741
+ "end": 48.0,
742
+ "text": " Eddie? Laura? Laura. Maria? Maria. Mary? Mary? Mary?",
743
+ "tokens": [
744
+ 19478,
745
+ 30,
746
+ 16753,
747
+ 30,
748
+ 16753,
749
+ 13,
750
+ 14200,
751
+ 30,
752
+ 14200,
753
+ 13,
754
+ 5335,
755
+ 30,
756
+ 5335,
757
+ 30,
758
+ 5335,
759
+ 30
760
+ ],
761
+ "temperature": 0.0,
762
+ "avg_logprob": -0.14054276393010065,
763
+ "compression_ratio": 1.5032679738562091,
764
+ "no_speech_prob": 1.9525503375916742e-05
765
+ },
766
+ {
767
+ "id": 8,
768
+ "seek": 2900,
769
+ "start": 48.0,
770
+ "end": 52.0,
771
+ "text": " Is that her name? Who is that girl, anyhow?",
772
+ "tokens": [
773
+ 1148,
774
+ 326,
775
+ 607,
776
+ 1438,
777
+ 30,
778
+ 5338,
779
+ 318,
780
+ 326,
781
+ 2576,
782
+ 11,
783
+ 597,
784
+ 4919,
785
+ 30
786
+ ],
787
+ "temperature": 0.0,
788
+ "avg_logprob": -0.14054276393010065,
789
+ "compression_ratio": 1.5032679738562091,
790
+ "no_speech_prob": 1.9525503375916742e-05
791
+ },
792
+ {
793
+ "id": 9,
794
+ "seek": 2900,
795
+ "start": 52.0,
796
+ "end": 57.0,
797
+ "text": " Yeah. Yeah. Yes! Okay. That's right.",
798
+ "tokens": [
799
+ 9425,
800
+ 13,
801
+ 9425,
802
+ 13,
803
+ 3363,
804
+ 0,
805
+ 16805,
806
+ 13,
807
+ 1320,
808
+ 338,
809
+ 826,
810
+ 13
811
+ ],
812
+ "temperature": 0.0,
813
+ "avg_logprob": -0.14054276393010065,
814
+ "compression_ratio": 1.5032679738562091,
815
+ "no_speech_prob": 1.9525503375916742e-05
816
+ },
817
+ {
818
+ "id": 10,
819
+ "seek": 5700,
820
+ "start": 57.0,
821
+ "end": 61.0,
822
+ "text": " Oh, yeah. I understand now. I believe you.",
823
+ "tokens": [
824
+ 3966,
825
+ 11,
826
+ 10194,
827
+ 13,
828
+ 314,
829
+ 1833,
830
+ 783,
831
+ 13,
832
+ 314,
833
+ 1975,
834
+ 345,
835
+ 13
836
+ ],
837
+ "temperature": 0.0,
838
+ "avg_logprob": -0.09678743459001372,
839
+ "compression_ratio": 1.42,
840
+ "no_speech_prob": 6.1439545788744e-06
841
+ },
842
+ {
843
+ "id": 11,
844
+ "seek": 5700,
845
+ "start": 61.0,
846
+ "end": 68.0,
847
+ "text": " No. No. No, I... No, you're not.",
848
+ "tokens": [
849
+ 1400,
850
+ 13,
851
+ 1400,
852
+ 13,
853
+ 1400,
854
+ 11,
855
+ 314,
856
+ 986,
857
+ 1400,
858
+ 11,
859
+ 345,
860
+ 821,
861
+ 407,
862
+ 13
863
+ ],
864
+ "temperature": 0.0,
865
+ "avg_logprob": -0.09678743459001372,
866
+ "compression_ratio": 1.42,
867
+ "no_speech_prob": 6.1439545788744e-06
868
+ },
869
+ {
870
+ "id": 12,
871
+ "seek": 5700,
872
+ "start": 68.0,
873
+ "end": 72.0,
874
+ "text": " Nothing. Oh, nothing. I guess I really don't care.",
875
+ "tokens": [
876
+ 10528,
877
+ 13,
878
+ 3966,
879
+ 11,
880
+ 2147,
881
+ 13,
882
+ 314,
883
+ 4724,
884
+ 314,
885
+ 1107,
886
+ 836,
887
+ 470,
888
+ 1337,
889
+ 13
890
+ ],
891
+ "temperature": 0.0,
892
+ "avg_logprob": -0.09678743459001372,
893
+ "compression_ratio": 1.42,
894
+ "no_speech_prob": 6.1439545788744e-06
895
+ },
896
+ {
897
+ "id": 13,
898
+ "seek": 5700,
899
+ "start": 72.0,
900
+ "end": 77.0,
901
+ "text": " I don't know. Sorry.",
902
+ "tokens": [
903
+ 314,
904
+ 836,
905
+ 470,
906
+ 760,
907
+ 13,
908
+ 19061,
909
+ 13
910
+ ],
911
+ "temperature": 0.0,
912
+ "avg_logprob": -0.09678743459001372,
913
+ "compression_ratio": 1.42,
914
+ "no_speech_prob": 6.1439545788744e-06
915
+ },
916
+ {
917
+ "id": 14,
918
+ "seek": 5700,
919
+ "start": 77.0,
920
+ "end": 81.0,
921
+ "text": " What? Do what? Tell me what happened.",
922
+ "tokens": [
923
+ 1867,
924
+ 30,
925
+ 2141,
926
+ 644,
927
+ 30,
928
+ 14026,
929
+ 502,
930
+ 644,
931
+ 3022,
932
+ 13
933
+ ],
934
+ "temperature": 0.0,
935
+ "avg_logprob": -0.09678743459001372,
936
+ "compression_ratio": 1.42,
937
+ "no_speech_prob": 6.1439545788744e-06
938
+ },
939
+ {
940
+ "id": 15,
941
+ "seek": 5700,
942
+ "start": 81.0,
943
+ "end": 83.0,
944
+ "text": " Why can't you just tell me?",
945
+ "tokens": [
946
+ 4162,
947
+ 460,
948
+ 470,
949
+ 345,
950
+ 655,
951
+ 1560,
952
+ 502,
953
+ 30
954
+ ],
955
+ "temperature": 0.0,
956
+ "avg_logprob": -0.09678743459001372,
957
+ "compression_ratio": 1.42,
958
+ "no_speech_prob": 6.1439545788744e-06
959
+ },
960
+ {
961
+ "id": 16,
962
+ "seek": 8300,
963
+ "start": 83.0,
964
+ "end": 88.0,
965
+ "text": " All I want from you is an answer. How do you know about that?",
966
+ "tokens": [
967
+ 1439,
968
+ 314,
969
+ 765,
970
+ 422,
971
+ 345,
972
+ 318,
973
+ 281,
974
+ 3280,
975
+ 13,
976
+ 1374,
977
+ 466,
978
+ 345,
979
+ 760,
980
+ 546,
981
+ 326,
982
+ 30
983
+ ],
984
+ "temperature": 0.0,
985
+ "avg_logprob": -0.04557831534023943,
986
+ "compression_ratio": 1.3834586466165413,
987
+ "no_speech_prob": 1.7880429368233308e-06
988
+ },
989
+ {
990
+ "id": 17,
991
+ "seek": 8300,
992
+ "start": 88.0,
993
+ "end": 91.0,
994
+ "text": " Is there any other way? Don't you remember?",
995
+ "tokens": [
996
+ 1148,
997
+ 612,
998
+ 597,
999
+ 584,
1000
+ 835,
1001
+ 30,
1002
+ 2094,
1003
+ 470,
1004
+ 345,
1005
+ 3505,
1006
+ 30
1007
+ ],
1008
+ "temperature": 0.0,
1009
+ "avg_logprob": -0.04557831534023943,
1010
+ "compression_ratio": 1.3834586466165413,
1011
+ "no_speech_prob": 1.7880429368233308e-06
1012
+ },
1013
+ {
1014
+ "id": 18,
1015
+ "seek": 8300,
1016
+ "start": 91.0,
1017
+ "end": 93.0,
1018
+ "text": " Later, okay?",
1019
+ "tokens": [
1020
+ 11450,
1021
+ 11,
1022
+ 8788,
1023
+ 30
1024
+ ],
1025
+ "temperature": 0.0,
1026
+ "avg_logprob": -0.04557831534023943,
1027
+ "compression_ratio": 1.3834586466165413,
1028
+ "no_speech_prob": 1.7880429368233308e-06
1029
+ },
1030
+ {
1031
+ "id": 19,
1032
+ "seek": 9300,
1033
+ "start": 93.0,
1034
+ "end": 114.0,
1035
+ "text": " Stay right there. I'll be there soon. I'll be there soon. Thanks.",
1036
+ "tokens": [
1037
+ 50363,
1038
+ 16160,
1039
+ 826,
1040
+ 612,
1041
+ 13,
1042
+ 314,
1043
+ 1183,
1044
+ 307,
1045
+ 612,
1046
+ 2582,
1047
+ 13,
1048
+ 314,
1049
+ 1183,
1050
+ 307,
1051
+ 612,
1052
+ 2582,
1053
+ 13,
1054
+ 6930,
1055
+ 13,
1056
+ 51413
1057
+ ],
1058
+ "temperature": 0.0,
1059
+ "avg_logprob": -0.10187114988054548,
1060
+ "compression_ratio": 1.3265306122448979,
1061
+ "no_speech_prob": 5.649423474096693e-05
1062
+ }
1063
+ ],
1064
+ "language": "en"
1065
+ }
1066
+ }
finetunes/james-sunderland/dataset/ynoeld_00000.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b31614e30137738984716d1943a56d66487b35310926730882a9ef272da8e09e
3
+ size 882080
finetunes/james-sunderland/dataset/ynoeld_00001.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98bea197bffbfe02cbfc09e02243709e87a11d65b279a3a1485c671f5e251a6c
3
+ size 1058480
finetunes/james-sunderland/dataset/ynoeld_00002.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bdf95b92f974f4a7023c2b8ea3d2eb2f47dcc83391bc961fd40f373bddc4f680
3
+ size 1234880
finetunes/james-sunderland/dataset/ynoeld_00003.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:27b32b2aa77c0234eca1883620ade655034b2ee42fcf8e26e2c408738c655e39
3
+ size 705680
finetunes/james-sunderland/dataset/ynoeld_00004.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0bd5ca0c4381cc32fad2977e470fdcc6318db4abe42719350a4fb0949c99a94b
3
+ size 1234880
finetunes/james-sunderland/dataset/ynoeld_00005.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:011be88fb79a79dae064270cc7f87689f236d27dd2ccb4bf018d68ad0750cbb2
3
+ size 705680
finetunes/james-sunderland/dataset/ynoeld_00006.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21ffde4fbd4063dc8a3949c00ec4cc5055ab30944e3f41325ab94a1e79a4f48c
3
+ size 882080
finetunes/james-sunderland/dataset/ynoeld_00007.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bae00b0bfe8cda4909fbfec6e2ef5ede031b8bbc4edb0e2713722abeca101f03
3
+ size 1764080
finetunes/james-sunderland/dataset/ynoeld_00008.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25863e3b8694cb12762efc3f5597b3885395ae0cc85078d20754569ee7fbc0c9
3
+ size 705680
finetunes/james-sunderland/dataset/ynoeld_00009.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0d9b88538ed6f6ff6c6467983da87024ac34776e6de8af0e4d464f2416062121
3
+ size 882080
finetunes/james-sunderland/dataset/ynoeld_00010.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cead9ecd32d0d85d491d4232b2eafbd5fb323ba21e20a81706f3eb8db8117d15
3
+ size 705680
finetunes/james-sunderland/dataset/ynoeld_00011.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:93fe0f3a558663cec9cc4af2d9e656d8d3954b46bdec3ef423cab876c87771dc
3
+ size 1234880
finetunes/james-sunderland/dataset/ynoeld_00012.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ccffcfef292e328a78d22e53265da9e081d209321b37f56890aa3eb6f5650bd6
3
+ size 705680
finetunes/james-sunderland/dataset/ynoeld_00013.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4533939de62fb46d7ed44d5dea97f91a5c1940f32eace589931bb133c6545f33
3
+ size 882080
finetunes/james-sunderland/dataset/ynoeld_00014.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:39dde7e9d390f1a7241a3caeeed30d125d2cddd57491b510c3b669c61ad5a924
3
+ size 705680
finetunes/james-sunderland/dataset/ynoeld_00015.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d3a551a0ac7db136fb2554dba7dc1116ffca8dd27d8f91c3ff92c311a1e806d
3
+ size 352880
finetunes/james-sunderland/dataset/ynoeld_00016.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:154ee5f59038ef9751fdffbaa49003c6af4b470ede808c5e52d1425ffd62b3d7
3
+ size 882080
finetunes/james-sunderland/dataset/ynoeld_00017.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbcfa1b55984b896d2145b2d251766b9915948635350603d8545cd9ae51d3e63
3
+ size 529280
finetunes/james-sunderland/dataset/ynoeld_00018.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ced36b4eea93c69bbf4ed3b456fbbaf4003432c4c6fda689ccb3013037ef87a5
3
+ size 352880
finetunes/james-sunderland/dataset/ynoeld_00019.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6328ccff79da49ff28ccfa494ebbb7dbb09e20118ae56443fdfbb027f866b742
3
+ size 1022260