added: SH2 James dataset
Browse files- finetunes/james-sunderland/dataset/lxgbsm_00000.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00001.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00002.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00003.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00004.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00005.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00006.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00007.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00008.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00009.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00010.wav +3 -0
- finetunes/james-sunderland/dataset/lxgbsm_00011.wav +3 -0
- finetunes/james-sunderland/dataset/train.txt +32 -0
- finetunes/james-sunderland/dataset/train.yaml +147 -0
- finetunes/james-sunderland/dataset/whisper.json +1066 -0
- finetunes/james-sunderland/dataset/ynoeld_00000.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00001.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00002.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00003.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00004.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00005.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00006.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00007.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00008.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00009.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00010.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00011.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00012.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00013.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00014.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00015.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00016.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00017.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00018.wav +3 -0
- finetunes/james-sunderland/dataset/ynoeld_00019.wav +3 -0
finetunes/james-sunderland/dataset/lxgbsm_00000.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cb65d9c3571f12f6a3ff6de1f43a468466fec3328a620bc271e971c816c13cdd
|
3 |
+
size 1234880
|
finetunes/james-sunderland/dataset/lxgbsm_00001.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cfc5673c594825be558acb0256c56c5a8808d0eb0e9630183fe2a3e9b85f4e9a
|
3 |
+
size 1587680
|
finetunes/james-sunderland/dataset/lxgbsm_00002.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ee6c2a46fb6289374844e160db4173d9572bf046230819f0bf6f4ce4d6433c26
|
3 |
+
size 1587680
|
finetunes/james-sunderland/dataset/lxgbsm_00003.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f97fb2cf229a4e3849b166e9276d5570237a8eb04b70a96f5e47cc641f24726d
|
3 |
+
size 1940480
|
finetunes/james-sunderland/dataset/lxgbsm_00004.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d33ecb3eb38426364ef3f10fb746c3f52c2dd6eb3188418bb5fdb0559ce4919a
|
3 |
+
size 1587680
|
finetunes/james-sunderland/dataset/lxgbsm_00005.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02de0317585aab8cd30180587c37680bef4202a11f18605062bf0a85812a9f04
|
3 |
+
size 1940480
|
finetunes/james-sunderland/dataset/lxgbsm_00006.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:583e4417dcafc5dc1b6f55ed5e24f474a5c5513c318e51fd360293c626aea3ec
|
3 |
+
size 1587680
|
finetunes/james-sunderland/dataset/lxgbsm_00007.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2902802b9ad97f5b0fa72e245a598714c2289ea5d8f1b415e928ed6abba774e3
|
3 |
+
size 2116880
|
finetunes/james-sunderland/dataset/lxgbsm_00008.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5c6ee7a8d1cceffb255a5d2c959a7af2ee0f5ba1238f2e9eebf25fdf14068168
|
3 |
+
size 1764080
|
finetunes/james-sunderland/dataset/lxgbsm_00009.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fd8228c3b3ffb4304c0c3bf859361f1a3b68bdd7a9277673737321158bf81466
|
3 |
+
size 1764080
|
finetunes/james-sunderland/dataset/lxgbsm_00010.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0ce2d9d9a9faaf12c78a9aa70af88664415a00af75bba7f024400ffdf727c04a
|
3 |
+
size 1764080
|
finetunes/james-sunderland/dataset/lxgbsm_00011.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2700fcaf46c9f9b99bdf1a95d135bbe4451962c5f7991ed90a954b2d6e777f10
|
3 |
+
size 2646080
|
finetunes/james-sunderland/dataset/train.txt
ADDED
@@ -0,0 +1,32 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
lxgbsm_00000.wav|I'm kind of lost. I'm looking for Silent Hill. Silent Hill? Is this the right way?
|
2 |
+
lxgbsm_00001.wav|Well, there's the hotel too, I guess. There's the hotel too, I guess. The one on the lake? I wonder if it's still there.
|
3 |
+
lxgbsm_00002.wav|You're coming with me? Is it dangerous? I'll be careful. I guess I really don't care if it's dangerous or not.
|
4 |
+
lxgbsm_00003.wav|I'm going to town either way. I'm looking for someone. I'm looking for someone. Someone very important to me.
|
5 |
+
lxgbsm_00004.wav|I'm looking for Mary. Have you seen her? Without Mary, I just can't go on.
|
6 |
+
lxgbsm_00005.wav|I'd do anything if I could be with her again. I'm going to go look for her. I wish I knew. I killed her. Three years ago.
|
7 |
+
lxgbsm_00006.wav|Last year. But I got a letter from her. I got a letter from her. How do you know about Mary? You really seem to care about her.
|
8 |
+
lxgbsm_00007.wav|Is that why you're here too? You're not Mary. You're really not Mary. You're alive! I thought that thing killed you. Are you hurt bad?
|
9 |
+
lxgbsm_00008.wav|Your face, your voice, just your hair and... I was confused. There are all sorts of strange things around here.
|
10 |
+
lxgbsm_00009.wav|This is no place for a kid. Eddie told me. Who's Rachel? What's that letter? It's time to end this nightmare.
|
11 |
+
lxgbsm_00010.wav|What the hell is it? I didn't come here to play, you know. You liar! Don't be ridiculous. How can you sit there and eat pizza?
|
12 |
+
lxgbsm_00011.wav|You! It was you, wasn't it? You're the one who stepped on my hand. I'm done with you. Forget you. Someone very important to me. You're not Mary.
|
13 |
+
ynoeld_00000.wav|It's you. It's you. But I don't need you anymore.
|
14 |
+
ynoeld_00001.wav|How old are you? Are you still here? Are you okay? What happened to you?
|
15 |
+
ynoeld_00002.wav|We met in the apartment building. We met in the apartment building. Sure is quiet here, huh?
|
16 |
+
ynoeld_00003.wav|What are you doing, Laura? Aren't you Maria?
|
17 |
+
ynoeld_00004.wav|So, you're Maria? You're Maria? What's a little girl like you doing here, anyway?
|
18 |
+
ynoeld_00005.wav|I didn't mean to scare you. Are you alone here, Eddie?
|
19 |
+
ynoeld_00006.wav|James Sunderland. James. My name's James.
|
20 |
+
ynoeld_00007.wav|Eddie? Laura? Laura. Maria? Maria. Mary? Mary? Mary?
|
21 |
+
ynoeld_00008.wav|Is that her name? Who is that girl, anyhow?
|
22 |
+
ynoeld_00009.wav|Yeah. Yeah. Yes! Okay. That's right.
|
23 |
+
ynoeld_00010.wav|Oh, yeah. I understand now. I believe you.
|
24 |
+
ynoeld_00011.wav|No. No. No, I... No, you're not.
|
25 |
+
ynoeld_00012.wav|Nothing. Oh, nothing. I guess I really don't care.
|
26 |
+
ynoeld_00013.wav|I don't know. Sorry.
|
27 |
+
ynoeld_00014.wav|What? Do what? Tell me what happened.
|
28 |
+
ynoeld_00015.wav|Why can't you just tell me?
|
29 |
+
ynoeld_00016.wav|All I want from you is an answer. How do you know about that?
|
30 |
+
ynoeld_00017.wav|Is there any other way? Don't you remember?
|
31 |
+
ynoeld_00018.wav|Later, okay?
|
32 |
+
ynoeld_00019.wav|Stay right there. I'll be there soon. I'll be there soon. Thanks.
|
finetunes/james-sunderland/dataset/train.yaml
ADDED
@@ -0,0 +1,147 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
name: james-finetune
|
2 |
+
model: extensibletrainer
|
3 |
+
scale: 1
|
4 |
+
gpu_ids: [0] # Redundant: the way you launch the training script will set this
|
5 |
+
start_step: 0
|
6 |
+
checkpointing_enabled: true
|
7 |
+
fp16: false
|
8 |
+
wandb: false
|
9 |
+
use_tb_logger: true
|
10 |
+
|
11 |
+
datasets:
|
12 |
+
train:
|
13 |
+
name: james-train
|
14 |
+
n_workers: 2
|
15 |
+
batch_size: 32
|
16 |
+
mode: paired_voice_audio
|
17 |
+
path: ./training/james/train.txt
|
18 |
+
fetcher_mode: ['lj']
|
19 |
+
phase: train
|
20 |
+
max_wav_length: 255995
|
21 |
+
max_text_length: 200
|
22 |
+
sample_rate: 22050
|
23 |
+
load_conditioning: True
|
24 |
+
num_conditioning_candidates: 2
|
25 |
+
conditioning_length: 44000
|
26 |
+
use_bpe_tokenizer: True
|
27 |
+
tokenizer_vocab: ./models/tortoise/bpe_lowercase_asr_256.json
|
28 |
+
load_aligned_codes: False
|
29 |
+
val: # Validation is not a priority right now, so it simply reuses the training list
|
30 |
+
name: james-val
|
31 |
+
n_workers: 1
|
32 |
+
batch_size: 1
|
33 |
+
mode: paired_voice_audio
|
34 |
+
path: ./training/james/train.txt
|
35 |
+
fetcher_mode: ['lj']
|
36 |
+
phase: val
|
37 |
+
max_wav_length: 255995
|
38 |
+
max_text_length: 200
|
39 |
+
sample_rate: 22050
|
40 |
+
load_conditioning: True
|
41 |
+
num_conditioning_candidates: 2
|
42 |
+
conditioning_length: 44000
|
43 |
+
use_bpe_tokenizer: True
|
44 |
+
tokenizer_vocab: ./models/tortoise/bpe_lowercase_asr_256.json
|
45 |
+
load_aligned_codes: False
|
46 |
+
|
47 |
+
steps:
|
48 |
+
gpt_train:
|
49 |
+
training: gpt
|
50 |
+
loss_log_buffer: 500
|
51 |
+
|
52 |
+
# Generally follows the recipe from the DALLE paper.
|
53 |
+
optimizer: adamw # this should be adamw_zero if you're using distributed training
|
54 |
+
optimizer_params:
|
55 |
+
lr: !!float 0.0001 # originally: 1e-4
|
56 |
+
weight_decay: !!float 1e-2
|
57 |
+
beta1: 0.9
|
58 |
+
beta2: 0.96
|
59 |
+
clip_grad_eps: 4
|
60 |
+
|
61 |
+
injectors:
|
62 |
+
paired_to_mel:
|
63 |
+
type: torch_mel_spectrogram
|
64 |
+
mel_norm_file: ./models/tortoise/clips_mel_norms.pth
|
65 |
+
in: wav
|
66 |
+
out: paired_mel
|
67 |
+
paired_cond_to_mel:
|
68 |
+
type: for_each
|
69 |
+
subtype: torch_mel_spectrogram
|
70 |
+
mel_norm_file: ./models/tortoise/clips_mel_norms.pth
|
71 |
+
in: conditioning
|
72 |
+
out: paired_conditioning_mel
|
73 |
+
to_codes:
|
74 |
+
type: discrete_token
|
75 |
+
in: paired_mel
|
76 |
+
out: paired_mel_codes
|
77 |
+
dvae_config: "./models/tortoise/train_diffusion_vocoder_22k_level.yml"
|
78 |
+
paired_fwd_text:
|
79 |
+
type: generator
|
80 |
+
generator: gpt
|
81 |
+
in: [paired_conditioning_mel, padded_text, text_lengths, paired_mel_codes, wav_lengths]
|
82 |
+
out: [loss_text_ce, loss_mel_ce, logits]
|
83 |
+
losses:
|
84 |
+
text_ce:
|
85 |
+
type: direct
|
86 |
+
weight: 0.01
|
87 |
+
key: loss_text_ce
|
88 |
+
mel_ce:
|
89 |
+
type: direct
|
90 |
+
weight: 1
|
91 |
+
key: loss_mel_ce
|
92 |
+
|
93 |
+
networks:
|
94 |
+
gpt:
|
95 |
+
type: generator
|
96 |
+
which_model_G: unified_voice2 # None of the unified_voice*.py files exactly match the tortoise inference code: versions 3 and 4 add an "alignment_head" (purpose unclear), and version 2 lacks the types=1 parameter.
|
97 |
+
kwargs:
|
98 |
+
layers: 30 # originally: 8
|
99 |
+
model_dim: 1024 # originally: 512
|
100 |
+
heads: 16 # originally: 8
|
101 |
+
max_text_tokens: 402 # originally: 120
|
102 |
+
max_mel_tokens: 604 # originally: 250
|
103 |
+
max_conditioning_inputs: 2 # originally: 1
|
104 |
+
mel_length_compression: 1024
|
105 |
+
number_text_tokens: 256 # supposed to be 255 for newer unified_voice files
|
106 |
+
number_mel_codes: 8194
|
107 |
+
start_mel_token: 8192
|
108 |
+
stop_mel_token: 8193
|
109 |
+
start_text_token: 255
|
110 |
+
train_solo_embeddings: False # missing in uv3/4
|
111 |
+
use_mel_codes_as_input: True # also missing in uv3/4
|
112 |
+
checkpointing: True
|
113 |
+
#types: 1 # this parameter is MISSING from unified_voice2, but by my analysis types=1 is equivalent to omitting it.
|
114 |
+
#only_alignment_head: False # uv3/4
|
115 |
+
|
116 |
+
path:
|
117 |
+
pretrain_model_gpt: './models/tortoise/autoregressive.pth'
|
118 |
+
strict_load: true
|
119 |
+
# resume_state: './training/james-finetune//training_state//50.state'
|
120 |
+
|
121 |
+
train:
|
122 |
+
niter: 500
|
123 |
+
warmup_iter: -1
|
124 |
+
mega_batch_factor: 16
|
125 |
+
val_freq: 500
|
126 |
+
|
127 |
+
ema_enabled: false # I really don't think EMA matters
|
128 |
+
|
129 |
+
default_lr_scheme: MultiStepLR
|
130 |
+
gen_lr_steps: [9, 18, 25, 33] #[50000, 100000, 140000, 180000]
|
131 |
+
lr_gamma: 0.5
|
132 |
+
|
133 |
+
eval:
|
134 |
+
output_state: gen
|
135 |
+
injectors:
|
136 |
+
gen_inj_eval:
|
137 |
+
type: generator
|
138 |
+
generator: generator
|
139 |
+
in: hq
|
140 |
+
out: [gen, codebook_commitment_loss]
|
141 |
+
|
142 |
+
logger:
|
143 |
+
print_freq: 5
|
144 |
+
save_checkpoint_freq: 25
|
145 |
+
visuals: [gen, mel]
|
146 |
+
visual_debug_rate: 5
|
147 |
+
is_mel_spectrogram: true
|
finetunes/james-sunderland/dataset/whisper.json
ADDED
@@ -0,0 +1,1066 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"lxgbsm.wav": {
|
3 |
+
"text": " I'm kind of lost. I'm looking for Silent Hill. Silent Hill? Is this the right way? Well, there's the hotel 2, I guess. There's the hotel 2, I guess. The one on the lake? I wonder if it's still there. You're coming with me? Is it dangerous? I'll be careful. I guess I really don't care if it's dangerous or not. I'm going to town either way. I'm looking for someone. I'm looking for someone. Someone very important to me. I'm looking for Mary. Have you seen her? Without Mary, I just can't go on. I'd do anything if I could be with her again. I'm going to go look for her. I wish I knew. I killed her. Three years ago. Last year. But I got a letter from her. I got a letter from her. How do you know about Mary? You really seem to care about her. Is that why you're here too? You're not Mary. You're really not Mary. You're alive! I thought that thing killed you. Are you hurt bad? Your face, your voice, just your hair and... I was confused. There are all sorts of strange things around here. This is no place for a kid. Eddie told me. Who's Rachel? What's that letter? It's time to end this nightmare. What the hell is it? I didn't come here to play, you know. You liar! Don't be ridiculous. How can you sit there and eat pizza? You! It was you, wasn't it? You're the one who stepped on my hand. I'm done with you. Forget you. Someone very important to me. You're not Mary.",
|
4 |
+
"segments": [
|
5 |
+
{
|
6 |
+
"id": 0,
|
7 |
+
"seek": 0,
|
8 |
+
"start": 0.0,
|
9 |
+
"end": 7.0,
|
10 |
+
"text": " I'm kind of lost. I'm looking for Silent Hill. Silent Hill? Is this the right way?",
|
11 |
+
"tokens": [
|
12 |
+
314,
|
13 |
+
1101,
|
14 |
+
1611,
|
15 |
+
286,
|
16 |
+
2626,
|
17 |
+
13,
|
18 |
+
314,
|
19 |
+
1101,
|
20 |
+
2045,
|
21 |
+
329,
|
22 |
+
25083,
|
23 |
+
3327,
|
24 |
+
13,
|
25 |
+
25083,
|
26 |
+
3327,
|
27 |
+
30,
|
28 |
+
1148,
|
29 |
+
428,
|
30 |
+
262,
|
31 |
+
826,
|
32 |
+
835,
|
33 |
+
30
|
34 |
+
],
|
35 |
+
"temperature": 0.0,
|
36 |
+
"avg_logprob": -0.13657650896297988,
|
37 |
+
"compression_ratio": 1.6756756756756757,
|
38 |
+
"no_speech_prob": 0.0679725632071495
|
39 |
+
},
|
40 |
+
{
|
41 |
+
"id": 1,
|
42 |
+
"seek": 0,
|
43 |
+
"start": 7.0,
|
44 |
+
"end": 16.0,
|
45 |
+
"text": " Well, there's the hotel 2, I guess. There's the hotel 2, I guess. The one on the lake? I wonder if it's still there.",
|
46 |
+
"tokens": [
|
47 |
+
3894,
|
48 |
+
11,
|
49 |
+
612,
|
50 |
+
338,
|
51 |
+
262,
|
52 |
+
7541,
|
53 |
+
362,
|
54 |
+
11,
|
55 |
+
314,
|
56 |
+
4724,
|
57 |
+
13,
|
58 |
+
1318,
|
59 |
+
338,
|
60 |
+
262,
|
61 |
+
7541,
|
62 |
+
362,
|
63 |
+
11,
|
64 |
+
314,
|
65 |
+
4724,
|
66 |
+
13,
|
67 |
+
383,
|
68 |
+
530,
|
69 |
+
319,
|
70 |
+
262,
|
71 |
+
13546,
|
72 |
+
30,
|
73 |
+
314,
|
74 |
+
4240,
|
75 |
+
611,
|
76 |
+
340,
|
77 |
+
338,
|
78 |
+
991,
|
79 |
+
612,
|
80 |
+
13
|
81 |
+
],
|
82 |
+
"temperature": 0.0,
|
83 |
+
"avg_logprob": -0.13657650896297988,
|
84 |
+
"compression_ratio": 1.6756756756756757,
|
85 |
+
"no_speech_prob": 0.0679725632071495
|
86 |
+
},
|
87 |
+
{
|
88 |
+
"id": 2,
|
89 |
+
"seek": 0,
|
90 |
+
"start": 16.0,
|
91 |
+
"end": 25.0,
|
92 |
+
"text": " You're coming with me? Is it dangerous? I'll be careful. I guess I really don't care if it's dangerous or not.",
|
93 |
+
"tokens": [
|
94 |
+
921,
|
95 |
+
821,
|
96 |
+
2406,
|
97 |
+
351,
|
98 |
+
502,
|
99 |
+
30,
|
100 |
+
1148,
|
101 |
+
340,
|
102 |
+
4923,
|
103 |
+
30,
|
104 |
+
314,
|
105 |
+
1183,
|
106 |
+
307,
|
107 |
+
8161,
|
108 |
+
13,
|
109 |
+
314,
|
110 |
+
4724,
|
111 |
+
314,
|
112 |
+
1107,
|
113 |
+
836,
|
114 |
+
470,
|
115 |
+
1337,
|
116 |
+
611,
|
117 |
+
340,
|
118 |
+
338,
|
119 |
+
4923,
|
120 |
+
393,
|
121 |
+
407,
|
122 |
+
13
|
123 |
+
],
|
124 |
+
"temperature": 0.0,
|
125 |
+
"avg_logprob": -0.13657650896297988,
|
126 |
+
"compression_ratio": 1.6756756756756757,
|
127 |
+
"no_speech_prob": 0.0679725632071495
|
128 |
+
},
|
129 |
+
{
|
130 |
+
"id": 3,
|
131 |
+
"seek": 2500,
|
132 |
+
"start": 25.0,
|
133 |
+
"end": 36.0,
|
134 |
+
"text": " I'm going to town either way. I'm looking for someone. I'm looking for someone. Someone very important to me.",
|
135 |
+
"tokens": [
|
136 |
+
314,
|
137 |
+
1101,
|
138 |
+
1016,
|
139 |
+
284,
|
140 |
+
3240,
|
141 |
+
2035,
|
142 |
+
835,
|
143 |
+
13,
|
144 |
+
314,
|
145 |
+
1101,
|
146 |
+
2045,
|
147 |
+
329,
|
148 |
+
2130,
|
149 |
+
13,
|
150 |
+
314,
|
151 |
+
1101,
|
152 |
+
2045,
|
153 |
+
329,
|
154 |
+
2130,
|
155 |
+
13,
|
156 |
+
17877,
|
157 |
+
845,
|
158 |
+
1593,
|
159 |
+
284,
|
160 |
+
502,
|
161 |
+
13
|
162 |
+
],
|
163 |
+
"temperature": 0.0,
|
164 |
+
"avg_logprob": -0.07823550926064546,
|
165 |
+
"compression_ratio": 1.4959349593495934,
|
166 |
+
"no_speech_prob": 3.0241180866141804e-05
|
167 |
+
},
|
168 |
+
{
|
169 |
+
"id": 4,
|
170 |
+
"seek": 2500,
|
171 |
+
"start": 36.0,
|
172 |
+
"end": 45.0,
|
173 |
+
"text": " I'm looking for Mary. Have you seen her? Without Mary, I just can't go on.",
|
174 |
+
"tokens": [
|
175 |
+
314,
|
176 |
+
1101,
|
177 |
+
2045,
|
178 |
+
329,
|
179 |
+
5335,
|
180 |
+
13,
|
181 |
+
8192,
|
182 |
+
345,
|
183 |
+
1775,
|
184 |
+
607,
|
185 |
+
30,
|
186 |
+
9170,
|
187 |
+
5335,
|
188 |
+
11,
|
189 |
+
314,
|
190 |
+
655,
|
191 |
+
460,
|
192 |
+
470,
|
193 |
+
467,
|
194 |
+
319,
|
195 |
+
13
|
196 |
+
],
|
197 |
+
"temperature": 0.0,
|
198 |
+
"avg_logprob": -0.07823550926064546,
|
199 |
+
"compression_ratio": 1.4959349593495934,
|
200 |
+
"no_speech_prob": 3.0241180866141804e-05
|
201 |
+
},
|
202 |
+
{
|
203 |
+
"id": 5,
|
204 |
+
"seek": 4500,
|
205 |
+
"start": 45.0,
|
206 |
+
"end": 56.0,
|
207 |
+
"text": " I'd do anything if I could be with her again. I'm going to go look for her. I wish I knew. I killed her. Three years ago.",
|
208 |
+
"tokens": [
|
209 |
+
314,
|
210 |
+
1549,
|
211 |
+
466,
|
212 |
+
1997,
|
213 |
+
611,
|
214 |
+
314,
|
215 |
+
714,
|
216 |
+
307,
|
217 |
+
351,
|
218 |
+
607,
|
219 |
+
757,
|
220 |
+
13,
|
221 |
+
314,
|
222 |
+
1101,
|
223 |
+
1016,
|
224 |
+
284,
|
225 |
+
467,
|
226 |
+
804,
|
227 |
+
329,
|
228 |
+
607,
|
229 |
+
13,
|
230 |
+
314,
|
231 |
+
4601,
|
232 |
+
314,
|
233 |
+
2993,
|
234 |
+
13,
|
235 |
+
314,
|
236 |
+
2923,
|
237 |
+
607,
|
238 |
+
13,
|
239 |
+
7683,
|
240 |
+
812,
|
241 |
+
2084,
|
242 |
+
13
|
243 |
+
],
|
244 |
+
"temperature": 0.0,
|
245 |
+
"avg_logprob": -0.06976071449175272,
|
246 |
+
"compression_ratio": 1.5182926829268293,
|
247 |
+
"no_speech_prob": 0.00030994918779470026
|
248 |
+
},
|
249 |
+
{
|
250 |
+
"id": 6,
|
251 |
+
"seek": 4500,
|
252 |
+
"start": 56.0,
|
253 |
+
"end": 65.0,
|
254 |
+
"text": " Last year. But I got a letter from her. I got a letter from her. How do you know about Mary? You really seem to care about her.",
|
255 |
+
"tokens": [
|
256 |
+
4586,
|
257 |
+
614,
|
258 |
+
13,
|
259 |
+
887,
|
260 |
+
314,
|
261 |
+
1392,
|
262 |
+
257,
|
263 |
+
3850,
|
264 |
+
422,
|
265 |
+
607,
|
266 |
+
13,
|
267 |
+
314,
|
268 |
+
1392,
|
269 |
+
257,
|
270 |
+
3850,
|
271 |
+
422,
|
272 |
+
607,
|
273 |
+
13,
|
274 |
+
1374,
|
275 |
+
466,
|
276 |
+
345,
|
277 |
+
760,
|
278 |
+
546,
|
279 |
+
5335,
|
280 |
+
30,
|
281 |
+
921,
|
282 |
+
1107,
|
283 |
+
1283,
|
284 |
+
284,
|
285 |
+
1337,
|
286 |
+
546,
|
287 |
+
607,
|
288 |
+
13
|
289 |
+
],
|
290 |
+
"temperature": 0.0,
|
291 |
+
"avg_logprob": -0.06976071449175272,
|
292 |
+
"compression_ratio": 1.5182926829268293,
|
293 |
+
"no_speech_prob": 0.00030994918779470026
|
294 |
+
},
|
295 |
+
{
|
296 |
+
"id": 7,
|
297 |
+
"seek": 6500,
|
298 |
+
"start": 65.0,
|
299 |
+
"end": 77.0,
|
300 |
+
"text": " Is that why you're here too? You're not Mary. You're really not Mary. You're alive! I thought that thing killed you. Are you hurt bad?",
|
301 |
+
"tokens": [
|
302 |
+
1148,
|
303 |
+
326,
|
304 |
+
1521,
|
305 |
+
345,
|
306 |
+
821,
|
307 |
+
994,
|
308 |
+
1165,
|
309 |
+
30,
|
310 |
+
921,
|
311 |
+
821,
|
312 |
+
407,
|
313 |
+
5335,
|
314 |
+
13,
|
315 |
+
921,
|
316 |
+
821,
|
317 |
+
1107,
|
318 |
+
407,
|
319 |
+
5335,
|
320 |
+
13,
|
321 |
+
921,
|
322 |
+
821,
|
323 |
+
6776,
|
324 |
+
0,
|
325 |
+
314,
|
326 |
+
1807,
|
327 |
+
326,
|
328 |
+
1517,
|
329 |
+
2923,
|
330 |
+
345,
|
331 |
+
13,
|
332 |
+
4231,
|
333 |
+
345,
|
334 |
+
5938,
|
335 |
+
2089,
|
336 |
+
30
|
337 |
+
],
|
338 |
+
"temperature": 0.0,
|
339 |
+
"avg_logprob": -0.09471903425274474,
|
340 |
+
"compression_ratio": 1.50920245398773,
|
341 |
+
"no_speech_prob": 0.0003512969706207514
|
342 |
+
},
|
343 |
+
{
|
344 |
+
"id": 8,
|
345 |
+
"seek": 6500,
|
346 |
+
"start": 77.0,
|
347 |
+
"end": 87.0,
|
348 |
+
"text": " Your face, your voice, just your hair and... I was confused. There are all sorts of strange things around here.",
|
349 |
+
"tokens": [
|
350 |
+
3406,
|
351 |
+
1986,
|
352 |
+
11,
|
353 |
+
534,
|
354 |
+
3809,
|
355 |
+
11,
|
356 |
+
655,
|
357 |
+
534,
|
358 |
+
4190,
|
359 |
+
290,
|
360 |
+
986,
|
361 |
+
314,
|
362 |
+
373,
|
363 |
+
10416,
|
364 |
+
13,
|
365 |
+
1318,
|
366 |
+
389,
|
367 |
+
477,
|
368 |
+
10524,
|
369 |
+
286,
|
370 |
+
6283,
|
371 |
+
1243,
|
372 |
+
1088,
|
373 |
+
994,
|
374 |
+
13
|
375 |
+
],
|
376 |
+
"temperature": 0.0,
|
377 |
+
"avg_logprob": -0.09471903425274474,
|
378 |
+
"compression_ratio": 1.50920245398773,
|
379 |
+
"no_speech_prob": 0.0003512969706207514
|
380 |
+
},
|
381 |
+
{
|
382 |
+
"id": 9,
|
383 |
+
"seek": 8700,
|
384 |
+
"start": 87.0,
|
385 |
+
"end": 97.0,
|
386 |
+
"text": " This is no place for a kid. Eddie told me. Who's Rachel? What's that letter? It's time to end this nightmare.",
|
387 |
+
"tokens": [
|
388 |
+
770,
|
389 |
+
318,
|
390 |
+
645,
|
391 |
+
1295,
|
392 |
+
329,
|
393 |
+
257,
|
394 |
+
5141,
|
395 |
+
13,
|
396 |
+
19478,
|
397 |
+
1297,
|
398 |
+
502,
|
399 |
+
13,
|
400 |
+
5338,
|
401 |
+
338,
|
402 |
+
15984,
|
403 |
+
30,
|
404 |
+
1867,
|
405 |
+
338,
|
406 |
+
326,
|
407 |
+
3850,
|
408 |
+
30,
|
409 |
+
632,
|
410 |
+
338,
|
411 |
+
640,
|
412 |
+
284,
|
413 |
+
886,
|
414 |
+
428,
|
415 |
+
17123,
|
416 |
+
13
|
417 |
+
],
|
418 |
+
"temperature": 0.0,
|
419 |
+
"avg_logprob": -0.050474664439325745,
|
420 |
+
"compression_ratio": 1.4047619047619047,
|
421 |
+
"no_speech_prob": 1.406333740305854e-05
|
422 |
+
},
|
423 |
+
{
|
424 |
+
"id": 10,
|
425 |
+
"seek": 8700,
|
426 |
+
"start": 97.0,
|
427 |
+
"end": 107.0,
|
428 |
+
"text": " What the hell is it? I didn't come here to play, you know. You liar! Don't be ridiculous. How can you sit there and eat pizza?",
|
429 |
+
"tokens": [
|
430 |
+
1867,
|
431 |
+
262,
|
432 |
+
5968,
|
433 |
+
318,
|
434 |
+
340,
|
435 |
+
30,
|
436 |
+
314,
|
437 |
+
1422,
|
438 |
+
470,
|
439 |
+
1282,
|
440 |
+
994,
|
441 |
+
284,
|
442 |
+
711,
|
443 |
+
11,
|
444 |
+
345,
|
445 |
+
760,
|
446 |
+
13,
|
447 |
+
921,
|
448 |
+
31866,
|
449 |
+
0,
|
450 |
+
2094,
|
451 |
+
470,
|
452 |
+
307,
|
453 |
+
11441,
|
454 |
+
13,
|
455 |
+
1374,
|
456 |
+
460,
|
457 |
+
345,
|
458 |
+
1650,
|
459 |
+
612,
|
460 |
+
290,
|
461 |
+
4483,
|
462 |
+
14256,
|
463 |
+
30
|
464 |
+
],
|
465 |
+
"temperature": 0.0,
|
466 |
+
"avg_logprob": -0.050474664439325745,
|
467 |
+
"compression_ratio": 1.4047619047619047,
|
468 |
+
"no_speech_prob": 1.406333740305854e-05
|
469 |
+
},
|
470 |
+
{
|
471 |
+
"id": 11,
|
472 |
+
"seek": 10700,
|
473 |
+
"start": 107.0,
|
474 |
+
"end": 122.0,
|
475 |
+
"text": " You! It was you, wasn't it? You're the one who stepped on my hand. I'm done with you. Forget you. Someone very important to me. You're not Mary.",
|
476 |
+
"tokens": [
|
477 |
+
50363,
|
478 |
+
921,
|
479 |
+
0,
|
480 |
+
632,
|
481 |
+
373,
|
482 |
+
345,
|
483 |
+
11,
|
484 |
+
2492,
|
485 |
+
470,
|
486 |
+
340,
|
487 |
+
30,
|
488 |
+
921,
|
489 |
+
821,
|
490 |
+
262,
|
491 |
+
530,
|
492 |
+
508,
|
493 |
+
10764,
|
494 |
+
319,
|
495 |
+
616,
|
496 |
+
1021,
|
497 |
+
13,
|
498 |
+
314,
|
499 |
+
1101,
|
500 |
+
1760,
|
501 |
+
351,
|
502 |
+
345,
|
503 |
+
13,
|
504 |
+
29624,
|
505 |
+
345,
|
506 |
+
13,
|
507 |
+
17877,
|
508 |
+
845,
|
509 |
+
1593,
|
510 |
+
284,
|
511 |
+
502,
|
512 |
+
13,
|
513 |
+
921,
|
514 |
+
821,
|
515 |
+
407,
|
516 |
+
5335,
|
517 |
+
13,
|
518 |
+
51113
|
519 |
+
],
|
520 |
+
"temperature": 0.0,
|
521 |
+
"avg_logprob": -0.07767114528389864,
|
522 |
+
"compression_ratio": 1.2307692307692308,
|
523 |
+
"no_speech_prob": 2.5464909413130954e-05
|
524 |
+
}
|
525 |
+
],
|
526 |
+
"language": "en"
|
527 |
+
},
|
528 |
+
"ynoeld.wav": {
|
529 |
+
"text": " It's you. It's you. But I don't need you anymore. How old are you? Are you still here? Are you okay? What happened to you? We met in the apartment building. We met in the apartment building. Sure is quiet here, huh? What are you doing, Laura? Aren't you Maria? So, you're Maria? You're Maria? What's a little girl like you doing here, anyway? I didn't mean to scare you. Are you alone here, Eddie? James Sunderland. James. My name's James. Eddie? Laura? Laura. Maria? Maria. Mary? Mary? Mary? Is that her name? Who is that girl, anyhow? Yeah. Yeah. Yes! Okay. That's right. Oh, yeah. I understand now. I believe you. No. No. No, I... No, you're not. Nothing. Oh, nothing. I guess I really don't care. I don't know. Sorry. What? Do what? Tell me what happened. Why can't you just tell me? All I want from you is an answer. How do you know about that? Is there any other way? Don't you remember? Later, okay? Stay right there. I'll be there soon. I'll be there soon. Thanks.",
|
530 |
+
"segments": [
|
531 |
+
{
|
532 |
+
"id": 0,
|
533 |
+
"seek": 0,
|
534 |
+
"start": 0.0,
|
535 |
+
"end": 5.0,
|
536 |
+
"text": " It's you. It's you. But I don't need you anymore.",
|
537 |
+
"tokens": [
|
538 |
+
632,
|
539 |
+
338,
|
540 |
+
345,
|
541 |
+
13,
|
542 |
+
632,
|
543 |
+
338,
|
544 |
+
345,
|
545 |
+
13,
|
546 |
+
887,
|
547 |
+
314,
|
548 |
+
836,
|
549 |
+
470,
|
550 |
+
761,
|
551 |
+
345,
|
552 |
+
7471,
|
553 |
+
13
|
554 |
+
],
|
555 |
+
"temperature": 0.0,
|
556 |
+
"avg_logprob": -0.153718864216524,
|
557 |
+
"compression_ratio": 1.7720207253886011,
|
558 |
+
"no_speech_prob": 0.13705560564994812
|
559 |
+
},
|
560 |
+
{
|
561 |
+
"id": 1,
|
562 |
+
"seek": 0,
|
563 |
+
"start": 5.0,
|
564 |
+
"end": 11.0,
|
565 |
+
"text": " How old are you? Are you still here? Are you okay? What happened to you?",
|
566 |
+
"tokens": [
|
567 |
+
1374,
|
568 |
+
1468,
|
569 |
+
389,
|
570 |
+
345,
|
571 |
+
30,
|
572 |
+
4231,
|
573 |
+
345,
|
574 |
+
991,
|
575 |
+
994,
|
576 |
+
30,
|
577 |
+
4231,
|
578 |
+
345,
|
579 |
+
8788,
|
580 |
+
30,
|
581 |
+
1867,
|
582 |
+
3022,
|
583 |
+
284,
|
584 |
+
345,
|
585 |
+
30
|
586 |
+
],
|
587 |
+
"temperature": 0.0,
|
588 |
+
"avg_logprob": -0.153718864216524,
|
589 |
+
"compression_ratio": 1.7720207253886011,
|
590 |
+
"no_speech_prob": 0.13705560564994812
|
591 |
+
},
|
592 |
+
{
|
593 |
+
"id": 2,
|
594 |
+
"seek": 0,
|
595 |
+
"start": 11.0,
|
596 |
+
"end": 18.0,
|
597 |
+
"text": " We met in the apartment building. We met in the apartment building. Sure is quiet here, huh?",
|
598 |
+
"tokens": [
|
599 |
+
775,
|
600 |
+
1138,
|
601 |
+
287,
|
602 |
+
262,
|
603 |
+
7962,
|
604 |
+
2615,
|
605 |
+
13,
|
606 |
+
775,
|
607 |
+
1138,
|
608 |
+
287,
|
609 |
+
262,
|
610 |
+
7962,
|
611 |
+
2615,
|
612 |
+
13,
|
613 |
+
10889,
|
614 |
+
318,
|
615 |
+
5897,
|
616 |
+
994,
|
617 |
+
11,
|
618 |
+
24926,
|
619 |
+
30
|
620 |
+
],
|
621 |
+
"temperature": 0.0,
|
622 |
+
"avg_logprob": -0.153718864216524,
|
623 |
+
"compression_ratio": 1.7720207253886011,
|
624 |
+
"no_speech_prob": 0.13705560564994812
|
625 |
+
},
|
626 |
+
{
|
627 |
+
"id": 3,
|
628 |
+
"seek": 0,
|
629 |
+
"start": 18.0,
|
630 |
+
"end": 22.0,
|
631 |
+
"text": " What are you doing, Laura? Aren't you Maria?",
|
632 |
+
"tokens": [
|
633 |
+
1867,
|
634 |
+
389,
|
635 |
+
345,
|
636 |
+
1804,
|
637 |
+
11,
|
638 |
+
16753,
|
639 |
+
30,
|
640 |
+
9843,
|
641 |
+
470,
|
642 |
+
345,
|
643 |
+
14200,
|
644 |
+
30
|
645 |
+
],
|
646 |
+
"temperature": 0.0,
|
647 |
+
"avg_logprob": -0.153718864216524,
|
648 |
+
"compression_ratio": 1.7720207253886011,
|
649 |
+
"no_speech_prob": 0.13705560564994812
|
650 |
+
},
|
651 |
+
{
|
652 |
+
"id": 4,
|
653 |
+
"seek": 0,
|
654 |
+
"start": 22.0,
|
655 |
+
"end": 29.0,
|
656 |
+
"text": " So, you're Maria? You're Maria? What's a little girl like you doing here, anyway?",
|
657 |
+
"tokens": [
|
658 |
+
1406,
|
659 |
+
11,
|
660 |
+
345,
|
661 |
+
821,
|
662 |
+
14200,
|
663 |
+
30,
|
664 |
+
921,
|
665 |
+
821,
|
666 |
+
14200,
|
667 |
+
30,
|
668 |
+
1867,
|
669 |
+
338,
|
670 |
+
257,
|
671 |
+
1310,
|
672 |
+
2576,
|
673 |
+
588,
|
674 |
+
345,
|
675 |
+
1804,
|
676 |
+
994,
|
677 |
+
11,
|
678 |
+
6949,
|
679 |
+
30
|
680 |
+
],
|
681 |
+
"temperature": 0.0,
|
682 |
+
"avg_logprob": -0.153718864216524,
|
683 |
+
"compression_ratio": 1.7720207253886011,
|
684 |
+
"no_speech_prob": 0.13705560564994812
|
685 |
+
},
|
686 |
+
{
|
687 |
+
"id": 5,
|
688 |
+
"seek": 2900,
|
689 |
+
"start": 29.0,
|
690 |
+
"end": 33.0,
|
691 |
+
"text": " I didn't mean to scare you. Are you alone here, Eddie?",
|
692 |
+
"tokens": [
|
693 |
+
314,
|
694 |
+
1422,
|
695 |
+
470,
|
696 |
+
1612,
|
697 |
+
284,
|
698 |
+
19437,
|
699 |
+
345,
|
700 |
+
13,
|
701 |
+
4231,
|
702 |
+
345,
|
703 |
+
3436,
|
704 |
+
994,
|
705 |
+
11,
|
706 |
+
19478,
|
707 |
+
30
|
708 |
+
],
|
709 |
+
"temperature": 0.0,
|
710 |
+
"avg_logprob": -0.14054276393010065,
|
711 |
+
"compression_ratio": 1.5032679738562091,
|
712 |
+
"no_speech_prob": 1.9525503375916742e-05
|
713 |
+
},
|
714 |
+
{
|
715 |
+
"id": 6,
|
716 |
+
"seek": 2900,
|
717 |
+
"start": 33.0,
|
718 |
+
"end": 38.0,
|
719 |
+
"text": " James Sunderland. James. My name's James.",
|
720 |
+
"tokens": [
|
721 |
+
3700,
|
722 |
+
35706,
|
723 |
+
13,
|
724 |
+
3700,
|
725 |
+
13,
|
726 |
+
2011,
|
727 |
+
1438,
|
728 |
+
338,
|
729 |
+
3700,
|
730 |
+
13
|
731 |
+
],
|
732 |
+
"temperature": 0.0,
|
733 |
+
"avg_logprob": -0.14054276393010065,
|
734 |
+
"compression_ratio": 1.5032679738562091,
|
735 |
+
"no_speech_prob": 1.9525503375916742e-05
|
736 |
+
},
|
737 |
+
{
|
738 |
+
"id": 7,
|
739 |
+
"seek": 2900,
|
740 |
+
"start": 38.0,
|
741 |
+
"end": 48.0,
|
742 |
+
"text": " Eddie? Laura? Laura. Maria? Maria. Mary? Mary? Mary?",
|
743 |
+
"tokens": [
|
744 |
+
19478,
|
745 |
+
30,
|
746 |
+
16753,
|
747 |
+
30,
|
748 |
+
16753,
|
749 |
+
13,
|
750 |
+
14200,
|
751 |
+
30,
|
752 |
+
14200,
|
753 |
+
13,
|
754 |
+
5335,
|
755 |
+
30,
|
756 |
+
5335,
|
757 |
+
30,
|
758 |
+
5335,
|
759 |
+
30
|
760 |
+
],
|
761 |
+
"temperature": 0.0,
|
762 |
+
"avg_logprob": -0.14054276393010065,
|
763 |
+
"compression_ratio": 1.5032679738562091,
|
764 |
+
"no_speech_prob": 1.9525503375916742e-05
|
765 |
+
},
|
766 |
+
{
|
767 |
+
"id": 8,
|
768 |
+
"seek": 2900,
|
769 |
+
"start": 48.0,
|
770 |
+
"end": 52.0,
|
771 |
+
"text": " Is that her name? Who is that girl, anyhow?",
|
772 |
+
"tokens": [
|
773 |
+
1148,
|
774 |
+
326,
|
775 |
+
607,
|
776 |
+
1438,
|
777 |
+
30,
|
778 |
+
5338,
|
779 |
+
318,
|
780 |
+
326,
|
781 |
+
2576,
|
782 |
+
11,
|
783 |
+
597,
|
784 |
+
4919,
|
785 |
+
30
|
786 |
+
],
|
787 |
+
"temperature": 0.0,
|
788 |
+
"avg_logprob": -0.14054276393010065,
|
789 |
+
"compression_ratio": 1.5032679738562091,
|
790 |
+
"no_speech_prob": 1.9525503375916742e-05
|
791 |
+
},
|
792 |
+
{
|
793 |
+
"id": 9,
|
794 |
+
"seek": 2900,
|
795 |
+
"start": 52.0,
|
796 |
+
"end": 57.0,
|
797 |
+
"text": " Yeah. Yeah. Yes! Okay. That's right.",
|
798 |
+
"tokens": [
|
799 |
+
9425,
|
800 |
+
13,
|
801 |
+
9425,
|
802 |
+
13,
|
803 |
+
3363,
|
804 |
+
0,
|
805 |
+
16805,
|
806 |
+
13,
|
807 |
+
1320,
|
808 |
+
338,
|
809 |
+
826,
|
810 |
+
13
|
811 |
+
],
|
812 |
+
"temperature": 0.0,
|
813 |
+
"avg_logprob": -0.14054276393010065,
|
814 |
+
"compression_ratio": 1.5032679738562091,
|
815 |
+
"no_speech_prob": 1.9525503375916742e-05
|
816 |
+
},
|
817 |
+
{
|
818 |
+
"id": 10,
|
819 |
+
"seek": 5700,
|
820 |
+
"start": 57.0,
|
821 |
+
"end": 61.0,
|
822 |
+
"text": " Oh, yeah. I understand now. I believe you.",
|
823 |
+
"tokens": [
|
824 |
+
3966,
|
825 |
+
11,
|
826 |
+
10194,
|
827 |
+
13,
|
828 |
+
314,
|
829 |
+
1833,
|
830 |
+
783,
|
831 |
+
13,
|
832 |
+
314,
|
833 |
+
1975,
|
834 |
+
345,
|
835 |
+
13
|
836 |
+
],
|
837 |
+
"temperature": 0.0,
|
838 |
+
"avg_logprob": -0.09678743459001372,
|
839 |
+
"compression_ratio": 1.42,
|
840 |
+
"no_speech_prob": 6.1439545788744e-06
|
841 |
+
},
|
842 |
+
{
|
843 |
+
"id": 11,
|
844 |
+
"seek": 5700,
|
845 |
+
"start": 61.0,
|
846 |
+
"end": 68.0,
|
847 |
+
"text": " No. No. No, I... No, you're not.",
|
848 |
+
"tokens": [
|
849 |
+
1400,
|
850 |
+
13,
|
851 |
+
1400,
|
852 |
+
13,
|
853 |
+
1400,
|
854 |
+
11,
|
855 |
+
314,
|
856 |
+
986,
|
857 |
+
1400,
|
858 |
+
11,
|
859 |
+
345,
|
860 |
+
821,
|
861 |
+
407,
|
862 |
+
13
|
863 |
+
],
|
864 |
+
"temperature": 0.0,
|
865 |
+
"avg_logprob": -0.09678743459001372,
|
866 |
+
"compression_ratio": 1.42,
|
867 |
+
"no_speech_prob": 6.1439545788744e-06
|
868 |
+
},
|
869 |
+
{
|
870 |
+
"id": 12,
|
871 |
+
"seek": 5700,
|
872 |
+
"start": 68.0,
|
873 |
+
"end": 72.0,
|
874 |
+
"text": " Nothing. Oh, nothing. I guess I really don't care.",
|
875 |
+
"tokens": [
|
876 |
+
10528,
|
877 |
+
13,
|
878 |
+
3966,
|
879 |
+
11,
|
880 |
+
2147,
|
881 |
+
13,
|
882 |
+
314,
|
883 |
+
4724,
|
884 |
+
314,
|
885 |
+
1107,
|
886 |
+
836,
|
887 |
+
470,
|
888 |
+
1337,
|
889 |
+
13
|
890 |
+
],
|
891 |
+
"temperature": 0.0,
|
892 |
+
"avg_logprob": -0.09678743459001372,
|
893 |
+
"compression_ratio": 1.42,
|
894 |
+
"no_speech_prob": 6.1439545788744e-06
|
895 |
+
},
|
896 |
+
{
|
897 |
+
"id": 13,
|
898 |
+
"seek": 5700,
|
899 |
+
"start": 72.0,
|
900 |
+
"end": 77.0,
|
901 |
+
"text": " I don't know. Sorry.",
|
902 |
+
"tokens": [
|
903 |
+
314,
|
904 |
+
836,
|
905 |
+
470,
|
906 |
+
760,
|
907 |
+
13,
|
908 |
+
19061,
|
909 |
+
13
|
910 |
+
],
|
911 |
+
"temperature": 0.0,
|
912 |
+
"avg_logprob": -0.09678743459001372,
|
913 |
+
"compression_ratio": 1.42,
|
914 |
+
"no_speech_prob": 6.1439545788744e-06
|
915 |
+
},
|
916 |
+
{
|
917 |
+
"id": 14,
|
918 |
+
"seek": 5700,
|
919 |
+
"start": 77.0,
|
920 |
+
"end": 81.0,
|
921 |
+
"text": " What? Do what? Tell me what happened.",
|
922 |
+
"tokens": [
|
923 |
+
1867,
|
924 |
+
30,
|
925 |
+
2141,
|
926 |
+
644,
|
927 |
+
30,
|
928 |
+
14026,
|
929 |
+
502,
|
930 |
+
644,
|
931 |
+
3022,
|
932 |
+
13
|
933 |
+
],
|
934 |
+
"temperature": 0.0,
|
935 |
+
"avg_logprob": -0.09678743459001372,
|
936 |
+
"compression_ratio": 1.42,
|
937 |
+
"no_speech_prob": 6.1439545788744e-06
|
938 |
+
},
|
939 |
+
{
|
940 |
+
"id": 15,
|
941 |
+
"seek": 5700,
|
942 |
+
"start": 81.0,
|
943 |
+
"end": 83.0,
|
944 |
+
"text": " Why can't you just tell me?",
|
945 |
+
"tokens": [
|
946 |
+
4162,
|
947 |
+
460,
|
948 |
+
470,
|
949 |
+
345,
|
950 |
+
655,
|
951 |
+
1560,
|
952 |
+
502,
|
953 |
+
30
|
954 |
+
],
|
955 |
+
"temperature": 0.0,
|
956 |
+
"avg_logprob": -0.09678743459001372,
|
957 |
+
"compression_ratio": 1.42,
|
958 |
+
"no_speech_prob": 6.1439545788744e-06
|
959 |
+
},
|
960 |
+
{
|
961 |
+
"id": 16,
|
962 |
+
"seek": 8300,
|
963 |
+
"start": 83.0,
|
964 |
+
"end": 88.0,
|
965 |
+
"text": " All I want from you is an answer. How do you know about that?",
|
966 |
+
"tokens": [
|
967 |
+
1439,
|
968 |
+
314,
|
969 |
+
765,
|
970 |
+
422,
|
971 |
+
345,
|
972 |
+
318,
|
973 |
+
281,
|
974 |
+
3280,
|
975 |
+
13,
|
976 |
+
1374,
|
977 |
+
466,
|
978 |
+
345,
|
979 |
+
760,
|
980 |
+
546,
|
981 |
+
326,
|
982 |
+
30
|
983 |
+
],
|
984 |
+
"temperature": 0.0,
|
985 |
+
"avg_logprob": -0.04557831534023943,
|
986 |
+
"compression_ratio": 1.3834586466165413,
|
987 |
+
"no_speech_prob": 1.7880429368233308e-06
|
988 |
+
},
|
989 |
+
{
|
990 |
+
"id": 17,
|
991 |
+
"seek": 8300,
|
992 |
+
"start": 88.0,
|
993 |
+
"end": 91.0,
|
994 |
+
"text": " Is there any other way? Don't you remember?",
|
995 |
+
"tokens": [
|
996 |
+
1148,
|
997 |
+
612,
|
998 |
+
597,
|
999 |
+
584,
|
1000 |
+
835,
|
1001 |
+
30,
|
1002 |
+
2094,
|
1003 |
+
470,
|
1004 |
+
345,
|
1005 |
+
3505,
|
1006 |
+
30
|
1007 |
+
],
|
1008 |
+
"temperature": 0.0,
|
1009 |
+
"avg_logprob": -0.04557831534023943,
|
1010 |
+
"compression_ratio": 1.3834586466165413,
|
1011 |
+
"no_speech_prob": 1.7880429368233308e-06
|
1012 |
+
},
|
1013 |
+
{
|
1014 |
+
"id": 18,
|
1015 |
+
"seek": 8300,
|
1016 |
+
"start": 91.0,
|
1017 |
+
"end": 93.0,
|
1018 |
+
"text": " Later, okay?",
|
1019 |
+
"tokens": [
|
1020 |
+
11450,
|
1021 |
+
11,
|
1022 |
+
8788,
|
1023 |
+
30
|
1024 |
+
],
|
1025 |
+
"temperature": 0.0,
|
1026 |
+
"avg_logprob": -0.04557831534023943,
|
1027 |
+
"compression_ratio": 1.3834586466165413,
|
1028 |
+
"no_speech_prob": 1.7880429368233308e-06
|
1029 |
+
},
|
1030 |
+
{
|
1031 |
+
"id": 19,
|
1032 |
+
"seek": 9300,
|
1033 |
+
"start": 93.0,
|
1034 |
+
"end": 114.0,
|
1035 |
+
"text": " Stay right there. I'll be there soon. I'll be there soon. Thanks.",
|
1036 |
+
"tokens": [
|
1037 |
+
50363,
|
1038 |
+
16160,
|
1039 |
+
826,
|
1040 |
+
612,
|
1041 |
+
13,
|
1042 |
+
314,
|
1043 |
+
1183,
|
1044 |
+
307,
|
1045 |
+
612,
|
1046 |
+
2582,
|
1047 |
+
13,
|
1048 |
+
314,
|
1049 |
+
1183,
|
1050 |
+
307,
|
1051 |
+
612,
|
1052 |
+
2582,
|
1053 |
+
13,
|
1054 |
+
6930,
|
1055 |
+
13,
|
1056 |
+
51413
|
1057 |
+
],
|
1058 |
+
"temperature": 0.0,
|
1059 |
+
"avg_logprob": -0.10187114988054548,
|
1060 |
+
"compression_ratio": 1.3265306122448979,
|
1061 |
+
"no_speech_prob": 5.649423474096693e-05
|
1062 |
+
}
|
1063 |
+
],
|
1064 |
+
"language": "en"
|
1065 |
+
}
|
1066 |
+
}
|
finetunes/james-sunderland/dataset/ynoeld_00000.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b31614e30137738984716d1943a56d66487b35310926730882a9ef272da8e09e
|
3 |
+
size 882080
|
finetunes/james-sunderland/dataset/ynoeld_00001.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98bea197bffbfe02cbfc09e02243709e87a11d65b279a3a1485c671f5e251a6c
|
3 |
+
size 1058480
|
finetunes/james-sunderland/dataset/ynoeld_00002.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bdf95b92f974f4a7023c2b8ea3d2eb2f47dcc83391bc961fd40f373bddc4f680
|
3 |
+
size 1234880
|
finetunes/james-sunderland/dataset/ynoeld_00003.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:27b32b2aa77c0234eca1883620ade655034b2ee42fcf8e26e2c408738c655e39
|
3 |
+
size 705680
|
finetunes/james-sunderland/dataset/ynoeld_00004.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0bd5ca0c4381cc32fad2977e470fdcc6318db4abe42719350a4fb0949c99a94b
|
3 |
+
size 1234880
|
finetunes/james-sunderland/dataset/ynoeld_00005.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:011be88fb79a79dae064270cc7f87689f236d27dd2ccb4bf018d68ad0750cbb2
|
3 |
+
size 705680
|
finetunes/james-sunderland/dataset/ynoeld_00006.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21ffde4fbd4063dc8a3949c00ec4cc5055ab30944e3f41325ab94a1e79a4f48c
|
3 |
+
size 882080
|
finetunes/james-sunderland/dataset/ynoeld_00007.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bae00b0bfe8cda4909fbfec6e2ef5ede031b8bbc4edb0e2713722abeca101f03
|
3 |
+
size 1764080
|
finetunes/james-sunderland/dataset/ynoeld_00008.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:25863e3b8694cb12762efc3f5597b3885395ae0cc85078d20754569ee7fbc0c9
|
3 |
+
size 705680
|
finetunes/james-sunderland/dataset/ynoeld_00009.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0d9b88538ed6f6ff6c6467983da87024ac34776e6de8af0e4d464f2416062121
|
3 |
+
size 882080
|
finetunes/james-sunderland/dataset/ynoeld_00010.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:cead9ecd32d0d85d491d4232b2eafbd5fb323ba21e20a81706f3eb8db8117d15
|
3 |
+
size 705680
|
finetunes/james-sunderland/dataset/ynoeld_00011.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:93fe0f3a558663cec9cc4af2d9e656d8d3954b46bdec3ef423cab876c87771dc
|
3 |
+
size 1234880
|
finetunes/james-sunderland/dataset/ynoeld_00012.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ccffcfef292e328a78d22e53265da9e081d209321b37f56890aa3eb6f5650bd6
|
3 |
+
size 705680
|
finetunes/james-sunderland/dataset/ynoeld_00013.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4533939de62fb46d7ed44d5dea97f91a5c1940f32eace589931bb133c6545f33
|
3 |
+
size 882080
|
finetunes/james-sunderland/dataset/ynoeld_00014.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:39dde7e9d390f1a7241a3caeeed30d125d2cddd57491b510c3b669c61ad5a924
|
3 |
+
size 705680
|
finetunes/james-sunderland/dataset/ynoeld_00015.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5d3a551a0ac7db136fb2554dba7dc1116ffca8dd27d8f91c3ff92c311a1e806d
|
3 |
+
size 352880
|
finetunes/james-sunderland/dataset/ynoeld_00016.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:154ee5f59038ef9751fdffbaa49003c6af4b470ede808c5e52d1425ffd62b3d7
|
3 |
+
size 882080
|
finetunes/james-sunderland/dataset/ynoeld_00017.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dbcfa1b55984b896d2145b2d251766b9915948635350603d8545cd9ae51d3e63
|
3 |
+
size 529280
|
finetunes/james-sunderland/dataset/ynoeld_00018.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ced36b4eea93c69bbf4ed3b456fbbaf4003432c4c6fda689ccb3013037ef87a5
|
3 |
+
size 352880
|
finetunes/james-sunderland/dataset/ynoeld_00019.wav
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6328ccff79da49ff28ccfa494ebbb7dbb09e20118ae56443fdfbb027f866b742
|
3 |
+
size 1022260
|