File size: 479 Bytes
37a9836
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
# --- Vocabulary sizes -------------------------------------------------------
# Size of the semantic vocabulary used by the original BARK model.
SEMANTIC_VOCAB_SIZE: int = 10_000
# Size of the vocabulary produced by the HuBERT model.
HUBERT_OUTPUT_VOCAB_SIZE: int = 10_003

# --- Codebooks --------------------------------------------------------------
# NOTE(review): presumably the number of entries in each codebook -- confirm.
CODEBOOK_SIZE: int = 1024
N_COARSE_CODEBOOKS: int = 2
N_FINE_CODEBOOKS: int = 8

# --- Coarse stage -----------------------------------------------------------
COARSE_RATE_HZ: int = 75
# Numerically equal to SEMANTIC_VOCAB_SIZE + N_COARSE_CODEBOOKS * CODEBOOK_SIZE
# (10_000 + 2 * 1024); kept as a literal. NOTE(review): confirm the relation
# is intentional before deriving one from the other.
COARSE_SEMANTIC_PAD_TOKEN: int = 12_048
COARSE_INFER_TOKEN: int = 12_050

# --- Text -> semantic stage -------------------------------------------------
# Constants for the BERT model that derives semantic tokens from raw text.
TEXT_ENCODING_OFFSET: int = 10_048
# Same numeric value as SEMANTIC_VOCAB_SIZE.
SEMANTIC_PAD_TOKEN: int = 10_000
TEXT_PAD_TOKEN: int = 129_595
SEMANTIC_INFER_TOKEN: int = 129_599
SEMANTIC_RATE_HZ: float = 49.9