# Token-vocabulary and codebook constants.
#
# All values are plain literals so they can be imported without side effects.
# Notes marked NOTE(review) describe numeric relationships that are visible in
# the literals themselves; whether they are intentional should be confirmed
# against the code that consumes these constants.

# original BARK semantic vocab size
SEMANTIC_VOCAB_SIZE = 10_000

# HuBERT model output vocab size
HUBERT_OUTPUT_VOCAB_SIZE = 10_003

# Codebook geometry and coarse-stage settings.
CODEBOOK_SIZE = 1024
N_COARSE_CODEBOOKS = 2
# Rate in Hz, going by the name -- TODO confirm what is being counted per second.
COARSE_RATE_HZ = 75
# NOTE(review): 12_048 == SEMANTIC_VOCAB_SIZE + N_COARSE_CODEBOOKS * CODEBOOK_SIZE;
# kept as a literal because the derivation is not stated in this file.
COARSE_SEMANTIC_PAD_TOKEN = 12_048
COARSE_INFER_TOKEN = 12_050

# for the BERT model to get semantic tokens from raw texts
TEXT_ENCODING_OFFSET = 10_048
# NOTE(review): same numeric value as SEMANTIC_VOCAB_SIZE (10_000).
SEMANTIC_PAD_TOKEN = 10_000
TEXT_PAD_TOKEN = 129_595
SEMANTIC_INFER_TOKEN = 129_599
# Rate in Hz, going by the name -- TODO confirm what is being counted per second.
SEMANTIC_RATE_HZ = 49.9
N_FINE_CODEBOOKS = 8