szhengac25 committed on
Commit
7f15729
·
1 Parent(s): 78ad88b
Files changed (2) hide show
  1. config.json +1 -9
  2. preprocessor_config.json +2 -3
config.json CHANGED
@@ -30,7 +30,6 @@
30
  "architectures": [
31
  "HiggsAudioTokenizer"
32
  ],
33
- "audio_channels": 1,
34
  "block_dilations": [
35
  1,
36
  1
@@ -41,18 +40,11 @@
41
  ],
42
  "codebook_dim": 64,
43
  "codebook_size": 1024,
44
- "decoder_channels": 768,
45
  "downsample_mode": "step_down",
46
- "encoder_channels": 768,
47
- "hidden_dim": 1024,
48
  "initializer_range": 0.02,
49
- "input_channels": 768,
50
- "intermediate_dim": 768,
51
  "kernel_size": 3,
52
  "model_type": "higgs_audio_tokenizer",
53
  "num_quantizers": 8,
54
- "output_channels": 768,
55
- "output_dim": 256,
56
  "sample_rate": 24000,
57
  "semantic_model_config": {
58
  "activation_dropout": 0.1,
@@ -131,6 +123,6 @@
131
  4
132
  ],
133
  "torch_dtype": "float32",
134
- "transformers_version": "4.55.0.dev0",
135
  "unit_kernel_size": 3
136
  }
 
30
  "architectures": [
31
  "HiggsAudioTokenizer"
32
  ],
 
33
  "block_dilations": [
34
  1,
35
  1
 
40
  ],
41
  "codebook_dim": 64,
42
  "codebook_size": 1024,
 
43
  "downsample_mode": "step_down",
 
 
44
  "initializer_range": 0.02,
 
 
45
  "kernel_size": 3,
46
  "model_type": "higgs_audio_tokenizer",
47
  "num_quantizers": 8,
 
 
48
  "sample_rate": 24000,
49
  "semantic_model_config": {
50
  "activation_dropout": 0.1,
 
123
  4
124
  ],
125
  "torch_dtype": "float32",
126
+ "transformers_version": "4.56.0.dev0",
127
  "unit_kernel_size": 3
128
  }
preprocessor_config.json CHANGED
@@ -1,8 +1,7 @@
1
  {
2
- "chunk_length_s": null,
3
- "feature_extractor_type": "EncodecFeatureExtractor",
4
  "feature_size": 1,
5
- "overlap": null,
6
  "padding_side": "right",
7
  "padding_value": 0.0,
8
  "return_attention_mask": true,
 
1
  {
2
+ "feature_extractor_type": "DacFeatureExtractor",
 
3
  "feature_size": 1,
4
+ "hop_length": 960,
5
  "padding_side": "right",
6
  "padding_value": 0.0,
7
  "return_attention_mask": true,