44khz -> 24khz; remove saved model

Files changed (4) hide show

README.md CHANGED Viewed

@@ -9,7 +9,7 @@ tags:
 # Descript Audio Codec (DAC)
 DAC is the state-of-the-art audio tokenizer with improvement upon the previous tokenizers like SoundStream and EnCodec.
-This model card provides an easy-to-use API for a *pretrained DAC* [1] for 44.1 kHz audio whose backbone and pretrained weights are from [its original repository](https://github.com/descriptinc/descript-audio-codec). With this API, you can encode and decode with a single line of code using either CPU or GPU. Furthermore, it supports chunk-based processing for memory-efficient processing, which is especially important for GPU processing.
@@ -47,7 +47,7 @@ from transformers import AutoModel
 device = 'cpu'  # or 'cuda:0'
 # load
-model = AutoModel.from_pretrained('hance-ai/descript-audio-codec', trust_remote_code=True)
 model.to(device)
 ```

 # Descript Audio Codec (DAC)
 DAC is the state-of-the-art audio tokenizer with improvement upon the previous tokenizers like SoundStream and EnCodec.
+This model card provides an easy-to-use API for a *pretrained DAC* [1] for 24 kHz audio whose backbone and pretrained weights are from [its original repository](https://github.com/descriptinc/descript-audio-codec). With this API, you can encode and decode with a single line of code using either CPU or GPU. Furthermore, it supports chunk-based processing for memory-efficient processing, which is especially important for GPU processing.
 device = 'cpu'  # or 'cuda:0'
 # load
+model = AutoModel.from_pretrained('hance-ai/descript-audio-codec-24khz', trust_remote_code=True)
 model.to(device)
 ```

model.safetensors DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:fcc4931e3729bfe19838e458b2149ccc95fc3bc5452bdd4e6530e25968d1cbf6
-size 306641816

save_model.ipynb CHANGED Viewed

@@ -47,7 +47,7 @@
    ],
    "source": [
     "# create instances\n",
-    "config = DACConfig(model_type_by_sampling_freq='44khz')\n",
     "model = DAC(config)"
    ]
   },
@@ -126,7 +126,7 @@
    "source": [
     "# load the uploaded model\n",
     "from transformers import AutoModel\n",
-    "model = AutoModel.from_pretrained('hance-ai/descript-audio-codec-44khz', trust_remote_code=True)\n",
     "model.to('cpu');"
    ]
   },

    ],
    "source": [
     "# create instances\n",
+    "config = DACConfig(model_type_by_sampling_freq='24khz')\n",
     "model = DAC(config)"
    ]
   },
    "source": [
     "# load the uploaded model\n",
     "from transformers import AutoModel\n",
+    "model = AutoModel.from_pretrained('hance-ai/descript-audio-codec-24khz', trust_remote_code=True)\n",
     "model.to('cpu');"
    ]
   },

test_DAC.ipynb CHANGED Viewed

@@ -28,7 +28,7 @@
     "# settings\n",
     "fname = str(Path(os.getcwd()).joinpath('.sample_sound', 'jazz_swing.wav'))\n",
     "device = 'cpu'\n",
-    "model_type_by_sampling_freq = '44khz'"
    ]
   },
   {

     "# settings\n",
     "fname = str(Path(os.getcwd()).joinpath('.sample_sound', 'jazz_swing.wav'))\n",
     "device = 'cpu'\n",
+    "model_type_by_sampling_freq = '24khz'"
    ]
   },
   {