44khz -> 24khz; remove saved model
Browse files- README.md +2 -2
- model.safetensors +0 -3
- save_model.ipynb +2 -2
- test_DAC.ipynb +1 -1
    	
        README.md
    CHANGED
    
    | @@ -9,7 +9,7 @@ tags: | |
| 9 | 
             
            # Descript Audio Codec (DAC)
         | 
| 10 | 
             
            DAC is a state-of-the-art audio tokenizer that improves upon previous tokenizers such as SoundStream and EnCodec.
         | 
| 11 |  | 
| 12 | 
            -
            This model card provides an easy-to-use API for a *pretrained DAC* [1] for  | 
| 13 |  | 
| 14 |  | 
| 15 |  | 
| @@ -47,7 +47,7 @@ from transformers import AutoModel | |
| 47 | 
             
            device = 'cpu'  # or 'cuda:0'
         | 
| 48 |  | 
| 49 | 
             
            # load
         | 
| 50 | 
            -
            model = AutoModel.from_pretrained('hance-ai/descript-audio-codec', trust_remote_code=True)
         | 
| 51 | 
             
            model.to(device)
         | 
| 52 | 
             
            ```
         | 
| 53 |  | 
|  | |
| 9 | 
             
            # Descript Audio Codec (DAC)
         | 
| 10 | 
             
            DAC is a state-of-the-art audio tokenizer that improves upon previous tokenizers such as SoundStream and EnCodec.
         | 
| 11 |  | 
| 12 | 
            +
            This model card provides an easy-to-use API for a *pretrained DAC* [1] for 24khz audio whose backbone and pretrained weights are from [its original repository](https://github.com/descriptinc/descript-audio-codec). With this API, you can encode and decode with a single line of code, using either CPU or GPU. Furthermore, it supports chunk-based processing for memory-efficient processing, which is especially important for GPU processing. 
         | 
| 13 |  | 
| 14 |  | 
| 15 |  | 
|  | |
| 47 | 
             
            device = 'cpu'  # or 'cuda:0'
         | 
| 48 |  | 
| 49 | 
             
            # load
         | 
| 50 | 
            +
            model = AutoModel.from_pretrained('hance-ai/descript-audio-codec-24khz', trust_remote_code=True)
         | 
| 51 | 
             
            model.to(device)
         | 
| 52 | 
             
            ```
         | 
| 53 |  | 
    	
        model.safetensors
    DELETED
    
    | @@ -1,3 +0,0 @@ | |
| 1 | 
            -
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            -
            oid sha256:fcc4931e3729bfe19838e458b2149ccc95fc3bc5452bdd4e6530e25968d1cbf6
         | 
| 3 | 
            -
            size 306641816
         | 
|  | |
|  | |
|  | |
|  | 
    	
        save_model.ipynb
    CHANGED
    
    | @@ -47,7 +47,7 @@ | |
| 47 | 
             
               ],
         | 
| 48 | 
             
               "source": [
         | 
| 49 | 
             
                "# create instances\n",
         | 
| 50 | 
            -
                "config = DACConfig(model_type_by_sampling_freq=' | 
| 51 | 
             
                "model = DAC(config)"
         | 
| 52 | 
             
               ]
         | 
| 53 | 
             
              },
         | 
| @@ -126,7 +126,7 @@ | |
| 126 | 
             
               "source": [
         | 
| 127 | 
             
                "# load the uploaded model\n",
         | 
| 128 | 
             
                "from transformers import AutoModel\n",
         | 
| 129 | 
            -
                "model = AutoModel.from_pretrained('hance-ai/descript-audio-codec- | 
| 130 | 
             
                "model.to('cpu');"
         | 
| 131 | 
             
               ]
         | 
| 132 | 
             
              },
         | 
|  | |
| 47 | 
             
               ],
         | 
| 48 | 
             
               "source": [
         | 
| 49 | 
             
                "# create instances\n",
         | 
| 50 | 
            +
                "config = DACConfig(model_type_by_sampling_freq='24khz')\n",
         | 
| 51 | 
             
                "model = DAC(config)"
         | 
| 52 | 
             
               ]
         | 
| 53 | 
             
              },
         | 
|  | |
| 126 | 
             
               "source": [
         | 
| 127 | 
             
                "# load the uploaded model\n",
         | 
| 128 | 
             
                "from transformers import AutoModel\n",
         | 
| 129 | 
            +
                "model = AutoModel.from_pretrained('hance-ai/descript-audio-codec-24khz', trust_remote_code=True)\n",
         | 
| 130 | 
             
                "model.to('cpu');"
         | 
| 131 | 
             
               ]
         | 
| 132 | 
             
              },
         | 
    	
        test_DAC.ipynb
    CHANGED
    
    | @@ -28,7 +28,7 @@ | |
| 28 | 
             
                "# settings\n",
         | 
| 29 | 
             
                "fname = str(Path(os.getcwd()).joinpath('.sample_sound', 'jazz_swing.wav'))\n",
         | 
| 30 | 
             
                "device = 'cpu'\n",
         | 
| 31 | 
            -
                "model_type_by_sampling_freq = ' | 
| 32 | 
             
               ]
         | 
| 33 | 
             
              },
         | 
| 34 | 
             
              {
         | 
|  | |
| 28 | 
             
                "# settings\n",
         | 
| 29 | 
             
                "fname = str(Path(os.getcwd()).joinpath('.sample_sound', 'jazz_swing.wav'))\n",
         | 
| 30 | 
             
                "device = 'cpu'\n",
         | 
| 31 | 
            +
                "model_type_by_sampling_freq = '24khz'"
         | 
| 32 | 
             
               ]
         | 
| 33 | 
             
              },
         | 
| 34 | 
             
              {
         | 

