[CSM] update model id (#38211)

* update model id
* codec_model eval
* add processor img
* use ungated repo for processor tests
2025-05-27 17:03:55 +02:00
parent 07dd6b2495
commit b9f8f863d9
8 changed files with 17 additions and 14 deletions
--- a/docs/source/en/model_doc/csm.md
+++ b/docs/source/en/model_doc/csm.md
@@ -39,7 +39,7 @@ CSM can be used to simply generate speech from a text prompt:
 import torch
 from transformers import CsmForConditionalGeneration, AutoProcessor

-model_id = "eustlb/csm-1b"
+model_id = "sesame/csm-1b"
 device = "cuda" if torch.cuda.is_available() else "cpu"

 # load the model and the processor
@@ -74,7 +74,7 @@ import torch
 from transformers import CsmForConditionalGeneration, AutoProcessor
 from datasets import load_dataset, Audio

-model_id = "eustlb/csm-1b"
+model_id = "sesame/csm-1b"
 device = "cuda" if torch.cuda.is_available() else "cpu"

 # load the model and the processor
@@ -119,7 +119,7 @@ import torch
 from transformers import CsmForConditionalGeneration, AutoProcessor
 from datasets import load_dataset, Audio

-model_id = "eustlb/csm-1b"
+model_id = "sesame/csm-1b"
 device = "cuda" if torch.cuda.is_available() else "cpu"

 # load the model and the processor
@@ -176,7 +176,7 @@ import copy
 from transformers import CsmForConditionalGeneration, AutoProcessor
 from datasets import load_dataset

-model_id = "eustlb/csm-1b"
+model_id = "sesame/csm-1b"
 device = "cuda"

 # set logs to ensure no recompilation and graph breaks
@@ -308,7 +308,7 @@ CSM Transformers integration supports training!
 from transformers import CsmForConditionalGeneration, AutoProcessor
 from datasets import load_dataset, Audio

-model_id = "eustlb/csm-1b"
+model_id = "sesame/csm-1b"
 device = "cuda"

 # load the model and the processor
@@ -356,6 +356,10 @@ The original code can be found [here](https://github.com/SesameAILabs/csm).

 ## CsmProcessor

+<div class="flex justify-center">
+    <img src="https://huggingface.co/datasets/eustlb/documentation-images/resolve/main/fig1.jpg"/>
+</div>
+
 [[autodoc]] CsmProcessor
    - __call__