[CSM] infer codec model with no_grad + audio eos label (#38215)
* infer codec model with no_grad
* codec_model eval
* training labels: add audio eos token
This commit is contained in:
@@ -315,6 +315,7 @@ device = "cuda"
|
||||
processor = AutoProcessor.from_pretrained(model_id)
|
||||
model = CsmForConditionalGeneration.from_pretrained(model_id, device_map=device)
|
||||
model.train()
|
||||
model.codec_model.eval()
|
||||
|
||||
ds = load_dataset("hf-internal-testing/dailytalk-dummy", split="train")
|
||||
# ensure the audio is 24kHz
|
||||
|
||||
Reference in New Issue
Block a user