Skip to content

Commit eaa48c8

Browse files
yao-matrix and stevhliu authored
make model docs device agnostic (2) (#40256)
* doc cont. Signed-off-by: Yao, Matrix <[email protected]> * more models Signed-off-by: Yao, Matrix <[email protected]> * Update docs/source/en/quicktour.md Co-authored-by: Steven Liu <[email protected]> * Update docs/source/en/quicktour.md Co-authored-by: Steven Liu <[email protected]> * Update docs/source/en/quicktour.md Co-authored-by: Steven Liu <[email protected]> * Update docs/source/en/quicktour.md Co-authored-by: Steven Liu <[email protected]> * Update mixtral.md --------- Signed-off-by: Yao, Matrix <[email protected]> Co-authored-by: Steven Liu <[email protected]>
1 parent 42fe769 commit eaa48c8

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

59 files changed

+157
-159
lines changed

docs/source/en/model_doc/bart.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -65,7 +65,7 @@ model = AutoModelForMaskedLM.from_pretrained(
6565
device_map="auto",
6666
attn_implementation="sdpa"
6767
)
68-
inputs = tokenizer("Plants create <mask> through a process known as photosynthesis.", return_tensors="pt").to("cuda")
68+
inputs = tokenizer("Plants create <mask> through a process known as photosynthesis.", return_tensors="pt").to(model.device)
6969

7070
with torch.no_grad():
7171
outputs = model(**inputs)

docs/source/en/model_doc/barthez.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -68,7 +68,7 @@ model = AutoModelForMaskedLM.from_pretrained(
6868
torch_dtype=torch.float16,
6969
device_map="auto",
7070
)
71-
inputs = tokenizer("Les plantes produisent <mask> grâce à un processus appelé photosynthèse.", return_tensors="pt").to("cuda")
71+
inputs = tokenizer("Les plantes produisent <mask> grâce à un processus appelé photosynthèse.", return_tensors="pt").to(model.device)
7272

7373
with torch.no_grad():
7474
outputs = model(**inputs)

docs/source/en/model_doc/bartpho.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -82,7 +82,7 @@ Quang tổng hợp hay gọi tắt là quang hợp là quá trình thu nhận v
8282
tảo và một số vi khuẩn để tạo ra hợp chất hữu cơ phục vụ bản thân cũng như làm nguồn thức ăn cho hầu hết các sinh vật
8383
trên Trái Đất. Quang hợp trong thực vật thường liên quan đến chất tố diệp lục màu xanh lá cây và tạo ra oxy như một sản phẩm phụ
8484
"""
85-
inputs = tokenizer(text, return_tensors="pt").to("cuda")
85+
inputs = tokenizer(text, return_tensors="pt").to(model.device)
8686

8787
outputs = model.generate(inputs["input_ids"], num_beams=2, min_length=0, max_length=20)
8888
tokenizer.batch_decode(outputs, skip_special_tokens=True, clean_up_tokenization_spaces=False)[0]

docs/source/en/model_doc/bertweet.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -67,7 +67,7 @@ model = AutoModelForMaskedLM.from_pretrained(
6767
torch_dtype=torch.float16,
6868
device_map="auto"
6969
)
70-
inputs = tokenizer("Plants create <mask> through a process known as photosynthesis.", return_tensors="pt").to("cuda")
70+
inputs = tokenizer("Plants create <mask> through a process known as photosynthesis.", return_tensors="pt").to(model.device)
7171

7272
with torch.no_grad():
7373
outputs = model(**inputs)

docs/source/en/model_doc/big_bird.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -64,7 +64,7 @@ model = AutoModelForMaskedLM.from_pretrained(
6464
torch_dtype=torch.float16,
6565
device_map="auto",
6666
)
67-
inputs = tokenizer("Plants create [MASK] through a process known as photosynthesis.", return_tensors="pt").to("cuda")
67+
inputs = tokenizer("Plants create [MASK] through a process known as photosynthesis.", return_tensors="pt").to(model.device)
6868

6969
with torch.no_grad():
7070
outputs = model(**inputs)

docs/source/en/model_doc/bigbird_pegasus.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -72,7 +72,7 @@ input_text = """Plants are among the most remarkable and essential life forms on
7272
Through photosynthesis, plants capture energy from sunlight using a green pigment called chlorophyll, which is located in specialized cell structures called chloroplasts. In the presence of light, plants absorb carbon dioxide from the atmosphere through small pores in their leaves called stomata, and take in water from the soil through their root systems.
7373
These ingredients are then transformed into glucose, a type of sugar that serves as a source of chemical energy, and oxygen, which is released as a byproduct into the atmosphere. The glucose produced during photosynthesis is not just used immediately; plants also store it as starch or convert it into other organic compounds like cellulose, which is essential for building their cellular structure.
7474
This energy reserve allows them to grow, develop leaves, produce flowers, bear fruit, and carry out various physiological processes throughout their lifecycle."""
75-
input_ids = tokenizer(input_text, return_tensors="pt").to("cuda")
75+
input_ids = tokenizer(input_text, return_tensors="pt").to(model.device)
7676

7777
output = model.generate(**input_ids, cache_implementation="static")
7878
print(tokenizer.decode(output[0], skip_special_tokens=True))
@@ -115,7 +115,7 @@ input_text = """Plants are among the most remarkable and essential life forms on
115115
Through photosynthesis, plants capture energy from sunlight using a green pigment called chlorophyll, which is located in specialized cell structures called chloroplasts. In the presence of light, plants absorb carbon dioxide from the atmosphere through small pores in their leaves called stomata, and take in water from the soil through their root systems.
116116
These ingredients are then transformed into glucose, a type of sugar that serves as a source of chemical energy, and oxygen, which is released as a byproduct into the atmosphere. The glucose produced during photosynthesis is not just used immediately; plants also store it as starch or convert it into other organic compounds like cellulose, which is essential for building their cellular structure.
117117
This energy reserve allows them to grow, develop leaves, produce flowers, bear fruit, and carry out various physiological processes throughout their lifecycle."""
118-
input_ids = tokenizer(input_text, return_tensors="pt").to("cuda")
118+
input_ids = tokenizer(input_text, return_tensors="pt").to(model.device)
119119

120120
output = model.generate(**input_ids, cache_implementation="static")
121121
print(tokenizer.decode(output[0], skip_special_tokens=True))

docs/source/en/model_doc/blip.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -73,7 +73,7 @@ url = "https://huggingface.co/datasets/huggingface/documentation-images/resolve/
7373
image = Image.open(requests.get(url, stream=True).raw)
7474

7575
question = "What is the weather in this image?"
76-
inputs = processor(images=image, text=question, return_tensors="pt").to("cuda", torch.float16)
76+
inputs = processor(images=image, text=question, return_tensors="pt").to(model.device, torch.float16)
7777

7878
output = model.generate(**inputs)
7979
processor.batch_decode(output, skip_special_tokens=True)[0]

docs/source/en/model_doc/clap.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -48,7 +48,7 @@ tokenizer = AutoTokenizer.from_pretrained("laion/clap-htsat-unfused")
4848

4949
texts = ["the sound of a cat", "the sound of a dog", "music playing"]
5050

51-
inputs = tokenizer(texts, padding=True, return_tensors="pt").to("cuda")
51+
inputs = tokenizer(texts, padding=True, return_tensors="pt").to(model.device)
5252

5353
with torch.no_grad():
5454
text_features = model.get_text_features(**inputs)

docs/source/en/model_doc/code_llama.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -74,7 +74,7 @@ model = AutoModelForCausalLM.from_pretrained(
7474

7575
# basic code generation
7676
prompt = "# Function to calculate the factorial of a number\ndef factorial(n):"
77-
input_ids = tokenizer(prompt, return_tensors="pt").to("cuda")
77+
input_ids = tokenizer(prompt, return_tensors="pt").to(model.device)
7878

7979
output = model.generate(
8080
**input_ids,
@@ -121,7 +121,7 @@ model = AutoModelForCausalLM.from_pretrained(
121121
)
122122

123123
prompt = "# Write a Python function to check if a string is a palindrome\ndef is_palindrome(s):"
124-
input_ids = tokenizer(prompt, return_tensors="pt").to("cuda")
124+
input_ids = tokenizer(prompt, return_tensors="pt").to(model.device)
125125

126126
output = model.generate(**input_ids, max_new_tokens=200, cache_implementation="static")
127127
print(tokenizer.decode(output[0], skip_special_tokens=True))

docs/source/en/model_doc/csm.md

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -38,10 +38,10 @@ CSM can be used to simply generate speech from a text prompt:
3838

3939
```python
4040
import torch
41-
from transformers import CsmForConditionalGeneration, AutoProcessor
41+
from transformers import CsmForConditionalGeneration, AutoProcessor, infer_device
4242

4343
model_id = "sesame/csm-1b"
44-
device = "cuda" if torch.cuda.is_available() else "cpu"
44+
device = infer_device()
4545

4646
# load the model and the processor
4747
processor = AutoProcessor.from_pretrained(model_id)
@@ -72,11 +72,11 @@ CSM can be used to generate speech given a conversation, allowing consistency in
7272

7373
```python
7474
import torch
75-
from transformers import CsmForConditionalGeneration, AutoProcessor
75+
from transformers import CsmForConditionalGeneration, AutoProcessor, infer_device
7676
from datasets import load_dataset, Audio
7777

7878
model_id = "sesame/csm-1b"
79-
device = "cuda" if torch.cuda.is_available() else "cpu"
79+
device = infer_device()
8080

8181
# load the model and the processor
8282
processor = AutoProcessor.from_pretrained(model_id)
@@ -117,11 +117,11 @@ CSM supports batched inference!
117117

118118
```python
119119
import torch
120-
from transformers import CsmForConditionalGeneration, AutoProcessor
120+
from transformers import CsmForConditionalGeneration, AutoProcessor, infer_device
121121
from datasets import load_dataset, Audio
122122

123123
model_id = "sesame/csm-1b"
124-
device = "cuda" if torch.cuda.is_available() else "cpu"
124+
device = infer_device()
125125

126126
# load the model and the processor
127127
processor = AutoProcessor.from_pretrained(model_id)
@@ -306,11 +306,11 @@ print("="*50)
306306
CSM Transformers integration supports training!
307307

308308
```python
309-
from transformers import CsmForConditionalGeneration, AutoProcessor
309+
from transformers import CsmForConditionalGeneration, AutoProcessor, infer_device
310310
from datasets import load_dataset, Audio
311311

312312
model_id = "sesame/csm-1b"
313-
device = "cuda"
313+
device = infer_device()
314314

315315
# load the model and the processor
316316
processor = AutoProcessor.from_pretrained(model_id)

0 commit comments

Comments (0)