diff --git a/funasr/datasets/sense_voice_datasets/datasets.py b/funasr/datasets/sense_voice_datasets/datasets.py
index 1a55593f9..e78bd2a00 100644
--- a/funasr/datasets/sense_voice_datasets/datasets.py
+++ b/funasr/datasets/sense_voice_datasets/datasets.py
@@ -587,10 +587,10 @@ class SenseVoicePitchDataset(torch.utils.data.Dataset):
                 elif f0.shape < speech.shape[1]:
                     last_value = f0[-1]
                     f0 =  torch.cat([f0, last_value.repeat(speech.shape[1] - f0.shape)])
-                f0_tag = torch.Tensor([1], dtype=torch.int32)
+                f0_tag = torch.tensor([1], dtype=torch.int32)
             else:
                 f0 = torch.tensor([0.0], dtype=torch.float32)
-                f0_tag = torch.Tensor([0], dtype=torch.int32)
+                f0_tag = torch.tensor([0], dtype=torch.int32)
             
             output = {
                 "speech": speech[0, :, :],