Преглед изворни кода

update with main (#1163)

* v0.8.7

* update cmd version

* set openfst HAVE_BIN/HAVE_SCRIPT off for win32

* 修复为支持新版本的热词 (#1137)

* update CMakeLists.txt

* Revert "update CMakeLists.txt"

This reverts commit 54bcd1f6742269fc1ce90d9871245db5cd6a1cbf.

* rm log.h for wins-websocket

* fix bug of websocket lock blocking

* update funasr-wss-server

* update model-revision by model name

* update funasr-wss-server-2pass

* 增加分角色语音识别对ERes2Net模型的支持。

* Update README.md (#1140)

minor fix

* automatically configure parameters such as decoder-thread-num

* update docs

* update docs

* update docs

* 分角色语音识别支持更多的模型

* update spk inference

* remove never-used code (#1151)

* fix loss normalization for ddp training

* fix loss normalization for ddp training

* fix loss normalization for ddp training

---------

Co-authored-by: 雾聪 <wucong.lyb@alibaba-inc.com>
Co-authored-by: 夜雨飘零 <yeyupiaoling@foxmail.com>
Co-authored-by: Ikko Eltociear Ashimine <eltociear@gmail.com>
Co-authored-by: Shi Xian <40013335+R1ckShi@users.noreply.github.com>
Co-authored-by: shixian.shi <shixian.shi@alibaba-inc.com>
Co-authored-by: haoneng.lhn <haoneng.lhn@alibaba-inc.com>
zhifu gao пре 2 година
родитељ
комит
85cabd30a9

+ 2 - 1
funasr/models/e2e_asr.py

@@ -222,7 +222,8 @@ class ASRModel(FunASRModel):
 
 
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + 1).sum().type_as(batch_size)
+            batch_size = int((text_lengths + 1).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight
 
 

+ 2 - 1
funasr/models/e2e_asr_contextual_paraformer.py

@@ -233,7 +233,8 @@ class NeatContextualParaformer(Paraformer):
         stats["loss"] = torch.clone(loss.detach())
         stats["loss"] = torch.clone(loss.detach())
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + self.predictor_bias).sum().type_as(batch_size)
+            batch_size = int((text_lengths + self.predictor_bias).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight
     
     

+ 10 - 5
funasr/models/e2e_asr_paraformer.py

@@ -255,7 +255,8 @@ class Paraformer(FunASRModel):
 
 
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + self.predictor_bias).sum().type_as(batch_size)
+            batch_size = int((text_lengths + self.predictor_bias).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight
 
 
@@ -867,7 +868,8 @@ class ParaformerOnline(Paraformer):
 
 
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + self.predictor_bias).sum().type_as(batch_size)
+            batch_size = int((text_lengths + self.predictor_bias).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight
 
 
@@ -1494,7 +1496,8 @@ class ParaformerBert(Paraformer):
 
 
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + self.predictor_bias).sum().type_as(batch_size)
+            batch_size = int((text_lengths + self.predictor_bias).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight
 
 
@@ -1765,7 +1768,8 @@ class BiCifParaformer(Paraformer):
 
 
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + self.predictor_bias).sum().type_as(batch_size)
+            batch_size = int((text_lengths + self.predictor_bias).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight
 
 
@@ -1967,7 +1971,8 @@ class ContextualParaformer(Paraformer):
 
 
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + self.predictor_bias).sum().type_as(batch_size)
+            batch_size = int((text_lengths + self.predictor_bias).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight
 
 

+ 2 - 1
funasr/models/e2e_uni_asr.py

@@ -442,7 +442,8 @@ class UniASR(FunASRModel):
         stats["loss"] = torch.clone(loss.detach())
         stats["loss"] = torch.clone(loss.detach())
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         # force_gatherable: to-device and to-tensor if scalar for DataParallel
         if self.length_normalized_loss:
         if self.length_normalized_loss:
-            batch_size = (text_lengths + 1).sum().type_as(batch_size)
+            batch_size = int((text_lengths + 1).sum())
+
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         loss, stats, weight = force_gatherable((loss, stats, batch_size), loss.device)
         return loss, stats, weight
         return loss, stats, weight