Răsfoiți Sursa

feat: Add detailed data logging before translation

mrh (aider) 1 an în urmă
părinte
comite
745e63aa4a
1 fișier modificat, cu 31 adăugiri și 0 ștergeri
  1. 31 0
      mylib/translate_utils.py

+ 31 - 0
mylib/translate_utils.py

@@ -29,6 +29,34 @@ def extract_sample_data(data: List[List[str]], n: int = 2, m: int = 2) -> List[L
         logger.error(f"Error extracting sample data: {e}")
         raise
 
+def log_data_details(data: List[List[str]], search_term_index: int, start_row: int = 3):
+    """记录数据详细信息"""
+    try:
+        # 记录表头信息
+        headers = data[0]
+        logger.info(f"表头信息: {headers}")
+        
+        # 记录前5行数据
+        logger.info("前5行数据预览:")
+        for i, row in enumerate(data[:5]):
+            logger.info(f"行 {i}: {row}")
+            
+        # 记录搜索词列信息
+        search_terms = [row[search_term_index] for row in data[start_row-1:]]
+        logger.info(f"共找到 {len(search_terms)} 个搜索词")
+        logger.info("前10个搜索词:")
+        for i, term in enumerate(search_terms[:10]):
+            logger.info(f"{i+1}. {term}")
+            
+        # 记录最后5个搜索词
+        logger.info("最后5个搜索词:")
+        for i, term in enumerate(search_terms[-5:]):
+            logger.info(f"{len(search_terms)-5+i+1}. {term}")
+            
+    except Exception as e:
+        logger.error(f"记录数据详细信息时出错: {e}")
+        raise
+
 def process_batch_translations(data: List[List[str]], 
                              search_term_index: int,
                              start_row: int = 3) -> Tuple[List[List[str]], List[List[str]]]:
@@ -38,6 +66,9 @@ def process_batch_translations(data: List[List[str]],
         sample_data = extract_sample_data(data)
         logger.info(f"Sample data extracted for inspection:\n{sample_data}")
         
+        # 记录数据详细信息
+        log_data_details(data, search_term_index, start_row)
+        
         # 初始化翻译器
         translator = OpenAITranslator()