Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
|
@@ -348,7 +348,21 @@ def two_stage_qa(question, candidate_paragraphs_str, max_seq_len_mc=512, max_seq
|
|
| 348 |
logger.error(f" !!!!!! CRITICAL: Key '{key_to_check}' in feature {i} contains non-integer {elem} (type: {type(elem)}) at index {elem_idx}!")
|
| 349 |
return f"錯誤: 特徵準備失敗,{key_to_check} 內部有非整數", "N/A", "N/A"
|
| 350 |
logger.info(f" Feature {i}, key '{key_to_check}' passed inspection. Length: {len(val_list)}")
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 351 |
|
|
|
|
|
|
|
| 352 |
qa_dataloader = DataLoader(
|
| 353 |
qa_features_dataset, collate_fn=default_data_collator, batch_size=8 # batch_size可以小一些
|
| 354 |
)
|
|
|
|
| 348 |
logger.error(f" !!!!!! CRITICAL: Key '{key_to_check}' in feature {i} contains non-integer {elem} (type: {type(elem)}) at index {elem_idx}!")
|
| 349 |
return f"錯誤: 特徵準備失敗,{key_to_check} 內部有非整數", "N/A", "N/A"
|
| 350 |
logger.info(f" Feature {i}, key '{key_to_check}' passed inspection. Length: {len(val_list)}")
|
| 351 |
+
|
| 352 |
+
model_input_columns = ["input_ids", "attention_mask"]
|
| 353 |
+
if "token_type_ids" in qa_features_dataset.features:
|
| 354 |
+
model_input_columns.append("token_type_ids")
|
| 355 |
+
|
| 356 |
+
try:
|
| 357 |
+
# 從 qa_features_dataset 中提取需要的列來創建新的 Dataset
|
| 358 |
+
# qa_features_dataset 本身就是一個 Dataset 對象
|
| 359 |
+
features_for_dataloader = qa_features_dataset.select_columns(model_input_columns)
|
| 360 |
+
except Exception as e:
|
| 361 |
+
logger.error(f"從 qa_features_dataset 選擇列時出錯: {e}. Features: {qa_features_dataset.features}")
|
| 362 |
+
return f"錯誤: 準備模型輸入時出錯 (列選擇)。 Error: {e}", "N/A", "N/A"
|
| 363 |
|
| 364 |
+
logger.info(f"--- In two_stage_qa, about to create DataLoader for question_id: {log_question_id} ---")
|
| 365 |
+
|
| 366 |
qa_dataloader = DataLoader(
|
| 367 |
qa_features_dataset, collate_fn=default_data_collator, batch_size=8 # batch_size可以小一些
|
| 368 |
)
|