提交代码

3 months ago · ccd345bcd9
parent c32e95878f
commit ccd345bcd9
12 changed files with 277 additions and 54 deletions
--- a/.idea/.gitignore
+++ b/.idea/.gitignore
@ -0,0 +1,3 @@
+# Default ignored files
+/shelf/
+/workspace.xml
--- a/.idea/inspectionProfiles/Project_Default.xml
+++ b/.idea/inspectionProfiles/Project_Default.xml
@ -0,0 +1,54 @@
+<component name="InspectionProjectProfileManager">
+  <profile version="1.0">
+    <option name="myName" value="Project Default" />
+    <inspection_tool class="HtmlUnknownAttribute" enabled="true" level="WARNING" enabled_by_default="true">
+      <option name="myValues">
+        <value>
+          <list size="1">
+            <item index="0" class="java.lang.String" itemvalue="href" />
+          </list>
+        </value>
+      </option>
+      <option name="myCustomValuesEnabled" value="true" />
+    </inspection_tool>
+    <inspection_tool class="HtmlUnknownTag" enabled="true" level="WARNING" enabled_by_default="true">
+      <option name="myValues">
+        <value>
+          <list size="10">
+            <item index="0" class="java.lang.String" itemvalue="nobr" />
+            <item index="1" class="java.lang.String" itemvalue="noembed" />
+            <item index="2" class="java.lang.String" itemvalue="comment" />
+            <item index="3" class="java.lang.String" itemvalue="noscript" />
+            <item index="4" class="java.lang.String" itemvalue="embed" />
+            <item index="5" class="java.lang.String" itemvalue="script" />
+            <item index="6" class="java.lang.String" itemvalue="a" />
+            <item index="7" class="java.lang.String" itemvalue="hr" />
+            <item index="8" class="java.lang.String" itemvalue="div" />
+            <item index="9" class="java.lang.String" itemvalue="style" />
+          </list>
+        </value>
+      </option>
+      <option name="myCustomValuesEnabled" value="true" />
+    </inspection_tool>
+    <inspection_tool class="PyPep8NamingInspection" enabled="true" level="WEAK WARNING" enabled_by_default="true">
+      <option name="ignoredErrors">
+        <list>
+          <option value="N802" />
+          <option value="N806" />
+          <option value="N803" />
+          <option value="N801" />
+        </list>
+      </option>
+    </inspection_tool>
+    <inspection_tool class="PyUnresolvedReferencesInspection" enabled="true" level="WARNING" enabled_by_default="true">
+      <option name="ignoredIdentifiers">
+        <list>
+          <option value="list.split" />
+          <option value="_random.random.randint" />
+          <option value="str.raise_for_status" />
+        </list>
+      </option>
+    </inspection_tool>
+    <inspection_tool class="XmlDuplicatedId" enabled="false" level="ERROR" enabled_by_default="false" />
+  </profile>
+</component>
--- a/.idea/inspectionProfiles/profiles_settings.xml
+++ b/.idea/inspectionProfiles/profiles_settings.xml
@ -0,0 +1,6 @@
+<component name="InspectionProjectProfileManager">
+  <settings>
+    <option name="USE_PROJECT_PROFILE" value="false" />
+    <version value="1.0" />
+  </settings>
+</component>
--- a/.idea/misc.xml
+++ b/.idea/misc.xml
@ -0,0 +1,10 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="Black">
+    <option name="sdkName" value="Python 3.11 (base) (2)" />
+  </component>
+  <component name="ProjectRootManager" version="2" project-jdk-name="Python 3.11 (base) (2)" project-jdk-type="Python SDK" />
+  <component name="PyCharmProfessionalAdvertiser">
+    <option name="shown" value="true" />
+  </component>
+</project>
--- a/.idea/modules.xml
+++ b/.idea/modules.xml
@ -0,0 +1,8 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<project version="4">
+  <component name="ProjectModuleManager">
+    <modules>
+      <module fileurl="file://$PROJECT_DIR$/.idea/py.iml" filepath="$PROJECT_DIR$/.idea/py.iml" />
+    </modules>
+  </component>
+</project>
--- a/.idea/py.iml
+++ b/.idea/py.iml
@ -0,0 +1,12 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<module type="PYTHON_MODULE" version="4">
+  <component name="NewModuleRootManager">
+    <content url="file://$MODULE_DIR$" />
+    <orderEntry type="jdk" jdkName="Python 3.11 (base) (2)" jdkType="Python SDK" />
+    <orderEntry type="sourceFolder" forTests="false" />
+  </component>
+  <component name="PyDocumentationSettings">
+    <option name="format" value="PLAIN" />
+    <option name="myDocStringFormat" value="Plain" />
+  </component>
+</module>
--- a/4
+++ b/4
@ -20,6 +20,6 @@ RUN pip install --no-cache-dir -r requirements.txt -i https://mirrors.aliyun.com
 COPY predict_with_excel.py .
 COPY degree3/ ./degree3/

-EXPOSE 8000
+EXPOSE 8001

-CMD ["uvicorn", "predict_with_excel:app", "--host", "0.0.0.0", "--port", "8000"]
+CMD ["uvicorn", "predict_with_excel:app", "--host", "0.0.0.0", "--port", "8001"]
--- a/README.md
+++ b/README.md
@ -1,2 +0,0 @@
-# gc_worktime
-
--- a/direct_test.py
+++ b/direct_test.py
@ -0,0 +1,51 @@
+import pandas as pd
+import numpy as np
+from pathlib import Path
+import joblib
+
+# Standalone check that the pickled EV17.5 models can be loaded directly with joblib
+print("=== Direct Model Loading Test ===")
+
+# Model directory, resolved relative to the current working directory
+model_folder = Path("./degree3")
+print(f"Model folder path: {model_folder}")
+print(f"Model folder exists: {model_folder.exists()}")
+
+# Load the EV17.5 models; any failure below is reported by the except block at the end
+try:
+    # Load the EV17.5_立焊 model (the "vertical" variant, per the variable names)
+    ev175_vertical_model_path = model_folder / "EV17.5_立焊.xlsx_model_degree3.pkl"
+    print(f"EV17.5_立焊 model path: {ev175_vertical_model_path}")
+    print(f"EV17.5_立焊 model exists: {ev175_vertical_model_path.exists()}")
+    
+    if ev175_vertical_model_path.exists():
+        ev175_vertical_model = joblib.load(ev175_vertical_model_path)
+        print(f"EV17.5_立焊 model loaded successfully!")
+        
+        # Smoke-test prediction with a single 9.0 thickness sample, passed as a (1, 1) array
+        test_thickness = np.array([[9.0]])
+        prediction = ev175_vertical_model.predict(test_thickness)
+        print(f"EV17.5_立焊 prediction for thickness 9.0mm: {prediction}")
+    else:
+        print(f"EV17.5_立焊 model file not found!")
+    
+    # Load the EV17.5_横焊 model (the "horizontal" variant, per the variable names)
+    ev175_horizontal_model_path = model_folder / "EV17.5_横焊.xlsx_model_degree3.pkl"
+    print(f"\nEV17.5_横焊 model path: {ev175_horizontal_model_path}")
+    print(f"EV17.5_横焊 model exists: {ev175_horizontal_model_path.exists()}")
+    
+    if ev175_horizontal_model_path.exists():
+        ev175_horizontal_model = joblib.load(ev175_horizontal_model_path)
+        print(f"EV17.5_横焊 model loaded successfully!")
+        
+        # Smoke-test prediction with the same single 9.0 thickness sample
+        test_thickness = np.array([[9.0]])
+        prediction = ev175_horizontal_model.predict(test_thickness)
+        print(f"EV17.5_横焊 prediction for thickness 9.0mm: {prediction}")
+    else:
+        print(f"EV17.5_横焊 model file not found!")
+        
+except Exception as e:
+    print(f"Error during model loading or prediction: {e}")
+    import traceback
+    traceback.print_exc()
--- a/docker-compose.yml
+++ b/docker-compose.yml
@ -3,8 +3,9 @@
 services:
  welding-app:
    build: .
+    container_name: welding-app
    ports:
-      - "8000:8000"
+      - "8001:8001"
 #    volumes:
 #      - ./degree3:/app/degree3
 #      - ./data:/app/data
--- a/predict_with_excel.py
+++ b/predict_with_excel.py
@ -123,7 +123,8 @@ def split_by_plus(s: str) -> list[str]:
 # %%
 import joblib

-folder_path = Path("./degree3")
+# 使用绝对路径来确保模型文件能够被正确找到
+folder_path = Path(__file__).parent / "degree3"


 def load_all_models():
@ -131,14 +132,10 @@ def load_all_models():
    加载所有模型到 model_list
    """
    global model_list
-    # 清空列表以确保重新加载（尽管有启动时加载一次的逻辑）
-    # model_list = []
-    # ^^^ 注释掉这行，因为 FastAPI 的 on_event("startup") 应该只执行一次。
-    # 如果在开发中需要热重载模型，可以取消注释或提供专门的重载端点。
+    # 清空列表以确保重新加载
+    model_list = []
    
-    if model_list:  # 如果已经加载过，则不再重复加载 (主要由 startup_event 控制)
-        print(f"[MODEL_LOADER] Models already loaded. Count: {len(model_list)}")
-        return
+    print(f"[MODEL_LOADER] Attempting to load models...")

    print(
        f"[MODEL_LOADER] Attempting to load models. Initial model_list length: {len(model_list)}"
@ -187,26 +184,15 @@ def load_all_models():
    for file_path_obj in files_found:
        if file_path_obj.is_file():
            try:
-                model_name_parts = file_path_obj.name.split(".xlsx")
-                if len(model_name_parts) > 1:
-                    model_name = model_name_parts[0]
-                else:
-                    model_name_base = file_path_obj.stem
-                    if model_name_base.endswith("_model_degree3"):
-                        model_name = model_name_base[: -len("_model_degree3")]
-                    elif model_name_base.endswith(
-                            "3"
-                    ):  # 兼容 *3.pkl 但不含 .xlsx 的情况
-                        model_name = model_name_base[: -len("3")].rstrip(
-                            "."
-                        )  # 移除可能的尾部'.' (来自.pkl)
-                        if model_name.endswith("_model_degree"):  # 进一步处理
-                            model_name = model_name[: -len("_model_degree")]
-                    else:
-                        model_name = model_name_base
-                    print(
-                        f"[MODEL_LOADER] WARNING: Filename {file_path_obj.name} does not contain '.xlsx' as expected for name splitting. Using '{model_name}' as model name based on stem."
-                    )
+                filename = file_path_obj.name
+                # 移除文件扩展名 .pkl
+                model_name = filename[:-4]
+                # 移除 _model_degree3 后缀
+                if model_name.endswith("_model_degree3"):
+                    model_name = model_name[:-14]
+                # 移除 .xlsx 后缀（如果存在）
+                if ".xlsx" in model_name:
+                    model_name = model_name.split(".xlsx")[0]

                loaded_model = joblib.load(file_path_obj)
                temp_model_list.append(
@ -237,6 +223,12 @@ def load_all_models():
 def get_welding_coefficient(row):
    coefficient = 0.0
    global model_list
+    
+    # 添加调试日志，查看model_list的长度和内容
+    print(f"[DEBUG] model_list length: {len(model_list)}")
+    loaded_model_names = [model["name"] for model in model_list]
+    print(f"[DEBUG] Loaded models: {loaded_model_names}")
+    
    model_map = {model["name"]: model for model in model_list}
    lenth = row.长度_m
    welding_type = row.坡口代码
@ -278,7 +270,9 @@ def get_welding_coefficient(row):
                    model_name = f"{item}_{welding_position}"
                    selected_model_info = model_map.get(model_name)
                    if selected_model_info is None:
-                    raise KeyError(f"模型 '{model_name}' 未加载")
+                        print(f"⚠️ 处理坡口代码模型不存在: {model_name}, 错误: 模型未加载")
+                        coefficient = float('nan')
+                        break
                    model = selected_model_info["model"]
                    range_str = MODEL_RANGES.get(model_name, "0-Infinity")
                    min_val_str, max_val_str = range_str.split("-")
@ -293,8 +287,13 @@ def get_welding_coefficient(row):
                        coefficient = float('nan')
                        break
                    else:
+                        try:
                            prediction = float(model.predict(thickness_array)[0])
                            coefficient += prediction
+                        except Exception as e:
+                            print(f"⚠️ 模型预测失败: {model_name}, 错误: {e}")
+                            coefficient = float('nan')
+                            break
        except Exception as e:
            coefficient = float('nan')
            print(
@ -392,6 +391,9 @@ def process_excel(
    当 sheet_name 为 None 时，处理工作簿内所有工作表并返回 {sheet_name: DataFrame}。
    """
    
+    # 在每次预测之前重新加载模型，确保模型能够被正确加载
+    load_all_models()
+
    path_like, excel_bytes = _prepare_excel_source(excel_source)

    def get_source():
@ -426,6 +428,21 @@ def startup_event():
    load_all_models()


+@app.get("/models", summary="获取已加载的模型列表")
+def get_models():
+    """
+    获取已加载的模型列表，用于调试和检查模型加载状态
+    """
+    global model_list
+    return {
+        "total_models": len(model_list),
+        "models": [{
+            "name": model["name"],
+            "filename": model["filename"]
+        } for model in model_list]
+    }
+
+
 def _sanitize_sheet_name(name: Union[str, int], existing: set[str]) -> str:
    base = str(name) if str(name).strip() else "Sheet"
    base = base[:31]
@ -520,7 +537,36 @@ async def predict(


 def main():
+    print("[TEST] Script started...")
+    
+    # 检查degree3文件夹是否存在
+    print(f"[TEST] Current file path: {__file__}")
+    print(f"[TEST] Folder path: {folder_path}")
+    print(f"[TEST] Folder exists: {folder_path.exists()}")
+    print(f"[TEST] Folder is directory: {folder_path.is_dir()}")
+    
+    # 列出degree3文件夹中的文件
+    if folder_path.exists() and folder_path.is_dir():
+        files = list(folder_path.glob("*3.pkl"))
+        print(f"[TEST] Number of model files found: {len(files)}")
+        for file in files[:10]:  # 显示前10个文件
+            print(f"[TEST] Found model file: {file.name}")
+    
+    # 加载模型
    load_all_models()
+    
+    # 添加调试信息，显示加载的模型名称
+    print(f"[DEBUG] Total models loaded: {len(model_list)}")
+    for model in model_list:
+        print(f"[DEBUG] Loaded model: {model['name']} from {model['filename']}")
+    
+    # 检查是否包含CV17.5相关的模型
+    cv175_models = [model['name'] for model in model_list if 'CV17.5' in model['name']]
+    print(f"[DEBUG] CV17.5 models found: {cv175_models}")
+    
+    # 检查是否包含平焊相关的模型
+    pinghan_models = [model['name'] for model in model_list if '平焊' in model['name']]
+    print(f"[DEBUG] 平焊 models found: {pinghan_models}")
    # result_obj = process_excel(source_excel_path, sheet_name=0)
    # output_file_path = source_excel_path.parent.joinpath(
    #     source_excel_path.stem + "_预测结果.xlsx"
--- a/test_model_load.py
+++ b/test_model_load.py
@ -0,0 +1,34 @@
+import os
+import sys
+from pathlib import Path
+
+# 添加当前目录到Python路径
+sys.path.append(str(Path(__file__).parent))
+
+# 导入需要的模块
+from predict_with_excel import load_all_models, model_list
+
+# 测试模型加载
+print("[TEST] Starting model loading test...")
+print(f"[TEST] Current working directory: {os.getcwd()}")
+
+# 加载模型
+load_all_models()
+
+# 显示加载的模型信息
+print(f"[TEST] Total models loaded: {len(model_list)}")
+if model_list:
+    print("[TEST] Loaded models:")
+    for model in model_list:
+        print(f"  - {model['name']}")
+else:
+    print("[TEST] No models were loaded!")
+
+# 检查EV17.5相关的模型
+ev175_models = [model for model in model_list if 'EV17.5' in model['name']]
+print(f"[TEST] EV17.5 models found: {len(ev175_models)}")
+if ev175_models:
+    for model in ev175_models:
+        print(f"  - {model['name']}")
+else:
+    print("[TEST] No EV17.5 models found!")