|
|
@@ -1,5 +1,18 @@
|
|
|
-(base) [root@localhost ~]# docker exec finetune-trainer cat /root/Fine-tuning/backend/data/logs/638a1786-04d7-44ea-b274-2c673aea22e2.jsonl
|
|
|
-{"ts": "2026-05-22T08:58:18.130363+00:00", "type": "start", "job_id": "638a1786-04d7-44ea-b274-2c673aea22e2"}
|
|
|
-{"ts": "2026-05-22T08:58:18.132911+00:00", "type": "status", "status": "preprocessing"}
|
|
|
-{"ts": "2026-05-22T08:58:22.234319+00:00", "type": "status", "status": "loading_model"}
|
|
|
-{"ts": "2026-05-22T08:58:42.046499+00:00", "type": "error", "message": "GPU model loading failed: We encountered some issues during automatic conversion of the weights. For details look at the `CONVERSION` entries of the above report!", "traceback": "Traceback (most recent call last):\n File \"/root/Fine-tuning/backend/app/engines/remote_train.py\", line 157, in run_training\n await engine.load_model(model_id, quantization=quantization_mode)\n File \"/root/Fine-tuning/backend/app/engines/text_engine.py\", line 131, in load_model\n raise RuntimeError(f\"GPU model loading failed: {load_error[0]}\")\nRuntimeError: GPU model loading failed: We encountered some issues during automatic conversion of the weights. For details look at the `CONVERSION` entries of the above report!\n"}
|
|
|
+(base) [root@localhost ~]# docker exec finetune-trainer /opt/conda/bin/pip install bitsandbytes
|
|
|
+Looking in indexes: http://mirrors.aliyun.com/pypi/simple
|
|
|
+Collecting bitsandbytes
|
|
|
+ Using cached http://mirrors.aliyun.com/pypi/packages/19/57/3443d6f183436fbdaf5000aac332c4d5ddb056665d459244a5608e98ae92/bitsandbytes-0.49.2-py3-none-manylinux_2_24_x86_64.whl (60.7 MB)
|
|
|
+Requirement already satisfied: torch<3,>=2.3 in /opt/conda/lib/python3.10/site-packages (from bitsandbytes) (2.8.0+metax3.5.3.9)
|
|
|
+Requirement already satisfied: numpy>=1.17 in /opt/conda/lib/python3.10/site-packages (from bitsandbytes) (1.26.4)
|
|
|
+Requirement already satisfied: packaging>=20.9 in /opt/conda/lib/python3.10/site-packages (from bitsandbytes) (26.2)
|
|
|
+Requirement already satisfied: filelock in /opt/conda/lib/python3.10/site-packages (from torch<3,>=2.3->bitsandbytes) (3.29.0)
|
|
|
+Requirement already satisfied: typing-extensions>=4.10.0 in /opt/conda/lib/python3.10/site-packages (from torch<3,>=2.3->bitsandbytes) (4.15.0)
|
|
|
+Requirement already satisfied: sympy>=1.13.3 in /opt/conda/lib/python3.10/site-packages (from torch<3,>=2.3->bitsandbytes) (1.14.0)
|
|
|
+Requirement already satisfied: networkx in /opt/conda/lib/python3.10/site-packages (from torch<3,>=2.3->bitsandbytes) (3.4.2)
|
|
|
+Requirement already satisfied: jinja2 in /opt/conda/lib/python3.10/site-packages (from torch<3,>=2.3->bitsandbytes) (3.1.6)
|
|
|
+Requirement already satisfied: fsspec in /opt/conda/lib/python3.10/site-packages (from torch<3,>=2.3->bitsandbytes) (2025.5.1)
|
|
|
+Requirement already satisfied: mpmath<1.4,>=1.1.0 in /opt/conda/lib/python3.10/site-packages (from sympy>=1.13.3->torch<3,>=2.3->bitsandbytes) (1.3.0)
|
|
|
+Requirement already satisfied: MarkupSafe>=2.0 in /opt/conda/lib/python3.10/site-packages (from jinja2->torch<3,>=2.3->bitsandbytes) (3.0.2)
|
|
|
+Installing collected packages: bitsandbytes
|
|
|
+Successfully installed bitsandbytes-0.49.2
|
|
|
+WARNING: Running pip as the 'root' user can result in broken permissions and conflicting behaviour with the system package manager, possibly rendering your system unusable.It is recommended to use a virtual environment instead: https://pip.pypa.io/warnings/venv. Use the --root-user-action option if you know what you are doing and want to suppress this warning.
|