|
@@ -1,28 +1,14 @@
|
|
|
-(base) [root@localhost ~]# docker exec -w /root/Fine-tuning/backend finetune-trainer /opt/conda/bin/python -m app.engines.remote_train "test-manual-001" "Qwen/Qwen3.5-0.8B" "text" "/root/Fine-tuning/backend/data/processed/ms_yanalong_yanalong/distill_r1_sft.json" "/root/Fine-tuning/backend/data/config_aa342346-a39e-4644-9a34-f3a9d3b961f8.json"
|
|
|
|
|
-2026-05-20 14:28:57 | ERROR | peft-platform | Remote training failed: test-manual-001 - Extra data: line 2 column 1 (char 71)
|
|
|
|
|
-Traceback (most recent call last):
|
|
|
|
|
- File "/opt/conda/lib/python3.10/runpy.py", line 196, in _run_module_as_main
|
|
|
|
|
- return _run_code(code, main_globals, None,
|
|
|
|
|
- File "/opt/conda/lib/python3.10/runpy.py", line 86, in _run_code
|
|
|
|
|
- exec(code, run_globals)
|
|
|
|
|
- File "/root/Fine-tuning/backend/app/engines/remote_train.py", line 162, in <module>
|
|
|
|
|
- main()
|
|
|
|
|
- File "/root/Fine-tuning/backend/app/engines/remote_train.py", line 158, in main
|
|
|
|
|
- asyncio.run(run_training(job_id, model_id, model_type, dataset_id, config))
|
|
|
|
|
- File "/opt/conda/lib/python3.10/asyncio/runners.py", line 44, in run
|
|
|
|
|
- return loop.run_until_complete(main)
|
|
|
|
|
- File "/opt/conda/lib/python3.10/asyncio/base_events.py", line 649, in run_until_complete
|
|
|
|
|
- return future.result()
|
|
|
|
|
- File "/root/Fine-tuning/backend/app/engines/remote_train.py", line 108, in run_training
|
|
|
|
|
- await engine.preprocess_dataset(dataset_path, processed_path, task_type=task_type, template=template)
|
|
|
|
|
- File "/root/Fine-tuning/backend/app/engines/text_engine.py", line 119, in preprocess_dataset
|
|
|
|
|
- processed = preprocess_file(dataset_path, output_path, task_type, template)
|
|
|
|
|
- File "/root/Fine-tuning/backend/app/preprocessors/__init__.py", line 130, in preprocess_file
|
|
|
|
|
- data = json.load(f)
|
|
|
|
|
- File "/opt/conda/lib/python3.10/json/__init__.py", line 293, in load
|
|
|
|
|
- return loads(fp.read(),
|
|
|
|
|
- File "/opt/conda/lib/python3.10/json/__init__.py", line 346, in loads
|
|
|
|
|
- return _default_decoder.decode(s)
|
|
|
|
|
- File "/opt/conda/lib/python3.10/json/decoder.py", line 340, in decode
|
|
|
|
|
- raise JSONDecodeError("Extra data", s, end)
|
|
|
|
|
-json.decoder.JSONDecodeError: Extra data: line 2 column 1 (char 71)
|
|
|
|
|
|
|
+lq@lq:~/Fine-tuning$ sudo docker exec finetune-postgres psql -U finetune -d finetuning -c "SELECT id, name, file_path FROM datasets;"
|
|
|
|
|
+[sudo] password for lq:
|
|
|
|
|
+ id | name | file_path
|
|
|
|
|
+--------------------------------------+-------------------+--------------------------------------------------------------------------
|
|
|
|
|
+ 3d5f8808-e71a-449d-94e9-c61c4881b2cf | yanalong/yanalong | /root/Fine-tuning/backend/data/processed/ms_yanalong_yanalong/data.jsonl
|
|
|
|
|
+(1 row)
|
|
|
|
|
+
|
|
|
|
|
+lq@lq:~/Fine-tuning$ docker exec finetune-backend ls -la /root/Fine-tuning/backend/data/uploads/
|
|
|
|
|
+permission denied while trying to connect to the Docker daemon socket at unix:///var/run/docker.sock: Get "http://%2Fvar%2Frun%2Fdocker.sock/v1.49/containers/finetune-backend/json": dial unix /var/run/docker.sock: connect: permission denied
|
|
|
|
|
+lq@lq:~/Fine-tuning$ sudo docker exec finetune-backend ls -la /root/Fine-tuning/backend/data/uploads/
|
|
|
|
|
+total 8
|
|
|
|
|
+drwxr-xr-x 2 root root 4096 May 20 06:35 .
|
|
|
|
|
+drwxrwxr-x 6 1000 1000 4096 May 21 01:27 ..
|
|
|
|
|
+lq@lq:~/Fine-tuning$
|