|
|
@@ -1,52 +1,127 @@
|
|
|
-(base) [root@localhost ~]# docker exec finetune-trainer bash -c 'sed -n "1400,1450p" /opt/conda/lib/python3.10/site-packages/trl/trainer/dpo_trainer.py'
|
|
|
- warnings.warn(
|
|
|
- "compute_loss is only implemented for DPODataCollatorWithPadding, and you passed a datacollator that is different than "
|
|
|
- "DPODataCollatorWithPadding - you might see unexpected behavior. Alternatively, you can implement your own prediction_step method if you are using a custom data collator"
|
|
|
- )
|
|
|
-
|
|
|
- compute_loss_context_manager = torch.cuda.amp.autocast if self._peft_has_been_casted_to_bf16 else nullcontext
|
|
|
-
|
|
|
- with compute_loss_context_manager():
|
|
|
- loss, metrics = self.get_batch_loss_metrics(model, inputs, train_eval="train")
|
|
|
-
|
|
|
- # Make sure to move the loss to the device the original accumulating loss is at back in the `Trainer` class:
|
|
|
- loss = loss.to(self.args.device)
|
|
|
- # force log the metrics
|
|
|
- self.store_metrics(metrics, train_eval="train")
|
|
|
-
|
|
|
- if return_outputs:
|
|
|
- return (loss, metrics)
|
|
|
- return loss
|
|
|
-
|
|
|
- def get_batch_samples(self, model, batch: Dict[str, torch.LongTensor]) -> Tuple[str, str]:
|
|
|
- """Generate samples from the model and reference model for the given batch of inputs."""
|
|
|
-
|
|
|
- # If one uses `generate_during_eval` with peft + bf16, we need to explicitly call generate with
|
|
|
- # the torch cuda amp context manager as some hidden states are silently casted to full precision.
|
|
|
- generate_context_manager = nullcontext if not self._peft_has_been_casted_to_bf16 else torch.cuda.amp.autocast
|
|
|
-
|
|
|
- with generate_context_manager():
|
|
|
- policy_output = model.generate(
|
|
|
- input_ids=batch["prompt_input_ids"],
|
|
|
- attention_mask=batch["prompt_attention_mask"],
|
|
|
- max_length=self.max_length,
|
|
|
- do_sample=True,
|
|
|
- pad_token_id=self.tokenizer.pad_token_id,
|
|
|
- )
|
|
|
-
|
|
|
- # if reference_output in batch use that otherwise use the reference model
|
|
|
- if "reference_output" in batch:
|
|
|
- reference_output = batch["reference_output"]
|
|
|
- else:
|
|
|
- if self.ref_model is None:
|
|
|
- with self.null_ref_context():
|
|
|
- reference_output = self.model.generate(
|
|
|
- input_ids=batch["prompt_input_ids"],
|
|
|
- attention_mask=batch["prompt_attention_mask"],
|
|
|
- max_length=self.max_length,
|
|
|
- do_sample=True,
|
|
|
- pad_token_id=self.tokenizer.pad_token_id,
|
|
|
- )
|
|
|
- else:
|
|
|
- reference_output = self.ref_model.generate(
|
|
|
- input_ids=batch["prompt_input_ids"],
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Map: 0%| | 0/5 [00:00<?, ? examples/s]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Map: 100%|██████████| 5/5 [00:00<00:00, 174.12 examples/s]
|
|
|
+2026-05-27 07:35:25 | WARNING | peft-platform | [253:489b64b9] /opt/conda/lib/python3.10/site-packages/peft/tuners/tuners_utils.py:1348: UserWarning: Model has `tie_word_embeddings=True` and a tied layer is part of the adapter, but `ensure_weight_tying` is not set to True. This can lead to complications, for example when merging the adapter or converting your model to formats other than safetensors. Check the discussion here: https://github.com/huggingface/peft/issues/2777
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] warnings.warn(msg)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] bitsandbytes library load error: Configured CUDA binary not found at /opt/conda/lib/python3.10/site-packages/bitsandbytes/libbitsandbytes_cuda116.so
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Traceback (most recent call last):
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/bitsandbytes/cextension.py", line 320, in <module>
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] lib = get_native_library()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/bitsandbytes/cextension.py", line 288, in get_native_library
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] raise RuntimeError(f"Configured {BNB_BACKEND} binary not found at {cuda_binary_path}")
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] RuntimeError: Configured CUDA binary not found at /opt/conda/lib/python3.10/site-packages/bitsandbytes/libbitsandbytes_cuda116.so
|
|
|
+2026-05-27 07:35:25 | WARNING | peft-platform | [253:489b64b9] [transformers] warmup_ratio is deprecated and will be removed in v5.2. Use `warmup_steps` instead.
|
|
|
+2026-05-27 07:35:25 | WARNING | peft-platform | [253:489b64b9] [transformers] warmup_ratio is deprecated and will be removed in v5.2. Use `warmup_steps` instead.
|
|
|
+2026-05-27 07:35:25 | WARNING | peft-platform | [253:489b64b9] /opt/conda/lib/python3.10/site-packages/trl/trainer/dpo_trainer.py:394: UserWarning: `max_length` is not set in the DPOConfig's init it will default to `512` by default, but you should do it yourself in the future.
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] warnings.warn(
|
|
|
+2026-05-27 07:35:25 | WARNING | peft-platform | [253:489b64b9] /opt/conda/lib/python3.10/site-packages/trl/trainer/dpo_trainer.py:407: UserWarning: `max_prompt_length` is not set in the DPOConfig's init it will default to `128` by default, but you should do it yourself in the future.
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] warnings.warn(
|
|
|
+2026-05-27 07:35:25 | WARNING | peft-platform | [253:489b64b9] /opt/conda/lib/python3.10/site-packages/trl/trainer/dpo_trainer.py:442: UserWarning: When using DPODataCollatorWithPadding, you should set `remove_unused_columns=False` in your TrainingArguments we have set it for you, but you should do it yourself in the future.
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] warnings.warn(
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] trainable params: 5,070,848 || all params: 757,463,872 || trainable%: 0.6695
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Map: 0%| | 0/5 [00:00<?, ? examples/s]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Map: 100%|██████████| 5/5 [00:00<00:00, 173.18 examples/s]
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] 0%| | 0/1 [00:00<?, ?it/s]Training failed for job 489b64b9-f349-4263-82e1-b6a73eaeff80: Caught TypeError in DataLoader worker process 0.
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Original Traceback (most recent call last):
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/worker.py", line 349, in _worker_loop
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data = fetcher.fetch(index) # type: ignore[possibly-undefined]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 55, in fetch
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return self.collate_fn(data)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in __call__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in <listcomp>
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] TypeError: 'NoneType' object cannot be interpreted as an integer
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] [remote_train] [rank 0] ERROR: Caught TypeError in DataLoader worker process 0.
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Original Traceback (most recent call last):
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/worker.py", line 349, in _worker_loop
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data = fetcher.fetch(index) # type: ignore[possibly-undefined]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 55, in fetch
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return self.collate_fn(data)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in __call__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in <listcomp>
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] TypeError: 'NoneType' object cannot be interpreted as an integer
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] [remote_train] Traceback (most recent call last):
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/remote_train.py", line 236, in run_training
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] adapter_path = await engine.train(
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/text_engine.py", line 469, in train
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] trainer.train()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/transformers/trainer.py", line 1427, in train
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return inner_training_loop(
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/transformers/trainer.py", line 1509, in _inner_training_loop
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] self._run_epoch(
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/transformers/trainer.py", line 1704, in _run_epoch
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] batch_samples, num_items_in_batch = self.get_batch_samples(epoch_iterator, num_batches, self.args.device)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/text_engine.py", line 296, in _patched_gbs
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] batch = next(epoch_iterator)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/accelerate/data_loader.py", line 577, in __iter__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] current_batch = next(dataloader_iter)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 734, in __next__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data = self._next_data()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 1516, in _next_data
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return self._process_data(data, worker_id)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 1551, in _process_data
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data.reraise()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/_utils.py", line 769, in reraise
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] raise exception
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] TypeError: Caught TypeError in DataLoader worker process 0.
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Original Traceback (most recent call last):
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/worker.py", line 349, in _worker_loop
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data = fetcher.fetch(index) # type: ignore[possibly-undefined]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 55, in fetch
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return self.collate_fn(data)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in __call__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in <listcomp>
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] TypeError: 'NoneType' object cannot be interpreted as an integer
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] [remote_train] === Training job failed: 489b64b9-f349-4263-82e1-b6a73eaeff80 ===
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Traceback (most recent call last):
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/runpy.py", line 196, in _run_module_as_main
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return _run_code(code, main_globals, None,
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/runpy.py", line 86, in _run_code
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] exec(code, run_globals)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/remote_train.py", line 466, in <module>
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] main()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/remote_train.py", line 461, in main
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] asyncio.run(run_training(job_id, model_id, model_type, dataset_id, config,
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/asyncio/runners.py", line 44, in run
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return loop.run_until_complete(main)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/asyncio/base_events.py", line 649, in run_until_complete
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return future.result()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/remote_train.py", line 236, in run_training
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] adapter_path = await engine.train(
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/text_engine.py", line 469, in train
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] trainer.train()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/transformers/trainer.py", line 1427, in train
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return inner_training_loop(
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/transformers/trainer.py", line 1509, in _inner_training_loop
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] self._run_epoch(
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/transformers/trainer.py", line 1704, in _run_epoch
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] batch_samples, num_items_in_batch = self.get_batch_samples(epoch_iterator, num_batches, self.args.device)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/root/Fine-tuning/backend/app/engines/text_engine.py", line 296, in _patched_gbs
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] batch = next(epoch_iterator)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/accelerate/data_loader.py", line 577, in __iter__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] current_batch = next(dataloader_iter)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 734, in __next__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data = self._next_data()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 1516, in _next_data
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return self._process_data(data, worker_id)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 1551, in _process_data
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data.reraise()
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/_utils.py", line 769, in reraise
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] raise exception
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] TypeError: Caught TypeError in DataLoader worker process 0.
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] Original Traceback (most recent call last):
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/worker.py", line 349, in _worker_loop
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] data = fetcher.fetch(index) # type: ignore[possibly-undefined]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 55, in fetch
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] return self.collate_fn(data)
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in __call__
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] File "/opt/conda/lib/python3.10/site-packages/trl/trainer/utils.py", line 460, in <listcomp>
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] to_pad = [torch.tensor(ex[k], dtype=dtype) for ex in features]
|
|
|
+2026-05-27 07:35:25 | ERROR | peft-platform | [253:489b64b9] TypeError: 'NoneType' object cannot be interpreted as an integer
|
|
|
+2026-05-27 07:35:25 | INFO | peft-platform | [253:489b64b9] 0%| | 0/1 [00:14<?, ?it/s]
|
|
|
+INFO: 127.0.0.1:56702 - "GET /health HTTP/1.1" 200 OK
|