[2025-12-26 10:10:04,765] [DEBUG] [axolotl.utils.config.resolve_dtype:66] [PID:1090] bf16 support detected, enabling for this configuration.
config.json: 0%|          | 0.00/760 [00:00<?, ?B/s]
[...]
  },
  "streaming_multipack_buffer_size": 10000,
  "strict": false,
  "tensor_parallel_size": 1,
  "tf32": true,
  "tiled_mlp_use_original_mlp": true,
  "tokenizer_config": "deepseek-ai/deepseek-coder-6.7b-instruct",
  "tokenizer_save_jinja_files": true,
  "torch_dtype": "torch.bfloat16",
  "train_on_inputs": false,
  "trl": {
    "log_completions": false,
    "mask_truncated_completions": false,
    "ref_model_mixup_alpha": 0.9,
    "ref_model_sync_steps": 64,
    "scale_rewards": true,
    "sync_ref_model": false,
    "use_vllm": false,
    "vllm_server_host": "0.0.0.0",
    "vllm_server_port": 8000
  },
  "trust_remote_code": true,
  "use_otel_metrics": false,
  "use_ray": false,
  "use_wandb": true,
  "val_set_size": 0.05,
  "vllm": {
    "device": "auto",
    "dtype": "auto",
    "gpu_memory_utilization": 0.9,
    "host": "0.0.0.0",
    "port": 8000
  },
  "wandb_name": "deepseek-coder-6.7b-luau",
  "wandb_project": "deepseek-luau-finetune",
  "warmup_ratio": 0.1,
  "weight_decay": 0.01,
  "world_size": 1
}
tokenizer_config.json: 1.87kB [00:00, 9.83MB/s]
tokenizer.json: 1.37MB [00:00, 12.5MB/s]
[2025-12-26 10:10:09,472] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:280] [PID:1090] EOS: 32021 / <|EOT|>
[2025-12-26 10:10:09,472] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:281] [PID:1090] BOS: 32013 / <|begin▁of▁sentence|>
[2025-12-26 10:10:09,472] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:282] [PID:1090] PAD: 32021 / <|EOT|>
[2025-12-26 10:10:09,472] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:283] [PID:1090] UNK: None / None
[2025-12-26 10:10:09,472] [INFO] [axolotl.utils.data.shared.load_preprocessed_dataset:481] [PID:1090] Unable to find prepared dataset in last_run_prepared/b55957ea74fd9e928a892829ce7838eb
[2025-12-26 10:10:09,472] [INFO] [axolotl.utils.data.sft._load_raw_datasets:320] [PID:1090] Loading raw datasets...
[2025-12-26 10:10:09,472] [WARNING] [axolotl.utils.data.sft._load_raw_datasets:322] [PID:1090] Processing datasets during training can lead to VRAM instability. Please pre-process your dataset using `axolotl preprocess path/to/config.yml`.
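The `resolve_dtype` line at the top of this log is a hardware capability probe. Below is a minimal sketch of an equivalent check in plain PyTorch; the fallback chain is illustrative, not axolotl's exact logic:

    import torch

    # bf16 needs Ampere (compute capability 8.0) or newer; this mirrors the
    # capability check behind the resolve_dtype DEBUG line above.
    if torch.cuda.is_available() and torch.cuda.is_bf16_supported():
        dtype = torch.bfloat16  # matches "torch_dtype": "torch.bfloat16" in the config
    elif torch.cuda.is_available():
        dtype = torch.float16   # illustrative fallback for pre-Ampere GPUs
    else:
        dtype = torch.float32
    print(f"selected dtype: {dtype}")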
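The four tokenizer DEBUG lines are worth sanity-checking before a run, since a PAD that aliases EOS (32021 / <|EOT|> here) can matter for loss masking. A sketch using the tokenizer id from the resolved config; note a freshly loaded tokenizer may report a different PAD until axolotl applies its pad-to-EOS default:

    from transformers import AutoTokenizer

    tok = AutoTokenizer.from_pretrained(
        "deepseek-ai/deepseek-coder-6.7b-instruct",
        trust_remote_code=True,  # mirrors "trust_remote_code": true in the config
    )
    # Expected to echo the DEBUG lines above: EOS 32021 / <|EOT|>,
    # BOS 32013 / <|begin▁of▁sentence|>, and no UNK token.
    for name in ("eos", "bos", "pad", "unk"):
        print(name.upper(), getattr(tok, f"{name}_token_id"), "/", getattr(tok, f"{name}_token"))

Following the WARNING above, running `axolotl preprocess path/to/config.yml` once before `axolotl train` moves the tokenization pass below out of the training job and sidesteps the VRAM instability it mentions.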
README.md: 1.79kB [00:00, 11.7MB/s]
train.jsonl: 0%|          | 0.00/41.1M [00:00<?, ?B/s]
Dropping Long Sequences (>3072) (num_proc=32): 100%|██████████| 22636/22636 [00:00<00:00, 72336.69 examples/s]
Drop Samples with Zero Trainable Tokens (num_proc=32): 0%|          | 0/22636 [00:00<?, ? examples/s]
[2025-12-26 10:10:20,767] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:280] [PID:1090] EOS: 32021 / <|EOT|>
[2025-12-26 10:10:20,767] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:281] [PID:1090] BOS: 32013 / <|begin▁of▁sentence|>
[2025-12-26 10:10:20,767] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:282] [PID:1090] PAD: 32021 / <|EOT|>
[2025-12-26 10:10:20,767] [DEBUG] [axolotl.loaders.tokenizer.load_tokenizer:283] [PID:1090] UNK: None / None
[2025-12-26 10:10:20,767] [DEBUG] [axolotl.train.setup_model_and_tokenizer:82] [PID:1090] Loading model
[2025-12-26 10:10:21,021] [DEBUG] [axolotl.monkeypatch.transformers.trainer_loss_calc.patch_evaluation_loop:87] [PID:1090] Patched Trainer.evaluation_loop with nanmean loss calculation
[2025-12-26 10:10:21,022] [DEBUG] [axolotl.monkeypatch.transformers.trainer_loss_calc.patch_maybe_log_save_evaluate:138] [PID:1090] Patched Trainer._maybe_log_save_evaluate with nanmean loss calculation
[2025-12-26 10:10:21,022] [INFO] [axolotl.loaders.patch_manager._apply_multipack_patches:301] [PID:1090] Applying multipack dataloader patch for sample packing...
model.safetensors.index.json: 25.1kB [00:00, 109MB/s]
model-00001-of-00002.safetensors: 0%|          | 0.00/9.98G [00:00<?, ?B/s]
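The two dataset-map steps above ("Dropping Long Sequences (>3072)" and "Drop Samples with Zero Trainable Tokens") behave like ordinary `datasets` filters. A minimal sketch on a toy dataset, assuming the standard `input_ids`/`labels` column names; axolotl's own implementation may differ:

    from datasets import Dataset

    MAX_LEN = 3072  # the sequence_len ceiling behind ">3072" above

    def keep(ex):
        if len(ex["input_ids"]) > MAX_LEN:           # long-sequence drop
            return False
        return any(l != -100 for l in ex["labels"])  # zero-trainable-token drop

    # Toy two-row dataset: one short trainable row, one over-length row.
    toy = Dataset.from_dict({
        "input_ids": [[1, 2, 3], list(range(4000))],
        "labels":    [[-100, 2, 3], [-100] * 4000],
    })
    print(len(toy.filter(keep)))  # -> 1; add num_proc=32 for the parallelism logged above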
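The "multipack dataloader patch for sample packing" refers to packing several short tokenized examples into each 3072-token window so little of the batch is padding. A toy first-fit-decreasing sketch of the idea; axolotl's actual multipack algorithm and batching details differ:

    def pack(lengths, budget=3072):
        """Greedily bin-pack sequence lengths into fixed token budgets."""
        bins = []
        for n in sorted(lengths, reverse=True):  # first-fit-decreasing
            for b in bins:
                if sum(b) + n <= budget:
                    b.append(n)
                    break
            else:
                bins.append([n])
        return bins

    print(pack([3000, 100, 2000, 900, 72]))  # -> [[3000, 72], [2000, 900, 100]]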
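The first of the two safetensors shards is 9.98 GB, consistent with bf16 storage (about two bytes per weight for a 6.7B-parameter model). A sketch of an equivalent standalone load in plain `transformers`; `device_map="auto"` (which needs `accelerate` installed) is an assumption here, not something the log shows:

    import torch
    from transformers import AutoModelForCausalLM

    model = AutoModelForCausalLM.from_pretrained(
        "deepseek-ai/deepseek-coder-6.7b-instruct",
        torch_dtype=torch.bfloat16,  # mirrors the resolved config above
        trust_remote_code=True,
        device_map="auto",           # assumption: automatic placement via accelerate
    )
    print(next(model.parameters()).dtype)  # torch.bfloat16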