Pamzyy commited on
Commit
dc6ff7c
·
verified ·
1 Parent(s): 0edba91

Final logs after training

Browse files
.gitattributes CHANGED
@@ -34,3 +34,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
 
 
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
  tokenizer.json filter=lfs diff=lfs merge=lfs -text
37
+ session_logs/lora_finetuning_report.pdf filter=lfs diff=lfs merge=lfs -text
session_logs/logs/events.out.tfevents.1739444870.30dae5ad871f.6130.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:04ab353d501a1353abcae20ec8a3f4065c89fbb65295601ee85675d8e53e3ae5
3
+ size 6880
session_logs/logs/events.out.tfevents.1739445167.30dae5ad871f.13649.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:28516573d16fe33e07b63fa3c8b64213bc33f7e80151cc88d564db110eb8ca6e
3
+ size 6501
session_logs/logs/events.out.tfevents.1739445528.30dae5ad871f.16400.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7783c4d63f85dce620d2ee7f348d58e7d837517eb76c7c3daa9059a131c23122
3
+ size 174790
session_logs/logs/events.out.tfevents.1739532681.30dae5ad871f.16400.1 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6f1784bd4ee809a729facdecdc483b8a5af0f98283ffadcea2a6d2915fa17f9
3
+ size 364
session_logs/lora_finetuning.log ADDED
@@ -0,0 +1,12 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ 2025-02-13 11:17:52,968 - Logging initialized for session: 565629c2-b9c1-4f20-8f6e-6c380b743216
2
+ 2025-02-13 11:17:53,656 - We will use 90% of the memory on device 0 for storing the model, and 10% for the buffer to avoid OOM. You can set `max_memory` in to a higher value to use more memory (at your own risk).
3
+ 2025-02-14 11:34:23,998 - Using default tokenizer.
4
+ 2025-02-14 11:34:25,367 - Hyperparameters: {'output_dir': './lora_finetuned', 'overwrite_output_dir': False, 'do_train': False, 'do_eval': True, 'do_predict': False, 'eval_strategy': <IntervalStrategy.STEPS: 'steps'>, 'prediction_loss_only': False, 'per_device_train_batch_size': 1, 'per_device_eval_batch_size': 2, 'per_gpu_train_batch_size': None, 'per_gpu_eval_batch_size': None, 'gradient_accumulation_steps': 1, 'eval_accumulation_steps': None, 'eval_delay': 0, 'torch_empty_cache_steps': None, 'learning_rate': 0.0002, 'weight_decay': 0.0, 'adam_beta1': 0.9, 'adam_beta2': 0.999, 'adam_epsilon': 1e-08, 'max_grad_norm': 0.3, 'num_train_epochs': 1, 'max_steps': 35000, 'lr_scheduler_type': <SchedulerType.LINEAR: 'linear'>, 'lr_scheduler_kwargs': {}, 'warmup_ratio': 0.0, 'warmup_steps': 1000, 'log_level': 'passive', 'log_level_replica': 'warning', 'log_on_each_node': True, 'logging_dir': './logs', 'logging_strategy': <IntervalStrategy.STEPS: 'steps'>, 'logging_first_step': False, 'logging_steps': 50, 'logging_nan_inf_filter': True, 'save_strategy': <SaveStrategy.STEPS: 'steps'>, 'save_steps': 10000, 'save_total_limit': None, 'save_safetensors': True, 'save_on_each_node': False, 'save_only_model': False, 'restore_callback_states_from_checkpoint': False, 'no_cuda': False, 'use_cpu': False, 'use_mps_device': False, 'seed': 42, 'data_seed': None, 'jit_mode_eval': False, 'use_ipex': False, 'bf16': True, 'fp16': False, 'fp16_opt_level': 'O1', 'half_precision_backend': 'auto', 'bf16_full_eval': False, 'fp16_full_eval': False, 'tf32': True, 'local_rank': 0, 'ddp_backend': None, 'tpu_num_cores': None, 'tpu_metrics_debug': False, 'debug': [], 'dataloader_drop_last': False, 'eval_steps': 500, 'dataloader_num_workers': 0, 'dataloader_prefetch_factor': None, 'past_index': -1, 'run_name': './lora_finetuned', 'disable_tqdm': False, 'remove_unused_columns': False, 'label_names': None, 'load_best_model_at_end': False, 'metric_for_best_model': None, 'greater_is_better': None, 'ignore_data_skip': False, 'fsdp': [], 'fsdp_min_num_params': 0, 'fsdp_config': {'min_num_params': 0, 'xla': False, 'xla_fsdp_v2': False, 'xla_fsdp_grad_ckpt': False}, 'fsdp_transformer_layer_cls_to_wrap': None, 'accelerator_config': AcceleratorConfig(split_batches=False, dispatch_batches=None, even_batches=True, use_seedable_sampler=True, non_blocking=False, gradient_accumulation_kwargs=None, use_configured_state=False), 'deepspeed': None, 'label_smoothing_factor': 0.0, 'optim': <OptimizerNames.PAGED_ADAMW_8BIT: 'paged_adamw_8bit'>, 'optim_args': None, 'adafactor': False, 'group_by_length': False, 'length_column_name': 'length', 'report_to': ['tensorboard'], 'ddp_find_unused_parameters': None, 'ddp_bucket_cap_mb': None, 'ddp_broadcast_buffers': None, 'dataloader_pin_memory': True, 'dataloader_persistent_workers': False, 'skip_memory_metrics': True, 'use_legacy_prediction_loop': False, 'push_to_hub': True, 'resume_from_checkpoint': None, 'hub_model_id': 'Pamzyy/Packing_test', 'hub_strategy': <HubStrategy.EVERY_SAVE: 'every_save'>, 'hub_private_repo': None, 'hub_always_push': False, 'gradient_checkpointing': True, 'gradient_checkpointing_kwargs': None, 'include_inputs_for_metrics': False, 'include_for_metrics': [], 'eval_do_concat_batches': True, 'fp16_backend': 'auto', 'evaluation_strategy': 'steps', 'push_to_hub_model_id': None, 'push_to_hub_organization': None, 'push_to_hub_token': None, 'mp_parameters': '', 'auto_find_batch_size': False, 'full_determinism': False, 'torchdynamo': None, 'ray_scope': 'last', 'ddp_timeout': 1800, 'torch_compile': False, 'torch_compile_backend': None, 'torch_compile_mode': None, 'dispatch_batches': None, 'split_batches': None, 'include_tokens_per_second': False, 'include_num_input_tokens_seen': False, 'neftune_noise_alpha': None, 'optim_target_modules': None, 'batch_eval_metrics': False, 'eval_on_start': False, 'use_liger_kernel': False, 'eval_use_gather_object': False, 'average_tokens_across_devices': False, 'distributed_state': Distributed environment: NO
5
+ Num processes: 1
6
+ Process index: 0
7
+ Local process index: 0
8
+ Device: cuda
9
+ , '_n_gpu': 1, '__cached__setup_devices': device(type='cuda', index=0), 'deepspeed_plugin': None}
10
+ 2025-02-14 11:34:25,367 - Training details: {'Epochs': 1, 'Training Steps': 35000, 'Final Loss': 1.5239, 'Final Learning Rate': 0.0, 'Total Training Time (s)': '87095.12'}
11
+ 2025-02-14 11:34:25,367 - Training metrics: {'epochs': [50, 100, 150, 200, 250, 300, 350, 400, 450, 500, 550, 600, 650, 700, 750, 800, 850, 900, 950, 1000, 1050, 1100, 1150, 1200, 1250, 1300, 1350, 1400, 1450, 1500, 1550, 1600, 1650, 1700, 1750, 1800, 1850, 1900, 1950, 2000, 2050, 2100, 2150, 2200, 2250, 2300, 2350, 2400, 2450, 2500, 2550, 2600, 2650, 2700, 2750, 2800, 2850, 2900, 2950, 3000, 3050, 3100, 3150, 3200, 3250, 3300, 3350, 3400, 3450, 3500, 3550, 3600, 3650, 3700, 3750, 3800, 3850, 3900, 3950, 4000, 4050, 4100, 4150, 4200, 4250, 4300, 4350, 4400, 4450, 4500, 4550, 4600, 4650, 4700, 4750, 4800, 4850, 4900, 4950, 5000, 5050, 5100, 5150, 5200, 5250, 5300, 5350, 5400, 5450, 5500, 5550, 5600, 5650, 5700, 5750, 5800, 5850, 5900, 5950, 6000, 6050, 6100, 6150, 6200, 6250, 6300, 6350, 6400, 6450, 6500, 6550, 6600, 6650, 6700, 6750, 6800, 6850, 6900, 6950, 7000, 7050, 7100, 7150, 7200, 7250, 7300, 7350, 7400, 7450, 7500, 7550, 7600, 7650, 7700, 7750, 7800, 7850, 7900, 7950, 8000, 8050, 8100, 8150, 8200, 8250, 8300, 8350, 8400, 8450, 8500, 8550, 8600, 8650, 8700, 8750, 8800, 8850, 8900, 8950, 9000, 9050, 9100, 9150, 9200, 9250, 9300, 9350, 9400, 9450, 9500, 9550, 9600, 9650, 9700, 9750, 9800, 9850, 9900, 9950, 10000, 10050, 10100, 10150, 10200, 10250, 10300, 10350, 10400, 10450, 10500, 10550, 10600, 10650, 10700, 10750, 10800, 10850, 10900, 10950, 11000, 11050, 11100, 11150, 11200, 11250, 11300, 11350, 11400, 11450, 11500, 11550, 11600, 11650, 11700, 11750, 11800, 11850, 11900, 11950, 12000, 12050, 12100, 12150, 12200, 12250, 12300, 12350, 12400, 12450, 12500, 12550, 12600, 12650, 12700, 12750, 12800, 12850, 12900, 12950, 13000, 13050, 13100, 13150, 13200, 13250, 13300, 13350, 13400, 13450, 13500, 13550, 13600, 13650, 13700, 13750, 13800, 13850, 13900, 13950, 14000, 14050, 14100, 14150, 14200, 14250, 14300, 14350, 14400, 14450, 14500, 14550, 14600, 14650, 14700, 14750, 14800, 14850, 14900, 14950, 15000, 15050, 15100, 15150, 15200, 15250, 15300, 15350, 15400, 15450, 15500, 15550, 15600, 15650, 15700, 15750, 15800, 15850, 15900, 15950, 16000, 16050, 16100, 16150, 16200, 16250, 16300, 16350, 16400, 16450, 16500, 16550, 16600, 16650, 16700, 16750, 16800, 16850, 16900, 16950, 17000, 17050, 17100, 17150, 17200, 17250, 17300, 17350, 17400, 17450, 17500, 17550, 17600, 17650, 17700, 17750, 17800, 17850, 17900, 17950, 18000, 18050, 18100, 18150, 18200, 18250, 18300, 18350, 18400, 18450, 18500, 18550, 18600, 18650, 18700, 18750, 18800, 18850, 18900, 18950, 19000, 19050, 19100, 19150, 19200, 19250, 19300, 19350, 19400, 19450, 19500, 19550, 19600, 19650, 19700, 19750, 19800, 19850, 19900, 19950, 20000, 20050, 20100, 20150, 20200, 20250, 20300, 20350, 20400, 20450, 20500, 20550, 20600, 20650, 20700, 20750, 20800, 20850, 20900, 20950, 21000, 21050, 21100, 21150, 21200, 21250, 21300, 21350, 21400, 21450, 21500, 21550, 21600, 21650, 21700, 21750, 21800, 21850, 21900, 21950, 22000, 22050, 22100, 22150, 22200, 22250, 22300, 22350, 22400, 22450, 22500, 22550, 22600, 22650, 22700, 22750, 22800, 22850, 22900, 22950, 23000, 23050, 23100, 23150, 23200, 23250, 23300, 23350, 23400, 23450, 23500, 23550, 23600, 23650, 23700, 23750, 23800, 23850, 23900, 23950, 24000, 24050, 24100, 24150, 24200, 24250, 24300, 24350, 24400, 24450, 24500, 24550, 24600, 24650, 24700, 24750, 24800, 24850, 24900, 24950, 25000, 25050, 25100, 25150, 25200, 25250, 25300, 25350, 25400, 25450, 25500, 25550, 25600, 25650, 25700, 25750, 25800, 25850, 25900, 25950, 26000, 26050, 26100, 26150, 26200, 26250, 26300, 26350, 26400, 26450, 26500, 26550, 26600, 26650, 26700, 26750, 26800, 26850, 26900, 26950, 27000, 27050, 27100, 27150, 27200, 27250, 27300, 27350, 27400, 27450, 27500, 27550, 27600, 27650, 27700, 27750, 27800, 27850, 27900, 27950, 28000, 28050, 28100, 28150, 28200, 28250, 28300, 28350, 28400, 28450, 28500, 28550, 28600, 28650, 28700, 28750, 28800, 28850, 28900, 28950, 29000, 29050, 29100, 29150, 29200, 29250, 29300, 29350, 29400, 29450, 29500, 29550, 29600, 29650, 29700, 29750, 29800, 29850, 29900, 29950, 30000, 30050, 30100, 30150, 30200, 30250, 30300, 30350, 30400, 30450, 30500, 30550, 30600, 30650, 30700, 30750, 30800, 30850, 30900, 30950, 31000, 31050, 31100, 31150, 31200, 31250, 31300, 31350, 31400, 31450, 31500, 31550, 31600, 31650, 31700, 31750, 31800, 31850, 31900, 31950, 32000, 32050, 32100, 32150, 32200, 32250, 32300, 32350, 32400, 32450, 32500, 32550, 32600, 32650, 32700, 32750, 32800, 32850, 32900, 32950, 33000, 33050, 33100, 33150, 33200, 33250, 33300, 33350, 33400, 33450, 33500, 33550, 33600, 33650, 33700, 33750, 33800, 33850, 33900, 33950, 34000, 34050, 34100, 34150, 34200, 34250, 34300, 34350, 34400, 34450, 34500, 34550, 34600, 34650, 34700, 34750, 34800, 34850, 34900, 34950, 35000], 'loss': [3.4393, 2.9346, 2.6116, 2.5777, 2.4135, 2.292, 2.25, 2.3119, 2.2479, 2.2356, 2.1795, 2.1244, 2.2056, 2.1674, 2.1038, 2.1065, 2.2026, 2.1706, 2.1342, 2.1518, 2.1897, 2.0642, 2.0254, 2.0583, 2.0562, 2.0778, 2.0987, 2.09, 2.1035, 2.0662, 2.0073, 2.1855, 1.9037, 2.0224, 1.9927, 1.9913, 1.9816, 1.9986, 2.0411, 1.8898, 2.0139, 2.0245, 1.9435, 1.8744, 1.9816, 1.9488, 2.013, 1.9855, 1.8829, 1.9859, 1.9737, 1.9791, 1.9055, 1.8894, 1.8236, 1.9786, 1.9607, 1.9765, 1.855, 1.9117, 1.9955, 1.9652, 1.8837, 1.8285, 2.0144, 1.8574, 1.9567, 1.8877, 1.9545, 1.8189, 1.9405, 1.8712, 1.8562, 1.8592, 1.9066, 1.8316, 1.8717, 1.9361, 1.8683, 1.8029, 1.8781, 1.8764, 1.9135, 1.8729, 1.8143, 1.8982, 1.7971, 1.8181, 1.7903, 1.8462, 1.8855, 1.8797, 1.82, 1.783, 1.8709, 1.8532, 1.8981, 1.9138, 1.9574, 1.7711, 1.8022, 1.8546, 1.908, 1.8705, 1.8311, 1.8904, 1.7629, 1.8221, 1.7904, 1.8791, 1.7977, 1.8337, 1.7775, 1.9295, 1.7888, 1.8667, 1.8126, 1.8333, 1.8461, 1.9432, 1.7875, 1.7999, 1.8548, 1.7556, 1.7593, 1.7566, 1.8218, 1.7793, 1.8919, 1.8381, 1.8409, 1.7581, 1.7837, 1.7583, 1.7035, 1.7211, 1.9914, 1.7564, 1.7443, 1.7639, 1.7241, 1.8012, 1.7524, 1.7853, 1.7487, 1.7717, 1.7464, 1.7696, 1.8237, 1.7591, 1.8245, 1.7565, 1.6927, 1.8199, 1.7233, 1.7073, 1.8073, 1.7437, 1.7509, 1.8396, 1.7182, 1.7387, 1.7671, 1.7621, 1.7809, 1.77, 1.7383, 1.6953, 1.7329, 1.7181, 1.6799, 1.7102, 1.7555, 1.7906, 1.7279, 1.7784, 1.6768, 1.6992, 1.832, 1.7601, 1.8571, 1.6978, 1.7479, 1.7472, 1.7054, 1.7068, 1.6754, 1.7526, 1.6936, 1.7366, 1.8304, 1.6824, 1.6979, 1.7696, 1.7613, 1.7015, 1.7418, 1.741, 1.8003, 1.8083, 1.7131, 1.7374, 1.7471, 1.7338, 1.6776, 1.7428, 1.7145, 1.7632, 1.7881, 1.6766, 1.691, 1.7238, 1.6613, 1.6135, 1.7063, 1.7814, 1.8215, 1.7257, 1.6485, 1.804, 1.6577, 1.6552, 1.6902, 1.6977, 1.6564, 1.6948, 1.719, 1.714, 1.6794, 1.7796, 1.6905, 1.6855, 1.7949, 1.8425, 1.6823, 1.7041, 1.7356, 1.7596, 1.707, 1.7224, 1.7311, 1.7007, 1.7198, 1.748, 1.6958, 1.64, 1.6876, 1.6651, 1.7525, 1.6308, 1.6039, 1.6361, 1.7341, 1.6957, 1.6328, 1.639, 1.6635, 1.633, 1.6028, 1.7304, 1.6729, 1.7277, 1.6458, 1.6491, 1.6845, 1.6339, 1.6831, 1.6511, 1.7042, 1.708, 1.6696, 1.6675, 1.6914, 1.7759, 1.7233, 1.6161, 1.6042, 1.6683, 1.6506, 1.6877, 1.6705, 1.633, 1.6785, 1.7139, 1.6084, 1.7552, 1.6707, 1.6656, 1.7214, 1.6521, 1.5842, 1.6507, 1.5901, 1.6652, 1.6481, 1.652, 1.6513, 1.7099, 1.6056, 1.6318, 1.6433, 1.6804, 1.7094, 1.6102, 1.6882, 1.6097, 1.681, 1.6695, 1.6675, 1.6867, 1.6244, 1.6454, 1.673, 1.6118, 1.5541, 1.6141, 1.676, 1.6911, 1.6938, 1.6326, 1.6532, 1.6121, 1.6769, 1.6344, 1.6984, 1.5735, 1.6623, 1.705, 1.6453, 1.7143, 1.6986, 1.5865, 1.5982, 1.728, 1.5591, 1.7532, 1.5962, 1.7055, 1.6921, 1.6922, 1.6053, 1.7552, 1.6699, 1.7459, 1.6286, 1.6566, 1.5823, 1.6934, 1.6943, 1.5701, 1.6078, 1.5665, 1.6028, 1.5917, 1.6209, 1.6109, 1.6538, 1.6385, 1.6154, 1.5731, 1.6057, 1.6035, 1.5512, 1.6227, 1.6121, 1.6539, 1.7007, 1.5562, 1.6502, 1.6103, 1.5647, 1.597, 1.5677, 1.6981, 1.5838, 1.5751, 1.5926, 1.5912, 1.6704, 1.5977, 1.6502, 1.567, 1.5954, 1.641, 1.6533, 1.6038, 1.6529, 1.6238, 1.5295, 1.5531, 1.6902, 1.6325, 1.6293, 1.6038, 1.5699, 1.627, 1.6483, 1.6093, 1.586, 1.5419, 1.6337, 1.6055, 1.6046, 1.6051, 1.5462, 1.5633, 1.62, 1.6113, 1.5892, 1.6875, 1.5279, 1.5557, 1.6127, 1.6305, 1.5596, 1.6051, 1.6364, 1.7188, 1.582, 1.6409, 1.5316, 1.6672, 1.5641, 1.5821, 1.6014, 1.5768, 1.5659, 1.632, 1.5723, 1.5722, 1.5975, 1.6193, 1.6655, 1.6429, 1.544, 1.4992, 1.6101, 1.5714, 1.5902, 1.5297, 1.5118, 1.5353, 1.6562, 1.6595, 1.6179, 1.6006, 1.5698, 1.6715, 1.5923, 1.6445, 1.6601, 1.5542, 1.634, 1.5656, 1.5754, 1.6163, 1.5978, 1.6005, 1.5709, 1.646, 1.5714, 1.6197, 1.5975, 1.6902, 1.647, 1.6043, 1.5424, 1.5446, 1.5932, 1.5411, 1.6969, 1.6064, 1.5994, 1.6088, 1.5438, 1.5453, 1.5924, 1.6654, 1.5608, 1.5673, 1.546, 1.5654, 1.6169, 1.5944, 1.5974, 1.5671, 1.6502, 1.5665, 1.6248, 1.5574, 1.5747, 1.5653, 1.493, 1.5918, 1.5406, 1.5347, 1.5198, 1.6345, 1.5361, 1.6036, 1.5375, 1.599, 1.6221, 1.511, 1.5371, 1.5351, 1.5257, 1.4959, 1.5428, 1.5872, 1.595, 1.6006, 1.5477, 1.5982, 1.5983, 1.582, 1.5575, 1.569, 1.5332, 1.6113, 1.5551, 1.5475, 1.6054, 1.5487, 1.5822, 1.5379, 1.5565, 1.5079, 1.5397, 1.5078, 1.7135, 1.5519, 1.5894, 1.6043, 1.6105, 1.5882, 1.5701, 1.5855, 1.5605, 1.5641, 1.5935, 1.5037, 1.5796, 1.5618, 1.5458, 1.5308, 1.625, 1.5955, 1.4931, 1.5995, 1.5929, 1.4691, 1.5121, 1.5524, 1.5014, 1.5889, 1.4796, 1.5825, 1.5475, 1.5716, 1.5245, 1.5815, 1.5856, 1.6253, 1.5881, 1.4642, 1.6479, 1.6026, 1.5046, 1.6126, 1.5165, 1.539, 1.5522, 1.5822, 1.4986, 1.5736, 1.5226, 1.5323, 1.5344, 1.53, 1.4437, 1.5163, 1.5807, 1.6468, 1.5671, 1.5118, 1.5445, 1.4981, 1.5588, 1.5552, 1.5366, 1.5008, 1.5965, 1.5481, 1.6481, 1.4861, 1.54, 1.5474, 1.4801, 1.4991, 1.5409, 1.5336, 1.5972, 1.5536, 1.6104, 1.5163, 1.538, 1.4657, 1.5305, 1.5611, 1.5574, 1.5587, 1.608, 1.4713, 1.54, 1.5573, 1.5265, 1.5735, 1.4722, 1.5492, 1.5483, 1.5955, 1.5923, 1.4739, 1.6201, 1.5002, 1.5167, 1.48, 1.5513, 1.5914, 1.5131, 1.5274, 1.4525, 1.5059, 1.6083, 1.5418, 1.6085, 1.5303, 1.5029, 1.471, 1.5989, 1.6556, 1.5423, 1.5106, 1.5273, 1.4841, 1.4924, 1.5074, 1.5388, 1.5431, 1.604, 1.5053, 1.5531, 1.5898, 1.5805, 1.5199, 1.4661, 1.5712, 1.515, 1.5169, 1.6008, 1.5566, 1.5327, 1.588, 1.5983, 1.5157, 1.5226, 1.5222, 1.5802, 1.4734, 1.5292, 1.512, 1.5451, 1.5409, 1.5467, 1.5589, 1.5285, 1.4869, 1.5026, 1.5261, 1.4941, 1.4267, 1.5411, 1.5363, 1.5064, 1.556, 1.5764, 1.5378, 1.5029, 1.5667, 1.569, 1.5068, 1.4732, 1.6414, 1.5372, 1.5823, 1.5324, 1.577, 1.5868, 1.5239], 'learning_rate': [1e-05, 2e-05, 3e-05, 4e-05, 5e-05, 6e-05, 7e-05, 8e-05, 9e-05, 0.0001, 0.00011000000000000002, 0.00012, 0.00013000000000000002, 0.00014, 0.00015000000000000001, 0.00016, 0.00017, 0.00018, 0.00019, 0.0002, 0.0001997058823529412, 0.00019941176470588236, 0.00019911764705882355, 0.00019882352941176472, 0.0001985294117647059, 0.00019823529411764707, 0.00019794117647058826, 0.00019764705882352942, 0.0001973529411764706, 0.00019705882352941177, 0.00019676470588235294, 0.00019647058823529413, 0.0001961764705882353, 0.00019588235294117648, 0.00019558823529411764, 0.00019529411764705883, 0.000195, 0.0001947058823529412, 0.00019441176470588235, 0.00019411764705882354, 0.0001938235294117647, 0.0001935294117647059, 0.00019323529411764708, 0.00019294117647058825, 0.00019264705882352944, 0.0001923529411764706, 0.0001920588235294118, 0.00019176470588235295, 0.00019147058823529414, 0.0001911764705882353, 0.0001908823529411765, 0.00019058823529411766, 0.00019029411764705882, 0.00019, 0.00018970588235294117, 0.00018941176470588236, 0.00018911764705882353, 0.00018882352941176472, 0.00018852941176470588, 0.00018823529411764707, 0.00018794117647058823, 0.00018764705882352942, 0.00018735294117647059, 0.00018705882352941178, 0.00018676470588235297, 0.00018647058823529413, 0.00018617647058823532, 0.00018588235294117648, 0.00018558823529411767, 0.00018529411764705883, 0.00018500000000000002, 0.0001847058823529412, 0.00018441176470588238, 0.00018411764705882354, 0.0001838235294117647, 0.0001835294117647059, 0.00018323529411764706, 0.00018294117647058825, 0.0001826470588235294, 0.0001823529411764706, 0.00018205882352941176, 0.00018176470588235295, 0.00018147058823529412, 0.0001811764705882353, 0.00018088235294117647, 0.00018058823529411766, 0.00018029411764705885, 0.00018, 0.0001797058823529412, 0.00017941176470588236, 0.00017911764705882355, 0.00017882352941176472, 0.0001785294117647059, 0.00017823529411764707, 0.00017794117647058823, 0.00017764705882352942, 0.00017735294117647059, 0.00017705882352941178, 0.00017676470588235294, 0.00017647058823529413, 0.0001761764705882353, 0.00017588235294117648, 0.00017558823529411765, 0.00017529411764705884, 0.000175, 0.0001747058823529412, 0.00017441176470588235, 0.00017411764705882354, 0.00017382352941176473, 0.0001735294117647059, 0.00017323529411764708, 0.00017294117647058825, 0.00017264705882352944, 0.0001723529411764706, 0.0001720588235294118, 0.00017176470588235293, 0.00017147058823529412, 0.0001711764705882353, 0.00017088235294117647, 0.00017058823529411766, 0.00017029411764705882, 0.00017, 0.00016970588235294118, 0.00016941176470588237, 0.00016911764705882353, 0.00016882352941176472, 0.00016852941176470588, 0.00016823529411764707, 0.00016794117647058823, 0.00016764705882352942, 0.00016735294117647061, 0.00016705882352941178, 0.00016676470588235297, 0.00016647058823529413, 0.00016617647058823532, 0.00016588235294117648, 0.00016558823529411765, 0.0001652941176470588, 0.000165, 0.0001647058823529412, 0.00016441176470588235, 0.00016411764705882354, 0.0001638235294117647, 0.0001635294117647059, 0.00016323529411764706, 0.00016294117647058825, 0.0001626470588235294, 0.0001623529411764706, 0.00016205882352941176, 0.00016176470588235295, 0.00016147058823529412, 0.0001611764705882353, 0.0001608823529411765, 0.00016058823529411766, 0.00016029411764705885, 0.00016, 0.0001597058823529412, 0.00015941176470588237, 0.00015911764705882353, 0.0001588235294117647, 0.00015852941176470588, 0.00015823529411764707, 0.00015794117647058824, 0.00015764705882352943, 0.0001573529411764706, 0.00015705882352941178, 0.00015676470588235294, 0.00015647058823529413, 0.0001561764705882353, 0.00015588235294117648, 0.00015558823529411765, 0.00015529411764705884, 0.000155, 0.0001547058823529412, 0.00015441176470588238, 0.00015411764705882354, 0.00015382352941176473, 0.0001535294117647059, 0.00015323529411764709, 0.00015294117647058822, 0.0001526470588235294, 0.00015235294117647057, 0.00015205882352941176, 0.00015176470588235295, 0.00015147058823529412, 0.0001511764705882353, 0.00015088235294117647, 0.00015058823529411766, 0.00015029411764705882, 0.00015000000000000001, 0.00014970588235294118, 0.00014941176470588237, 0.00014911764705882353, 0.00014882352941176472, 0.00014852941176470588, 0.00014823529411764707, 0.00014794117647058826, 0.00014764705882352943, 0.00014735294117647062, 0.00014705882352941178, 0.00014676470588235294, 0.0001464705882352941, 0.0001461764705882353, 0.00014588235294117646, 0.00014558823529411765, 0.00014529411764705884, 0.000145, 0.0001447058823529412, 0.00014441176470588235, 0.00014411764705882354, 0.0001438235294117647, 0.0001435294117647059, 0.00014323529411764706, 0.00014294117647058825, 0.0001426470588235294, 0.0001423529411764706, 0.00014205882352941177, 0.00014176470588235296, 0.00014147058823529415, 0.0001411764705882353, 0.0001408823529411765, 0.00014058823529411763, 0.00014029411764705882, 0.00014, 0.00013970588235294118, 0.00013941176470588234, 0.00013911764705882353, 0.00013882352941176472, 0.00013852941176470588, 0.00013823529411764707, 0.00013794117647058824, 0.00013764705882352943, 0.0001373529411764706, 0.00013705882352941178, 0.00013676470588235294, 0.00013647058823529413, 0.0001361764705882353, 0.00013588235294117649, 0.00013558823529411765, 0.00013529411764705884, 0.00013500000000000003, 0.0001347058823529412, 0.00013441176470588238, 0.00013411764705882352, 0.0001338235294117647, 0.00013352941176470587, 0.00013323529411764706, 0.00013294117647058822, 0.00013264705882352941, 0.0001323529411764706, 0.00013205882352941177, 0.00013176470588235296, 0.00013147058823529412, 0.0001311764705882353, 0.00013088235294117647, 0.00013058823529411766, 0.00013029411764705883, 0.00013000000000000002, 0.00012970588235294118, 0.00012941176470588237, 0.00012911764705882353, 0.00012882352941176472, 0.00012852941176470588, 0.00012823529411764707, 0.00012794117647058824, 0.0001276470588235294, 0.0001273529411764706, 0.00012705882352941175, 0.00012676470588235294, 0.0001264705882352941, 0.0001261764705882353, 0.0001258823529411765, 0.00012558823529411765, 0.00012529411764705884, 0.000125, 0.0001247058823529412, 0.00012441176470588236, 0.00012411764705882355, 0.0001238235294117647, 0.0001235294117647059, 0.00012323529411764706, 0.00012294117647058825, 0.00012264705882352941, 0.0001223529411764706, 0.00012205882352941178, 0.00012176470588235293, 0.00012147058823529412, 0.0001211764705882353, 0.00012088235294117647, 0.00012058823529411765, 0.00012029411764705883, 0.00012, 0.00011970588235294118, 0.00011941176470588236, 0.00011911764705882353, 0.00011882352941176471, 0.00011852941176470589, 0.00011823529411764706, 0.00011794117647058824, 0.00011764705882352942, 0.0001173529411764706, 0.00011705882352941178, 0.00011676470588235296, 0.00011647058823529413, 0.00011617647058823531, 0.00011588235294117649, 0.00011558823529411764, 0.00011529411764705881, 0.00011499999999999999, 0.00011470588235294118, 0.00011441176470588236, 0.00011411764705882353, 0.00011382352941176471, 0.00011352941176470589, 0.00011323529411764706, 0.00011294117647058824, 0.00011264705882352942, 0.00011235294117647059, 0.00011205882352941177, 0.00011176470588235294, 0.00011147058823529412, 0.0001111764705882353, 0.00011088235294117649, 0.00011058823529411766, 0.00011029411764705884, 0.00011000000000000002, 0.0001097058823529412, 0.00010941176470588237, 0.00010911764705882352, 0.0001088235294117647, 0.00010852941176470587, 0.00010823529411764706, 0.00010794117647058824, 0.00010764705882352942, 0.00010735294117647059, 0.00010705882352941177, 0.00010676470588235295, 0.00010647058823529412, 0.0001061764705882353, 0.00010588235294117647, 0.00010558823529411765, 0.00010529411764705883, 0.000105, 0.00010470588235294118, 0.00010441176470588237, 0.00010411764705882355, 0.00010382352941176472, 0.0001035294117647059, 0.00010323529411764708, 0.00010294117647058823, 0.0001026470588235294, 0.00010235294117647058, 0.00010205882352941176, 0.00010176470588235295, 0.00010147058823529412, 0.0001011764705882353, 0.00010088235294117648, 0.00010058823529411765, 0.00010029411764705883, 0.0001, 9.970588235294118e-05, 9.941176470588236e-05, 9.911764705882353e-05, 9.882352941176471e-05, 9.852941176470589e-05, 9.823529411764706e-05, 9.794117647058824e-05, 9.764705882352942e-05, 9.73529411764706e-05, 9.705882352941177e-05, 9.676470588235295e-05, 9.647058823529412e-05, 9.61764705882353e-05, 9.588235294117648e-05, 9.558823529411765e-05, 9.529411764705883e-05, 9.5e-05, 9.470588235294118e-05, 9.441176470588236e-05, 9.411764705882353e-05, 9.382352941176471e-05, 9.352941176470589e-05, 9.323529411764706e-05, 9.294117647058824e-05, 9.264705882352942e-05, 9.23529411764706e-05, 9.205882352941177e-05, 9.176470588235295e-05, 9.147058823529412e-05, 9.11764705882353e-05, 9.088235294117648e-05, 9.058823529411765e-05, 9.029411764705883e-05, 9e-05, 8.970588235294118e-05, 8.941176470588236e-05, 8.911764705882354e-05, 8.882352941176471e-05, 8.852941176470589e-05, 8.823529411764706e-05, 8.794117647058824e-05, 8.764705882352942e-05, 8.73529411764706e-05, 8.705882352941177e-05, 8.676470588235295e-05, 8.647058823529412e-05, 8.61764705882353e-05, 8.588235294117646e-05, 8.558823529411765e-05, 8.529411764705883e-05, 8.5e-05, 8.470588235294118e-05, 8.441176470588236e-05, 8.411764705882354e-05, 8.382352941176471e-05, 8.352941176470589e-05, 8.323529411764707e-05, 8.294117647058824e-05, 8.26470588235294e-05, 8.23529411764706e-05, 8.205882352941177e-05, 8.176470588235295e-05, 8.147058823529412e-05, 8.11764705882353e-05, 8.088235294117648e-05, 8.058823529411765e-05, 8.029411764705883e-05, 8e-05, 7.970588235294118e-05, 7.941176470588235e-05, 7.911764705882354e-05, 7.882352941176471e-05, 7.852941176470589e-05, 7.823529411764707e-05, 7.794117647058824e-05, 7.764705882352942e-05, 7.73529411764706e-05, 7.705882352941177e-05, 7.676470588235295e-05, 7.647058823529411e-05, 7.617647058823529e-05, 7.588235294117648e-05, 7.558823529411765e-05, 7.529411764705883e-05, 7.500000000000001e-05, 7.470588235294118e-05, 7.441176470588236e-05, 7.411764705882354e-05, 7.382352941176471e-05, 7.352941176470589e-05, 7.323529411764705e-05, 7.294117647058823e-05, 7.264705882352942e-05, 7.23529411764706e-05, 7.205882352941177e-05, 7.176470588235295e-05, 7.147058823529412e-05, 7.11764705882353e-05, 7.088235294117648e-05, 7.058823529411765e-05, 7.029411764705882e-05, 7e-05, 6.970588235294117e-05, 6.941176470588236e-05, 6.911764705882354e-05, 6.882352941176471e-05, 6.852941176470589e-05, 6.823529411764707e-05, 6.794117647058824e-05, 6.764705882352942e-05, 6.73529411764706e-05, 6.705882352941176e-05, 6.676470588235294e-05, 6.647058823529411e-05, 6.61764705882353e-05, 6.588235294117648e-05, 6.558823529411765e-05, 6.529411764705883e-05, 6.500000000000001e-05, 6.470588235294118e-05, 6.441176470588236e-05, 6.411764705882354e-05, 6.38235294117647e-05, 6.352941176470588e-05, 6.323529411764705e-05, 6.294117647058824e-05, 6.264705882352942e-05, 6.23529411764706e-05, 6.205882352941177e-05, 6.176470588235295e-05, 6.147058823529413e-05, 6.11764705882353e-05, 6.0882352941176465e-05, 6.058823529411765e-05, 6.0294117647058825e-05, 6e-05, 5.970588235294118e-05, 5.9411764705882355e-05, 5.911764705882353e-05, 5.882352941176471e-05, 5.852941176470589e-05, 5.823529411764707e-05, 5.7941176470588244e-05, 5.764705882352941e-05, 5.735294117647059e-05, 5.7058823529411766e-05, 5.676470588235294e-05, 5.647058823529412e-05, 5.6176470588235296e-05, 5.588235294117647e-05, 5.558823529411765e-05, 5.529411764705883e-05, 5.500000000000001e-05, 5.4705882352941185e-05, 5.441176470588235e-05, 5.411764705882353e-05, 5.382352941176471e-05, 5.3529411764705884e-05, 5.323529411764706e-05, 5.294117647058824e-05, 5.2647058823529414e-05, 5.235294117647059e-05, 5.2058823529411774e-05, 5.176470588235295e-05, 5.147058823529411e-05, 5.117647058823529e-05, 5.088235294117647e-05, 5.058823529411765e-05, 5.0294117647058826e-05, 5e-05, 4.970588235294118e-05, 4.9411764705882355e-05, 4.911764705882353e-05, 4.882352941176471e-05, 4.8529411764705885e-05, 4.823529411764706e-05, 4.794117647058824e-05, 4.7647058823529414e-05, 4.735294117647059e-05, 4.705882352941177e-05, 4.6764705882352944e-05, 4.647058823529412e-05, 4.61764705882353e-05, 4.588235294117647e-05, 4.558823529411765e-05, 4.5294117647058826e-05, 4.5e-05, 4.470588235294118e-05, 4.4411764705882356e-05, 4.411764705882353e-05, 4.382352941176471e-05, 4.3529411764705885e-05, 4.323529411764706e-05, 4.294117647058823e-05, 4.2647058823529415e-05, 4.235294117647059e-05, 4.205882352941177e-05, 4.1764705882352944e-05, 4.147058823529412e-05, 4.11764705882353e-05, 4.0882352941176474e-05, 4.058823529411765e-05, 4.029411764705883e-05, 4e-05, 3.970588235294117e-05, 3.9411764705882356e-05, 3.911764705882353e-05, 3.882352941176471e-05, 3.8529411764705886e-05, 3.8235294117647055e-05, 3.794117647058824e-05, 3.7647058823529415e-05, 3.735294117647059e-05, 3.705882352941177e-05, 3.6764705882352945e-05, 3.6470588235294114e-05, 3.61764705882353e-05, 3.5882352941176474e-05, 3.558823529411765e-05, 3.529411764705883e-05, 3.5e-05, 3.470588235294118e-05, 3.441176470588236e-05, 3.411764705882353e-05, 3.382352941176471e-05, 3.352941176470588e-05, 3.3235294117647056e-05, 3.294117647058824e-05, 3.2647058823529416e-05, 3.235294117647059e-05, 3.205882352941177e-05, 3.176470588235294e-05, 3.147058823529412e-05, 3.11764705882353e-05, 3.0882352941176475e-05, 3.058823529411765e-05, 3.0294117647058824e-05, 3e-05, 2.9705882352941177e-05, 2.9411764705882354e-05, 2.9117647058823534e-05, 2.8823529411764703e-05, 2.8529411764705883e-05, 2.823529411764706e-05, 2.7941176470588236e-05, 2.7647058823529416e-05, 2.7352941176470593e-05, 2.7058823529411766e-05, 2.6764705882352942e-05, 2.647058823529412e-05, 2.6176470588235295e-05, 2.5882352941176475e-05, 2.5588235294117645e-05, 2.5294117647058825e-05, 2.5e-05, 2.4705882352941178e-05, 2.4411764705882354e-05, 2.411764705882353e-05, 2.3823529411764707e-05, 2.3529411764705884e-05, 2.323529411764706e-05, 2.2941176470588237e-05, 2.2647058823529413e-05, 2.235294117647059e-05, 2.2058823529411766e-05, 2.1764705882352943e-05, 2.1470588235294116e-05, 2.1176470588235296e-05, 2.0882352941176472e-05, 2.058823529411765e-05, 2.0294117647058825e-05, 2e-05, 1.9705882352941178e-05, 1.9411764705882355e-05, 1.9117647058823528e-05, 1.8823529411764708e-05, 1.8529411764705884e-05, 1.8235294117647057e-05, 1.7941176470588237e-05, 1.7647058823529414e-05, 1.735294117647059e-05, 1.7058823529411767e-05, 1.676470588235294e-05, 1.647058823529412e-05, 1.6176470588235296e-05, 1.588235294117647e-05, 1.558823529411765e-05, 1.5294117647058826e-05, 1.5e-05, 1.4705882352941177e-05, 1.4411764705882352e-05, 1.411764705882353e-05, 1.3823529411764708e-05, 1.3529411764705883e-05, 1.323529411764706e-05, 1.2941176470588238e-05, 1.2647058823529412e-05, 1.2352941176470589e-05, 1.2058823529411765e-05, 1.1764705882352942e-05, 1.1470588235294118e-05, 1.1176470588235295e-05, 1.0882352941176471e-05, 1.0588235294117648e-05, 1.0294117647058824e-05, 1e-05, 9.705882352941177e-06, 9.411764705882354e-06, 9.117647058823529e-06, 8.823529411764707e-06, 8.529411764705883e-06, 8.23529411764706e-06, 7.941176470588235e-06, 7.647058823529413e-06, 7.3529411764705884e-06, 7.058823529411765e-06, 6.7647058823529414e-06, 6.470588235294119e-06, 6.1764705882352944e-06, 5.882352941176471e-06, 5.588235294117647e-06, 5.294117647058824e-06, 5e-06, 4.705882352941177e-06, 4.411764705882353e-06, 4.11764705882353e-06, 3.823529411764706e-06, 3.5294117647058825e-06, 3.2352941176470594e-06, 2.9411764705882355e-06, 2.647058823529412e-06, 2.3529411764705885e-06, 2.058823529411765e-06, 1.7647058823529412e-06, 1.4705882352941177e-06, 1.1764705882352942e-06, 8.823529411764706e-07, 5.882352941176471e-07, 2.9411764705882356e-07, 0.0], 'training_time': 87095.12248468399}
12
+ 2025-02-14 11:34:25,367 - Evaluation results: {'meteor_scores': {'meteor': 0.10115606936416185}, 'rouge_scores': {'rouge1': 0.0, 'rouge2': 0.0, 'rougeL': 0.0, 'rougeLsum': 0.0}, 'bleu_scores': {'bleu': 0.0, 'precisions': [0.08235294117647059, 0.0, 0.0, 0.0], 'brevity_penalty': 1.0, 'length_ratio': 2.9310344827586206, 'translation_length': 85, 'reference_length': 29}, 'perplexity': 756517900.0}
session_logs/lora_finetuning_report.pdf ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4d503fc35e2d54c52449db0639bd7178a13ae9ffbdbd1a9effa663d5e7ac2d67
3
+ size 107215