EshAhm committed on
Commit
fffce84
·
verified ·
1 Parent(s): 0a2c5fa

EshAhm/LoRa-Python2

Browse files
README.md CHANGED
@@ -5,6 +5,7 @@ base_model: microsoft/phi-2
5
  tags:
6
  - base_model:adapter:microsoft/phi-2
7
  - lora
 
8
  pipeline_tag: text-generation
9
  model-index:
10
  - name: phi-2-LoRa-Python
@@ -18,7 +19,7 @@ should probably proofread and complete it, then remove this comment. -->
18
 
19
  This model is a fine-tuned version of [microsoft/phi-2](https://huggingface.co/microsoft/phi-2) on the None dataset.
20
  It achieves the following results on the evaluation set:
21
- - Loss: 4.4689
22
 
23
  ## Model description
24
 
@@ -52,28 +53,28 @@ The following hyperparameters were used during training:
52
 
53
  | Training Loss | Epoch | Step | Validation Loss |
54
  |:-------------:|:------:|:----:|:---------------:|
55
- | 4.5284 | 0.1333 | 100 | 4.4728 |
56
- | 4.4172 | 0.2667 | 200 | 4.4776 |
57
- | 4.2789 | 0.4 | 300 | 4.4774 |
58
- | 4.4041 | 0.5333 | 400 | 4.4751 |
59
- | 4.3978 | 0.6667 | 500 | 4.4777 |
60
- | 4.061 | 0.8 | 600 | 4.4762 |
61
- | 4.1693 | 0.9333 | 700 | 4.4764 |
62
- | 4.5403 | 1.0667 | 800 | 4.4727 |
63
- | 4.5481 | 1.2 | 900 | 4.4725 |
64
- | 4.0223 | 1.3333 | 1000 | 4.4757 |
65
- | 4.5108 | 1.4667 | 1100 | 4.4747 |
66
- | 4.0763 | 1.6 | 1200 | 4.4719 |
67
- | 4.1443 | 1.7333 | 1300 | 4.4723 |
68
- | 4.4699 | 1.8667 | 1400 | 4.4738 |
69
- | 4.7084 | 2.0 | 1500 | 4.4713 |
70
- | 3.9716 | 2.1333 | 1600 | 4.4710 |
71
- | 4.5229 | 2.2667 | 1700 | 4.4711 |
72
- | 3.8189 | 2.4 | 1800 | 4.4702 |
73
- | 4.6479 | 2.5333 | 1900 | 4.4695 |
74
- | 4.4305 | 2.6667 | 2000 | 4.4690 |
75
- | 4.2955 | 2.8 | 2100 | 4.4690 |
76
- | 4.2989 | 2.9333 | 2200 | 4.4689 |
77
 
78
 
79
  ### Framework versions
 
5
  tags:
6
  - base_model:adapter:microsoft/phi-2
7
  - lora
8
+ - transformers
9
  pipeline_tag: text-generation
10
  model-index:
11
  - name: phi-2-LoRa-Python
 
19
 
20
  This model is a fine-tuned version of [microsoft/phi-2](https://huggingface.co/microsoft/phi-2) on the None dataset.
21
  It achieves the following results on the evaluation set:
22
+ - Loss: 4.4864
23
 
24
  ## Model description
25
 
 
53
 
54
  | Training Loss | Epoch | Step | Validation Loss |
55
  |:-------------:|:------:|:----:|:---------------:|
56
+ | 4.5433 | 0.1333 | 100 | 4.4747 |
57
+ | 4.4162 | 0.2667 | 200 | 4.4774 |
58
+ | 4.2759 | 0.4 | 300 | 4.4755 |
59
+ | 4.4021 | 0.5333 | 400 | 4.4764 |
60
+ | 4.3925 | 0.6667 | 500 | 4.4775 |
61
+ | 4.6016 | 0.8 | 600 | 4.5976 |
62
+ | 4.2527 | 0.9333 | 700 | 4.5484 |
63
+ | 4.5823 | 1.0667 | 800 | 4.5037 |
64
+ | 4.5826 | 1.2 | 900 | 4.5032 |
65
+ | 4.0654 | 1.3333 | 1000 | 4.5073 |
66
+ | 4.5386 | 1.4667 | 1100 | 4.4961 |
67
+ | 4.1046 | 1.6 | 1200 | 4.4957 |
68
+ | 4.1705 | 1.7333 | 1300 | 4.4943 |
69
+ | 4.4922 | 1.8667 | 1400 | 4.4918 |
70
+ | 4.7333 | 2.0 | 1500 | 4.4901 |
71
+ | 3.997 | 2.1333 | 1600 | 4.4889 |
72
+ | 4.5407 | 2.2667 | 1700 | 4.4880 |
73
+ | 3.8457 | 2.4 | 1800 | 4.4877 |
74
+ | 4.6653 | 2.5333 | 1900 | 4.4873 |
75
+ | 4.4524 | 2.6667 | 2000 | 4.4865 |
76
+ | 4.3138 | 2.8 | 2100 | 4.4870 |
77
+ | 4.3203 | 2.9333 | 2200 | 4.4865 |
78
 
79
 
80
  ### Framework versions
adapter_config.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
- "base_model_name_or_path": null,
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
@@ -25,10 +25,10 @@
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
28
- "v_proj",
29
  "k_proj",
30
  "dense",
31
- "q_proj"
 
32
  ],
33
  "target_parameters": null,
34
  "task_type": "CAUSAL_LM",
 
1
  {
2
  "alpha_pattern": {},
3
  "auto_mapping": null,
4
+ "base_model_name_or_path": "microsoft/phi-2",
5
  "bias": "none",
6
  "corda_config": null,
7
  "eva_config": null,
 
25
  "rank_pattern": {},
26
  "revision": null,
27
  "target_modules": [
 
28
  "k_proj",
29
  "dense",
30
+ "q_proj",
31
+ "v_proj"
32
  ],
33
  "target_parameters": null,
34
  "task_type": "CAUSAL_LM",
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2746cc7bdcac3d6b58df64efac21ef3160762157b0ea2c2af8976c80df4b6ef8
3
- size 83924816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d0cb54926955f8465684c4f5a5d7fa4f8f6a6a2ecb1b624fdca9677961b29f12
3
+ size 83920464
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:77a7985546e2331302690dc943aa4032cf03d6e8a512705d41ba11c33fac01ec
3
  size 5777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:92c05c04197940bf30d25a6ee8a5208e08514d553240522c61099e94cceb9a3b
3
  size 5777