[WIP] Upload folder using huggingface_hub (multi-commit 4cd94e22b636df419eb04f0cf58e5b00188bf26052dae98b0b94b80572bafc24)

#1
Files changed (1) hide show
  1. README.md +1 -109
README.md CHANGED
@@ -14,101 +14,6 @@ datasets:
14
  - iamtarun/python_code_instructions_18k_alpaca
15
  - ajibawa-2023/Python-Code-23k-ShareGPT
16
  pipeline_tag: text-generation
17
- model-index:
18
- - name: phi-3-mini-4k-python
19
- results:
20
- - task:
21
- type: text-generation
22
- name: Text Generation
23
- dataset:
24
- name: IFEval (0-Shot)
25
- type: HuggingFaceH4/ifeval
26
- args:
27
- num_few_shot: 0
28
- metrics:
29
- - type: inst_level_strict_acc and prompt_level_strict_acc
30
- value: 24.09
31
- name: strict accuracy
32
- source:
33
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=theprint/phi-3-mini-4k-python
34
- name: Open LLM Leaderboard
35
- - task:
36
- type: text-generation
37
- name: Text Generation
38
- dataset:
39
- name: BBH (3-Shot)
40
- type: BBH
41
- args:
42
- num_few_shot: 3
43
- metrics:
44
- - type: acc_norm
45
- value: 28.45
46
- name: normalized accuracy
47
- source:
48
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=theprint/phi-3-mini-4k-python
49
- name: Open LLM Leaderboard
50
- - task:
51
- type: text-generation
52
- name: Text Generation
53
- dataset:
54
- name: MATH Lvl 5 (4-Shot)
55
- type: hendrycks/competition_math
56
- args:
57
- num_few_shot: 4
58
- metrics:
59
- - type: exact_match
60
- value: 8.46
61
- name: exact match
62
- source:
63
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=theprint/phi-3-mini-4k-python
64
- name: Open LLM Leaderboard
65
- - task:
66
- type: text-generation
67
- name: Text Generation
68
- dataset:
69
- name: GPQA (0-shot)
70
- type: Idavidrein/gpqa
71
- args:
72
- num_few_shot: 0
73
- metrics:
74
- - type: acc_norm
75
- value: 5.48
76
- name: acc_norm
77
- source:
78
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=theprint/phi-3-mini-4k-python
79
- name: Open LLM Leaderboard
80
- - task:
81
- type: text-generation
82
- name: Text Generation
83
- dataset:
84
- name: MuSR (0-shot)
85
- type: TAUR-Lab/MuSR
86
- args:
87
- num_few_shot: 0
88
- metrics:
89
- - type: acc_norm
90
- value: 9.22
91
- name: acc_norm
92
- source:
93
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=theprint/phi-3-mini-4k-python
94
- name: Open LLM Leaderboard
95
- - task:
96
- type: text-generation
97
- name: Text Generation
98
- dataset:
99
- name: MMLU-PRO (5-shot)
100
- type: TIGER-Lab/MMLU-Pro
101
- config: main
102
- split: test
103
- args:
104
- num_few_shot: 5
105
- metrics:
106
- - type: acc
107
- value: 28.63
108
- name: accuracy
109
- source:
110
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=theprint/phi-3-mini-4k-python
111
- name: Open LLM Leaderboard
112
  ---
113
 
114
  # Uploaded model
@@ -119,17 +24,4 @@ model-index:
119
 
120
  This mistral model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Hugging Face's TRL library.
121
 
122
- [<img src="https://raw.githubusercontent.com/unslothai/unsloth/main/images/unsloth%20made%20with%20love.png" width="200"/>](https://github.com/unslothai/unsloth)
123
- # [Open LLM Leaderboard Evaluation Results](https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard)
124
- Detailed results can be found [here](https://huggingface.co/datasets/open-llm-leaderboard/details_theprint__phi-3-mini-4k-python)
125
-
126
- | Metric |Value|
127
- |-------------------|----:|
128
- |Avg. |17.39|
129
- |IFEval (0-Shot) |24.09|
130
- |BBH (3-Shot) |28.45|
131
- |MATH Lvl 5 (4-Shot)| 8.46|
132
- |GPQA (0-shot) | 5.48|
133
- |MuSR (0-shot) | 9.22|
134
- |MMLU-PRO (5-shot) |28.63|
135
-
 
14
  - iamtarun/python_code_instructions_18k_alpaca
15
  - ajibawa-2023/Python-Code-23k-ShareGPT
16
  pipeline_tag: text-generation
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
17
  ---
18
 
19
  # Uploaded model
 
24
 
25
  This mistral model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Hugging Face's TRL library.
26
 
27
+ [<img src="https://raw.githubusercontent.com/unslothai/unsloth/main/images/unsloth%20made%20with%20love.png" width="200"/>](https://github.com/unslothai/unsloth)