Skip to content

Commit abbab79

Browse files
authoredApr 29, 2024··
feat: add phi-3 (#20)
1 parent 6bb00b0 commit abbab79

File tree

2 files changed

+183
-1
lines changed

2 files changed

+183
-1
lines changed
 

‎all.json

+1-1
Large diffs are not rendered by default.

‎models/microsoft/phi-3.json

+182
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,182 @@
1+
{
2+
"_version": "1.0.0",
3+
"id": "microsoft/Phi-3-mini-4k-instruct-gguf",
4+
"name": "Phi-3-mini-4k-instruct-gguf",
5+
"creator": "microsoft",
6+
"title": "Phi-3 mini 4k instruct",
7+
"version": "3.0.0",
8+
"description": "Phi-3 is a Transformer with 3.8 billion parameters. It was trained using the same data sources as Phi-1.5, augmented with a new data source that consists of various NLP synthetic texts and filtered websites (for safety and educational value). When assessed against benchmarks testing common sense, language understanding, and logical reasoning, Phi-3 showcased a nearly state-of-the-art performance among models with less than 13 billion parameters.",
9+
"author": "Microsoft",
10+
"publisher": {
11+
"name": "Microsoft",
12+
"url": "https://huggingface.co/microsoft"
13+
},
14+
"license": "MIT",
15+
"tags": "transformer safetensors phi-msft text-generation nlp code custom_code en license:mit autotrain_compatible has_space region:us",
16+
"task_type": [
17+
"text-generation"
18+
],
19+
"languages": [
20+
"en"
21+
],
22+
"model_size": "3.8b",
23+
"context_size": 4096,
24+
"tensor_type": "float16",
25+
"base_model": "none",
26+
"model_type": "phi-msft",
27+
"library": "PyTorch",
28+
"private": false,
29+
"featured": true,
30+
"use_cases": "The model is intended for commercial and research use in English. The model provides uses for applications which require memory/compute constrained environments, latency bound scenarios, strong reasoning (especially math and logic), and long context. Our model is designed to accelerate research on language and multimodal models, for use as a building block for generative AI powered features.",
31+
"out_of_scope_use_cases": "Limited Scope for code: Majority of Phi-3 training data is based in Python and use common packages such as 'typing, math, random, collections, datetime, itertools'. If the model generates Python scripts that utilize other packages or scripts in other languages, we strongly recommend users manually verify all API uses.",
32+
"bias_risks_limitations": "Like other language models, the Phi series models can potentially behave in ways that are unfair, unreliable, or offensive.",
33+
"repository": "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct-gguf",
34+
"download": "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct-gguf",
35+
"include": [
36+
{
37+
"name": "Phi-3-mini-4k-instruct-fp16.gguf",
38+
"recommendations": "Largest, not quantized, extremely low quality loss - not recommended for most purposes",
39+
"bits": 16,
40+
"size": 7.64,
41+
"sha": "8fb08713c270f80793074cf30964e61cc2bccd6b4e1e5fd73a895a9bbecb7ac0",
42+
"file_size": 7643301888,
43+
"download": "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct-gguf/resolve/main/Phi-3-mini-4k-instruct-fp16.gguf"
44+
},
45+
{
46+
"name": "Phi-3-mini-4k-instruct-q4.gguf",
47+
"recommendations": "medium, balanced quality - recommended",
48+
"quantization": "Q4_K_M",
49+
"bits": 4,
50+
"size": 2.32,
51+
"recommended": true,
52+
"sha": "1cd9a9df07350196623f93bf4829cf228959e07ad32f787b8fdd7f5956f5b9de",
53+
"file_size": 2318919200,
54+
"download": "https://huggingface.co/microsoft/Phi-3-mini-4k-instruct-gguf/resolve/main/Phi-3-mini-4k-instruct-q4.gguf"
55+
},
56+
{
57+
"name": "phi-3-mini-4k-instruct.Q2_K.gguf",
58+
"recommendations": "smallest, significant quality loss - not recommended for most purposes",
59+
"quantization": "Q2_K",
60+
"bits": 2,
61+
"size": 1.45,
62+
"sha": "08928f542fe145d26ea44249f123487271c9d372cba0a94d23bef5a546b7a86f",
63+
"file_size": 1446879616,
64+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q2_K.gguf"
65+
},
66+
{
67+
"name": "phi-3-mini-4k-instruct.Q3_K_S.gguf",
68+
"recommendations": "very small, high quality loss",
69+
"quantization": "Q3_K_S",
70+
"bits": 3,
71+
"size": 1.68,
72+
"sha": "145598bc4cff45095e500a228ceb4736c85a739a0a1bd495445bf214b6e9070a",
73+
"file_size": 1681803136,
74+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q3_K_S.gguf"
75+
},
76+
{
77+
"name": "phi-3-mini-4k-instruct.Q3_K_M.gguf",
78+
"recommendations": "very small, high quality loss",
79+
"quantization": "Q3_K_M",
80+
"bits": 3,
81+
"size": 1.88,
82+
"sha": "77952309d6929d52ec11d34bfc5f7ab22f7317087892c334626527cdf0dcd4ed",
83+
"file_size": 1877624704,
84+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q3_K_M.gguf"
85+
},
86+
{
87+
"name": "phi-3-mini-4k-instruct.Q3_K_L.gguf",
88+
"recommendations": "small, substantial quality loss",
89+
"quantization": "Q3_K_L",
90+
"bits": 3,
91+
"size": 2.05,
92+
"sha": "0496776c4cb6ce732552e039b7f64e1702bf0b942d963fbdf36652fb985a4933",
93+
"file_size": 2045134720,
94+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q3_K_L.gguf"
95+
},
96+
{
97+
"name": "phi-3-mini-4k-instruct.Q4_0.gguf",
98+
"recommendations": "legacy; small, very high quality loss - prefer using Q3_K_M",
99+
"quantization": "Q4_0",
100+
"bits": 4,
101+
"size": 2.18,
102+
"deprecated": true,
103+
"sha": "eaf1acc4ea062662291851b3dfaf37308183fe718c66ef1bca6b1313f6174648",
104+
"file_size": 2176181632,
105+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q4_0.gguf"
106+
},
107+
{
108+
"name": "phi-3-mini-4k-instruct.Q4_K_S.gguf",
109+
"recommendations": "small, greater quality loss",
110+
"quantization": "Q4_K_S",
111+
"bits": 4,
112+
"size": 2.19,
113+
"sha": "8fb84fb36191169e46ff8a73c10f168b7a1f756cde5c81d985dd524ec7fa7432",
114+
"file_size": 2193483136,
115+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q4_K_S.gguf"
116+
},
117+
{
118+
"name": "phi-3-mini-4k-instruct.Q4_K_M.gguf",
119+
"recommendations": "medium, balanced quality - recommended",
120+
"quantization": "Q4_K_M",
121+
"bits": 4,
122+
"size": 2.32,
123+
"recommended": true,
124+
"sha": "4fed7364ee3e0c7cb4fe0880148bfdfcd1b630981efa0802a6b62ee52e7da97e",
125+
"file_size": 2318919040,
126+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q4_K_M.gguf"
127+
},
128+
{
129+
"name": "phi-3-mini-4k-instruct.Q5_0.gguf",
130+
"recommendations": "legacy; medium, balanced quality - prefer using Q4_K_M",
131+
"quantization": "Q5_0",
132+
"bits": 5,
133+
"size": 2.64,
134+
"deprecated": true,
135+
"sha": "a42350d48d8b0d8bde4ed764c361609b1e3d51a10263bb407b177ae1ab694377",
136+
"file_size": 2641479040,
137+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q5_0.gguf"
138+
},
139+
{
140+
"name": "phi-3-mini-4k-instruct.Q5_K_S.gguf",
141+
"recommendations": "large, low quality loss - recommended",
142+
"quantization": "Q5_K_S",
143+
"bits": 5,
144+
"size": 2.64,
145+
"recommended": true,
146+
"sha": "276449866217a16a91b8264cd97e20e6178de28995afe78a99d9f8fc8821c32f",
147+
"file_size": 2641479040,
148+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q5_K_S.gguf"
149+
},
150+
{
151+
"name": "phi-3-mini-4k-instruct.Q5_K_M.gguf",
152+
"recommendations": "large, very low quality loss - recommended",
153+
"quantization": "Q5_K_M",
154+
"bits": 5,
155+
"size": 2.72,
156+
"recommended": true,
157+
"sha": "231e50055db793cfefb394b18eceb92166f749ca1d55ad472153eca29640cf68",
158+
"file_size": 2715010432,
159+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q5_K_M.gguf"
160+
},
161+
{
162+
"name": "phi-3-mini-4k-instruct.Q6_K.gguf",
163+
"recommendations": "very large, extremely low quality loss",
164+
"quantization": "Q6_K",
165+
"bits": 6,
166+
"size": 3.14,
167+
"sha": "2f757f37bf8178e3d54410eedfa05e91f28fa9aa051e2508a10e70acc67b0725",
168+
"file_size": 3135857536,
169+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q6_K.gguf"
170+
},
171+
{
172+
"name": "phi-3-mini-4k-instruct.Q8_0.gguf",
173+
"recommendations": "very large, extremely low quality loss",
174+
"quantization": "Q8_0",
175+
"bits": 8,
176+
"size": 4.06,
177+
"sha": "d8e99a77bec94f65e623b5c126f8210a9b98924310351e0eed245b81a5d2a93f",
178+
"file_size": 4061226880,
179+
"download": "https://huggingface.co/martineden/Phi-3-mini-4k-instruct-GGUF/resolve/main/phi-3-mini-4k-instruct.Q8_0.gguf"
180+
}
181+
]
182+
}

0 commit comments

Comments
 (0)
Please sign in to comment.