|
20 | 20 | MODELS = { |
21 | 21 | "TinyLlama-1.1B-Chat-v1.0": { |
22 | 22 | "name": "TinyLlama/TinyLlama-1.1B-Chat-v1.0", |
23 | | - "convert_args": [] |
| 23 | + "convert_args": ['--weight-format', 'fp16'] |
24 | 24 | }, |
25 | 25 | "SmolLM-135M": { |
26 | 26 | "name": "HuggingFaceTB/SmolLM-135M", |
27 | | - "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
| 27 | + "convert_args": ['--trust-remote-code'] |
28 | 28 | }, |
29 | 29 | "SmolLM2-135M": { |
30 | 30 | "name": "HuggingFaceTB/SmolLM2-135M", |
|
36 | 36 | }, |
37 | 37 | "WhisperTiny": { |
38 | 38 | "name": "openai/whisper-tiny", |
39 | | - "convert_args": ['--trust-remote-code'] |
| 39 | + "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
40 | 40 | }, |
41 | 41 | "Qwen2.5-0.5B-Instruct": { |
42 | 42 | "name": "Qwen/Qwen2.5-0.5B-Instruct", |
43 | | - "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
| 43 | + "convert_args": ['--trust-remote-code'] |
44 | 44 | }, |
45 | 45 | "Qwen2-0.5B-Instruct": { |
46 | 46 | "name": "Qwen/Qwen2-0.5B-Instruct", |
47 | | - "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
| 47 | + "convert_args": ['--trust-remote-code'] |
48 | 48 | }, |
49 | 49 | "phi-1_5": { |
50 | 50 | "name": "microsoft/phi-1_5", |
51 | 51 | "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
52 | 52 | }, |
53 | 53 | "TinyStories-1M": { |
54 | 54 | "name": "roneneldan/TinyStories-1M", |
55 | | - "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
| 55 | + "convert_args": ['--trust-remote-code'] |
56 | 56 | }, |
57 | 57 | "dreamlike-anime-1.0": { |
58 | 58 | "name": "dreamlike-art/dreamlike-anime-1.0", |
|
64 | 64 | }, |
65 | 65 | "llava-1.5-7b-hf": { |
66 | 66 | "name": "llava-hf/llava-1.5-7b-hf", |
67 | | - "convert_args": ['--trust-remote-code'] |
| 67 | + "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
68 | 68 | }, |
69 | 69 | "llava-v1.6-mistral-7b-hf": { |
70 | 70 | "name": "llava-hf/llava-v1.6-mistral-7b-hf", |
71 | | - "convert_args": ['--trust-remote-code'] |
| 71 | + "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
72 | 72 | }, |
73 | 73 | "dreamlike-anime-1.0": { |
74 | 74 | "name": "dreamlike-art/dreamlike-anime-1.0", |
|
84 | 84 | }, |
85 | 85 | "InternVL2-1B": { |
86 | 86 | "name": "OpenGVLab/InternVL2-1B", |
87 | | - "convert_args": ['--trust-remote-code'] |
| 87 | + "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
88 | 88 | }, |
89 | 89 | "Qwen2-VL-2B-Instruct": { |
90 | 90 | "name": "Qwen/Qwen2-VL-2B-Instruct", |
91 | | - "convert_args": ['--trust-remote-code'] |
| 91 | + "convert_args": ['--trust-remote-code', '--weight-format', 'fp16'] |
92 | 92 | }, |
93 | 93 | "tiny-dummy-qwen2": { |
94 | 94 | "name": "fxmarty/tiny-dummy-qwen2", |
|
0 commit comments