11691169 "act_param" : None ,
11701170 "open-data" : "None" ,
11711171 },
1172+ "Qwen/Qwen2.5-Coder-1.5B-Instruct" : {
1173+ "name" : "Qwen2.5-Coder-1.5B-Instruct" ,
1174+ "link" : "https://huggingface.co/Qwen/Qwen2.5-Coder-1.5B-Instruct" ,
1175+ "prompted" : True ,
1176+ "moe" : False ,
1177+ "size" : 1.5 ,
1178+ "act_param" : 1.5 ,
1179+ "open-data" : "None" ,
1180+ },
1181+ "Qwen/Qwen2.5-Coder-7B-Instruct" : {
1182+ "name" : "Qwen2.5-Coder-7B-Instruct" ,
1183+ "link" : "https://huggingface.co/Qwen/Qwen2.5-Coder-7B-Instruct" ,
1184+ "prompted" : True ,
1185+ "moe" : False ,
1186+ "size" : 7 ,
1187+ "act_param" : 7 ,
1188+ "open-data" : "None" ,
1189+ },
1190+ "gemini-1.5-pro-002" : {
1191+ "name" : "Gemini-1.5-Pro-002" ,
1192+ "link" : "https://deepmind.google/technologies/gemini/pro" ,
1193+ "prompted" : True ,
1194+ "moe" : False ,
1195+ "size" : None ,
1196+ "act_param" : None ,
1197+ "open-data" : "None" ,
1198+ },
1199+ "mistralai/Mistral-Small-Instruct-2409" : {
1200+ "name" : "Mistral-Small-Instruct-2409" ,
1201+ "link" : "https://huggingface.co/mistralai/Mistral-Small-Instruct-2409" ,
1202+ "prompted" : True ,
1203+ "moe" : False ,
1204+ "size" : 22.2 ,
1205+ "act_param" : 22.2 ,
1206+ "open-data" : "None" ,
1207+ },
1208+ "Qwen/Qwen2.5-0.5B-Instruct" : {
1209+ "name" : "Qwen2.5-0.5B-Instruct" ,
1210+ "link" : "https://huggingface.co/Qwen/Qwen2.5-0.5B-Instruct" ,
1211+ "prompted" : True ,
1212+ "moe" : False ,
1213+ "size" : 0.5 ,
1214+ "act_param" : 0.5 ,
1215+ "open-data" : "None" ,
1216+ },
1217+ "Qwen/Qwen2.5-1.5B-Instruct" : {
1218+ "name" : "Qwen2.5-1.5B-Instruct" ,
1219+ "link" : "https://huggingface.co/Qwen/Qwen2.5-1.5B-Instruct" ,
1220+ "prompted" : True ,
1221+ "moe" : False ,
1222+ "size" : 1.5 ,
1223+ "act_param" : 1.5 ,
1224+ "open-data" : "None" ,
1225+ },
1226+ "Qwen/Qwen2.5-7B-Instruct" : {
1227+ "name" : "Qwen2.5-7B-Instruct" ,
1228+ "link" : "https://huggingface.co/Qwen/Qwen2.5-7B-Instruct" ,
1229+ "prompted" : True ,
1230+ "moe" : False ,
1231+ "size" : 7 ,
1232+ "act_param" : 7 ,
1233+ "open-data" : "None" ,
1234+ },
1235+ "Qwen/Qwen2.5-14B-Instruct" : {
1236+ "name" : "Qwen2.5-14B-Instruct" ,
1237+ "link" : "https://huggingface.co/Qwen/Qwen2.5-14B-Instruct" ,
1238+ "prompted" : True ,
1239+ "moe" : False ,
1240+ "size" : 14 ,
1241+ "act_param" : 14 ,
1242+ "open-data" : "None" ,
1243+ },
1244+ "Qwen/Qwen2.5-32B-Instruct" : {
1245+ "name" : "Qwen2.5-32B-Instruct" ,
1246+ "link" : "https://huggingface.co/Qwen/Qwen2.5-32B-Instruct" ,
1247+ "prompted" : True ,
1248+ "moe" : False ,
1249+ "size" : 32 ,
1250+ "act_param" : 32 ,
1251+ "open-data" : "None" ,
1252+ },
1253+ "Qwen/Qwen2.5-72B-Instruct" : {
1254+ "name" : "Qwen2.5-72B-Instruct" ,
1255+ "link" : "https://huggingface.co/Qwen/Qwen2.5-72B-Instruct" ,
1256+ "prompted" : True ,
1257+ "moe" : False ,
1258+ "size" : 72 ,
1259+ "act_param" : 72 ,
1260+ "open-data" : "None" ,
1261+ },
1262+ "meta-llama/Llama-3.2-1B-Instruct" : {
1263+ "name" : "Llama-3.2-1B-Instruct" ,
1264+ "link" : "https://huggingface.co/meta-llama/Llama-3.2-1B-Instruct" ,
1265+ "prompted" : True ,
1266+ "moe" : False ,
1267+ "size" : 1 ,
1268+ "act_param" : 1 ,
1269+ "open-data" : "None" ,
1270+ },
1271+ "meta-llama/Llama-3.2-3B-Instruct" : {
1272+ "name" : "Llama-3.2-3B-Instruct" ,
1273+ "link" : "https://huggingface.co/meta-llama/Llama-3.2-3B-Instruct" ,
1274+ "prompted" : True ,
1275+ "moe" : False ,
1276+ "size" : 3 ,
1277+ "act_param" : 3 ,
1278+ "open-data" : "None" ,
1279+ },
11721280}
0 commit comments