mirror of
https://github.com/deepseek-ai/ESFT
synced 2024-11-25 13:26:13 +00:00
18d23501ab
update readme update readme update readme Update benchmarks.py Update download_adapters.sh Update esft.py
1 line
586 B
JSON
1 line
586 B
JSON
{"experts": {"1": [35, 22, 13, 43], "10": [25, 9, 13], "11": [4, 17], "12": [28, 61, 56], "13": [15, 14, 45], "14": [5, 56, 27, 46], "15": [23, 30, 55], "16": [16, 9, 20], "17": [26, 62, 29], "18": [30, 59, 52], "19": [24, 22, 58], "2": [23, 33, 1], "20": [38, 43, 4], "21": [17, 15, 53], "22": [11, 55, 5], "23": [58, 54, 46, 4], "24": [47, 23, 57, 1], "25": [63, 29, 52, 46], "26": [56, 17, 21, 52], "3": [15, 5, 42, 14], "4": [51, 2, 59], "5": [55, 53, 63], "6": [23, 55, 41], "7": [16, 46, 32], "8": [63, 25], "9": [0, 44, 12]}, "shared_experts": false, "non_expert_modules": false} |