mirror of
https://github.com/deepseek-ai/ESFT
synced 2024-11-22 19:44:22 +00:00
18d23501ab
update readme update readme update readme Update benchmarks.py Update download_adapters.sh Update esft.py
1 line
758 B
JSON
1 line
758 B
JSON
{"experts": {"1": [62, 25, 32, 30, 27, 55, 48, 33], "10": [0, 43, 37, 51, 1], "11": [62, 24, 57, 55], "12": [30, 17, 25, 28, 48, 42], "13": [19, 55, 51, 44, 21, 3], "14": [40, 5, 12, 36], "15": [8, 29, 30, 23, 60], "16": [24, 34, 3, 62, 38], "17": [55, 56, 42, 13, 57, 46, 52, 8], "18": [51, 35, 30, 25, 0], "19": [17, 53, 56, 47], "2": [7, 51, 33, 19, 42, 20, 46], "20": [57, 5, 26, 17], "21": [31, 53, 54], "22": [6, 25, 61, 57, 19], "23": [4, 36, 2, 60], "24": [20, 14, 16, 21, 53], "25": [57, 49, 8, 37], "26": [48, 36], "3": [58, 45, 44, 7, 22, 2], "4": [59, 9, 52, 13, 61, 26], "5": [31, 42, 15, 55, 35], "6": [6, 14, 19, 37, 12, 40], "7": [33, 20, 17, 16], "8": [46, 25, 2, 17], "9": [25, 46, 0]}, "shared_experts": false, "non_expert_modules": false} |