Files
mm-cand-aim_on_task_arithmetic/merge_manifest.json

49 lines
1.9 KiB
JSON
Raw Permalink Normal View History

{
"config_id": "aim_on_task_arithmetic",
"baseline_id": "aim_on_task_arithmetic",
"method_family": "AIM",
"variant": "aim_post_merge",
"calibration_id": "mix",
"parent_config_id": "task_arithmetic_best",
"parent_checkpoint": "outputs/merged/task_arithmetic_best",
"parent_manifest": "outputs/merged/task_arithmetic_best/merge_manifest.json",
"parent_manifest_sha256": "92f74cbaee5cced7e80cb0e8d40cd467c5208ed2536ce74ab909110da18b837d",
"base_model": {
"alias": "base",
"repo": "Qwen/Qwen3-8B-Base",
"revision": "49e3418fbbbca6ecbdf9608b4d22e5a407081db4"
},
"source_models": [
{
"alias": "instr_only",
"repo": "Qwen/Qwen3-8B",
"revision": "b968826d9c46dd6066d109eabc6255188de91218"
},
{
"alias": "reasoning_only",
"repo": "OpenDataArena/Qwen3-8B-ODA-Math-460k",
"revision": "8e8758ee23e5d959dd844b3bb5c5344219544795"
},
{
"alias": "uncensored_only",
"repo": "mlabonne/Qwen3-8B-abliterated",
"revision": "30c72fa348f37c72d12ecbb259068ddee98aa9ed"
}
],
"calibration_corpus": "data/calibration/calib_mix.jsonl",
"calibration_corpus_sha256": "2a06712fad717ca9c6e30f0448eba00f75e1a8441175e38f84dfd34205455bbc",
"calibration_manifest": "data/calibration/calibration_manifest.json",
"calibration_manifest_sha256": "0329db8847280d638976f6565207bc1f3e08f0b877cdadb82d23220f64c2bcb0",
"non_overlap_report": "data/calibration/non_overlap_report.json",
"non_overlap_report_sha256": "73a2efdbd1e304ec8310ba973a9cc3026026e542eefe5bccf4908918af89ca6b",
"aim_repo": "external/ActivationInformedMerging",
"aim_commit": "e7eccd573d010da13dc6f795a23a36f9822851c9",
"aim_patch_script": "code/patches/activation_informed_merging/apply_local_calibration_patch.py",
"aim_patch_script_sha256": "b1f0d5d2aead41d1b750af5c5f5475a2ad5476b2f7bfcc6b81e5a1e42d40b9ad",
"omega": 0.4,
"device": "cuda",
"dtype": "bfloat16",
"run": {
"exit_code": 0
}
}