From e7a907fbc64a3c630d879dc6d54cb96b0f693fa2 Mon Sep 17 00:00:00 2001 From: ModelHub XC Date: Fri, 12 Jun 2026 13:30:30 +0800 Subject: [PATCH] =?UTF-8?q?=E5=88=9D=E5=A7=8B=E5=8C=96=E9=A1=B9=E7=9B=AE?= =?UTF-8?q?=EF=BC=8C=E7=94=B1ModelHub=20XC=E7=A4=BE=E5=8C=BA=E6=8F=90?= =?UTF-8?q?=E4=BE=9B=E6=A8=A1=E5=9E=8B?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit Model: jackf857/llama-3-8b-base-new-dpo-harmless-s_star0.6-q_t0.4 Source: Original Platform --- .gitattributes | 36 + README.md | 78 + all_results.json | 23 + config.json | 29 + eval_results.json | 17 + generation_config.json | 9 + margin_logs/margins.jsonl | 661 ++++++++ model-00001-of-00007.safetensors | 3 + model-00002-of-00007.safetensors | 3 + model-00003-of-00007.safetensors | 3 + model-00004-of-00007.safetensors | 3 + model-00005-of-00007.safetensors | 3 + model-00006-of-00007.safetensors | 3 + model-00007-of-00007.safetensors | 3 + model.safetensors.index.json | 298 ++++ special_tokens_map.json | 23 + tokenizer.json | 3 + tokenizer_config.json | 2064 +++++++++++++++++++++++ train_results.json | 9 + trainer_state.json | 2621 ++++++++++++++++++++++++++++++ 20 files changed, 5892 insertions(+) create mode 100644 .gitattributes create mode 100644 README.md create mode 100644 all_results.json create mode 100644 config.json create mode 100644 eval_results.json create mode 100644 generation_config.json create mode 100644 margin_logs/margins.jsonl create mode 100644 model-00001-of-00007.safetensors create mode 100644 model-00002-of-00007.safetensors create mode 100644 model-00003-of-00007.safetensors create mode 100644 model-00004-of-00007.safetensors create mode 100644 model-00005-of-00007.safetensors create mode 100644 model-00006-of-00007.safetensors create mode 100644 model-00007-of-00007.safetensors create mode 100644 model.safetensors.index.json create mode 100644 special_tokens_map.json create mode 100644 tokenizer.json create mode 100644 tokenizer_config.json create mode 100644 train_results.json create mode 100644 trainer_state.json diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..52373fe --- /dev/null +++ b/.gitattributes @@ -0,0 +1,36 @@ +*.7z filter=lfs diff=lfs merge=lfs -text +*.arrow filter=lfs diff=lfs merge=lfs -text +*.bin filter=lfs diff=lfs merge=lfs -text +*.bz2 filter=lfs diff=lfs merge=lfs -text +*.ckpt filter=lfs diff=lfs merge=lfs -text +*.ftz filter=lfs diff=lfs merge=lfs -text +*.gz filter=lfs diff=lfs merge=lfs -text +*.h5 filter=lfs diff=lfs merge=lfs -text +*.joblib filter=lfs diff=lfs merge=lfs -text +*.lfs.* filter=lfs diff=lfs merge=lfs -text +*.mlmodel filter=lfs diff=lfs merge=lfs -text +*.model filter=lfs diff=lfs merge=lfs -text +*.msgpack filter=lfs diff=lfs merge=lfs -text +*.npy filter=lfs diff=lfs merge=lfs -text +*.npz filter=lfs diff=lfs merge=lfs -text +*.onnx filter=lfs diff=lfs merge=lfs -text +*.ot filter=lfs diff=lfs merge=lfs -text +*.parquet filter=lfs diff=lfs merge=lfs -text +*.pb filter=lfs diff=lfs merge=lfs -text +*.pickle filter=lfs diff=lfs merge=lfs -text +*.pkl filter=lfs diff=lfs merge=lfs -text +*.pt filter=lfs diff=lfs merge=lfs -text +*.pth filter=lfs diff=lfs merge=lfs -text +*.rar filter=lfs diff=lfs merge=lfs -text +*.safetensors filter=lfs diff=lfs merge=lfs -text +saved_model/**/* filter=lfs diff=lfs merge=lfs -text +*.tar.* filter=lfs diff=lfs merge=lfs -text +*.tar filter=lfs diff=lfs merge=lfs -text +*.tflite filter=lfs diff=lfs merge=lfs -text +*.tgz filter=lfs diff=lfs merge=lfs -text +*.wasm filter=lfs diff=lfs merge=lfs -text +*.xz filter=lfs diff=lfs merge=lfs -text +*.zip filter=lfs diff=lfs merge=lfs -text +*.zst filter=lfs diff=lfs merge=lfs -text +*tfevents* filter=lfs diff=lfs merge=lfs -text +tokenizer.json filter=lfs diff=lfs merge=lfs -text diff --git a/README.md b/README.md new file mode 100644 index 0000000..3f889ef --- /dev/null +++ b/README.md @@ -0,0 +1,78 @@ +--- +library_name: transformers +base_model: W-61/llama-3-8b-base-sft-hh-harmless-4xh200 +tags: +- alignment-handbook +- new-dpo +- generated_from_trainer +datasets: +- Anthropic/hh-rlhf +model-index: +- name: llama3-8b-base-new-method-s_star0.6 + results: [] +--- + + + +# llama3-8b-base-new-method-s_star0.6 + +This model is a fine-tuned version of [W-61/llama-3-8b-base-sft-hh-harmless-4xh200](https://huggingface.co/W-61/llama-3-8b-base-sft-hh-harmless-4xh200) on the Anthropic/hh-rlhf dataset. +It achieves the following results on the evaluation set: +- Loss: 0.5591 +- Fcm Dpo/beta: 0.0089 +- Margin Dpo/margin Mean: 55.2826 +- Margin Dpo/margin Std: 95.3567 +- Logps/chosen: -205.2188 +- Logps/rejected: -265.1909 +- Logps/ref Chosen: -74.8595 +- Logps/ref Rejected: -79.5490 +- Logits/chosen: 0.7206 +- Logits/rejected: 0.6751 + +## Model description + +More information needed + +## Intended uses & limitations + +More information needed + +## Training and evaluation data + +More information needed + +## Training procedure + +### Training hyperparameters + +The following hyperparameters were used during training: +- learning_rate: 5e-07 +- train_batch_size: 8 +- eval_batch_size: 8 +- seed: 42 +- distributed_type: multi-GPU +- num_devices: 4 +- gradient_accumulation_steps: 2 +- total_train_batch_size: 64 +- total_eval_batch_size: 32 +- optimizer: Use OptimizerNames.ADAMW_TORCH with betas=(0.9,0.999) and epsilon=1e-08 and optimizer_args=No additional optimizer arguments +- lr_scheduler_type: cosine +- lr_scheduler_warmup_ratio: 0.1 +- num_epochs: 1 + +### Training results + +| Training Loss | Epoch | Step | Validation Loss | Fcm Dpo/beta | Margin Dpo/margin Mean | Margin Dpo/margin Std | Logps/chosen | Logps/rejected | Logps/ref Chosen | Logps/ref Rejected | Logits/chosen | Logits/rejected | +|:-------------:|:------:|:----:|:---------------:|:------------:|:----------------------:|:---------------------:|:------------:|:--------------:|:----------------:|:------------------:|:-------------:|:---------------:| +| 1.0505 | 0.3023 | 200 | 0.5490 | 0.0445 | 12.8367 | 21.5327 | -94.9354 | -112.4616 | -74.8595 | -79.5490 | 0.4353 | 0.3850 | +| 1.0738 | 0.6047 | 400 | 0.5614 | 0.0103 | 44.9123 | 77.2791 | -176.5743 | -226.1761 | -74.8595 | -79.5490 | 0.6246 | 0.5775 | +| 1.1653 | 0.9070 | 600 | 0.5591 | 0.0089 | 55.2826 | 95.3567 | -205.2188 | -265.1909 | -74.8595 | -79.5490 | 0.7206 | 0.6751 | + + +### Framework versions + +- Transformers 4.51.0 +- Pytorch 2.3.1+cu121 +- Datasets 2.21.0 +- Tokenizers 0.21.4 diff --git a/all_results.json b/all_results.json new file mode 100644 index 0000000..1fa2cbf --- /dev/null +++ b/all_results.json @@ -0,0 +1,23 @@ +{ + "epoch": 0.999244142101285, + "eval_fcm_dpo/beta": 0.00873605813831091, + "eval_logits/chosen": 0.7100939750671387, + "eval_logits/rejected": 0.6652560830116272, + "eval_logps/chosen": -206.1328125, + "eval_logps/ref_chosen": -74.85946655273438, + "eval_logps/ref_rejected": -79.54898834228516, + "eval_logps/rejected": -266.35693359375, + "eval_loss": 0.5597169995307922, + "eval_margin_dpo/margin_mean": 55.534568786621094, + "eval_margin_dpo/margin_std": 95.7474365234375, + "eval_runtime": 38.6273, + "eval_samples": 2303, + "eval_samples_per_second": 59.621, + "eval_steps_per_second": 1.864, + "total_flos": 0.0, + "train_loss": 1.120150500454809, + "train_runtime": 1811.4729, + "train_samples": 42336, + "train_samples_per_second": 23.371, + "train_steps_per_second": 0.365 +} \ No newline at end of file diff --git a/config.json b/config.json new file mode 100644 index 0000000..5092b09 --- /dev/null +++ b/config.json @@ -0,0 +1,29 @@ +{ + "architectures": [ + "LlamaForCausalLM" + ], + "attention_bias": false, + "attention_dropout": 0.0, + "bos_token_id": 128000, + "eos_token_id": 128001, + "head_dim": 128, + "hidden_act": "silu", + "hidden_size": 4096, + "initializer_range": 0.02, + "intermediate_size": 14336, + "max_position_embeddings": 8192, + "mlp_bias": false, + "model_type": "llama", + "num_attention_heads": 32, + "num_hidden_layers": 32, + "num_key_value_heads": 8, + "pretraining_tp": 1, + "rms_norm_eps": 1e-05, + "rope_scaling": null, + "rope_theta": 500000.0, + "tie_word_embeddings": false, + "torch_dtype": "float32", + "transformers_version": "4.51.0", + "use_cache": true, + "vocab_size": 128256 +} diff --git a/eval_results.json b/eval_results.json new file mode 100644 index 0000000..15061d2 --- /dev/null +++ b/eval_results.json @@ -0,0 +1,17 @@ +{ + "epoch": 0.999244142101285, + "eval_fcm_dpo/beta": 0.00873605813831091, + "eval_logits/chosen": 0.7100939750671387, + "eval_logits/rejected": 0.6652560830116272, + "eval_logps/chosen": -206.1328125, + "eval_logps/ref_chosen": -74.85946655273438, + "eval_logps/ref_rejected": -79.54898834228516, + "eval_logps/rejected": -266.35693359375, + "eval_loss": 0.5597169995307922, + "eval_margin_dpo/margin_mean": 55.534568786621094, + "eval_margin_dpo/margin_std": 95.7474365234375, + "eval_runtime": 38.6273, + "eval_samples": 2303, + "eval_samples_per_second": 59.621, + "eval_steps_per_second": 1.864 +} \ No newline at end of file diff --git a/generation_config.json b/generation_config.json new file mode 100644 index 0000000..76247c9 --- /dev/null +++ b/generation_config.json @@ -0,0 +1,9 @@ +{ + "bos_token_id": 128000, + "do_sample": true, + "eos_token_id": 128001, + "max_length": 4096, + "temperature": 0.6, + "top_p": 0.9, + "transformers_version": "4.51.0" +} diff --git a/margin_logs/margins.jsonl b/margin_logs/margins.jsonl new file mode 100644 index 0000000..6cfef9d --- /dev/null +++ b/margin_logs/margins.jsonl @@ -0,0 +1,661 @@ +{"epoch": 0.0, "step": 1, "batch_size": 64, "mean": -0.0013527870178222656, "std": 0.2564818859100342, "min": -0.736083984375, "p10": -0.3432229995727539, "median": 0.038166046142578125, "p90": 0.29227676391601565, "max": 0.645111083984375, "pos_frac": 0.578125, "sample": [0.1120758056640625, 0.12518310546875, 0.31621551513671875, 0.13765716552734375, -0.12592506408691406, 0.23141098022460938, -0.21887779235839844, 0.21950721740722656, 0.04480743408203125, 0.020877838134765625, 0.0570220947265625, 0.058269500732421875, -0.4338226318359375, -0.030628204345703125, 0.645111083984375, -0.395477294921875, 0.09050941467285156, 0.0007190704345703125, -0.34615325927734375, 0.016077041625976562, -0.33638572692871094, 0.293853759765625, 0.17610931396484375, 0.22386932373046875, 0.21470260620117188, -0.08536529541015625, 0.0907745361328125, -0.03816986083984375, 0.39190101623535156, 0.16336441040039062, 0.08024787902832031, -0.031158447265625, 0.08477020263671875, 0.002460479736328125, -0.242034912109375, 0.07232666015625, -0.60186767578125, 0.20531463623046875, 0.155731201171875, -0.14299774169921875, -0.25698089599609375, 0.12331962585449219, -0.26497650146484375, 0.15140533447265625, -0.0920257568359375, -0.18599319458007812, 0.19028091430664062, 0.2496490478515625, 0.42162322998046875, 0.17873382568359375, -0.1525421142578125, -0.4972076416015625, 0.32010650634765625, -0.10365867614746094, -0.233795166015625, -0.19828224182128906, -0.4018898010253906, -0.13407135009765625, -0.09596633911132812, 0.031524658203125, 0.28859710693359375, -0.192962646484375, -0.736083984375, 0.3026123046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000001.npy"} +{"epoch": 0.0015117157974300832, "step": 2, "batch_size": 64, "mean": 0.03744968771934509, "std": 0.2875921130180359, "min": -0.7604827880859375, "p10": -0.2812448501586914, "median": 0.03963661193847656, "p90": 0.3654294967651367, "max": 0.8134727478027344, "pos_frac": 0.5625, "sample": [0.30594635009765625, -0.24289894104003906, -0.11509323120117188, -0.13417816162109375, 0.06942558288574219, 0.36568641662597656, -0.14640045166015625, 0.1497650146484375, 0.30261993408203125, 0.10124588012695312, 0.13028717041015625, -0.0031890869140625, 0.0361480712890625, 0.5662612915039062, 0.09694290161132812, -0.01091766357421875, 0.1128997802734375, 0.0411834716796875, -0.21860504150390625, -0.1236419677734375, -0.08812713623046875, 0.10360527038574219, 0.1790008544921875, -0.5114288330078125, 0.3056755065917969, -0.14553451538085938, 0.28168487548828125, 0.26990509033203125, 0.1686878204345703, 0.038089752197265625, 0.19541168212890625, -0.10783576965332031, -0.2644004821777344, -0.19707489013671875, -0.140472412109375, 0.1349811553955078, 0.19672012329101562, -0.0714111328125, 0.53369140625, 0.1271820068359375, 0.8134727478027344, 0.2990264892578125, -0.7604827880859375, -0.08274078369140625, 0.05890846252441406, 0.029361724853515625, 0.4510040283203125, -0.1599273681640625, -0.29346656799316406, 0.10005569458007812, -0.27509117126464844, -0.1937713623046875, 0.19167327880859375, 0.28173065185546875, -0.09406471252441406, -0.3380699157714844, -0.29186248779296875, 0.36483001708984375, 0.009979248046875, 0.44391632080078125, -0.126708984375, -0.6550216674804688, 0.6160736083984375, -0.28388214111328125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000002.npy"} +{"epoch": 0.0030234315948601664, "step": 3, "batch_size": 64, "mean": -0.04198172688484192, "std": 0.32261142134666443, "min": -0.7572402954101562, "p10": -0.49693832397460935, "median": -0.07027435302734375, "p90": 0.3893344879150391, "max": 0.63494873046875, "pos_frac": 0.421875, "sample": [0.08205032348632812, -0.25003623962402344, -0.095489501953125, -0.5428848266601562, 0.3788909912109375, 0.37230682373046875, -0.1027984619140625, 0.0685272216796875, 0.63494873046875, -0.41262054443359375, -0.30046844482421875, -0.454376220703125, -0.4721527099609375, 0.09978675842285156, 0.0134124755859375, 0.24958038330078125, -0.1798248291015625, 0.114044189453125, 0.17412567138671875, -0.27457427978515625, -0.3025665283203125, -0.10743904113769531, -0.07501220703125, 0.4218788146972656, -0.6099090576171875, 0.2885265350341797, 0.6256179809570312, 0.305145263671875, -0.13189315795898438, 0.3245086669921875, 0.055606842041015625, -0.3444061279296875, -0.11013031005859375, -0.2378692626953125, -0.079437255859375, -0.002017974853515625, -0.0655364990234375, -0.53411865234375, -0.10840797424316406, 0.5537261962890625, 0.45458984375, -0.26770782470703125, -0.1485595703125, 0.4827423095703125, 0.19634246826171875, 0.002468109130859375, -0.12972640991210938, 0.09444808959960938, 0.23598098754882812, -0.5075607299804688, -0.5266265869140625, -0.7572402954101562, 0.3938102722167969, 0.18079376220703125, -0.6481781005859375, -0.01328277587890625, 0.196441650390625, -0.38765716552734375, -0.03672027587890625, -0.0483551025390625, -0.14605712890625, -0.15972137451171875, -0.14984130859375, 0.0340728759765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000003.npy"} +{"epoch": 0.0045351473922902496, "step": 4, "batch_size": 64, "mean": 0.022722840309143066, "std": 0.30529195070266724, "min": -0.8279953002929688, "p10": -0.29837455749511715, "median": 0.04853343963623047, "p90": 0.34981613159179686, "max": 1.0779800415039062, "pos_frac": 0.546875, "sample": [-0.4030609130859375, 0.350830078125, 0.1124267578125, -0.8279953002929688, -0.0238037109375, -0.30373382568359375, 0.05287742614746094, 0.351654052734375, 0.3687171936035156, 1.0779800415039062, 0.25439453125, 0.08449554443359375, 0.06561279296875, -0.1245574951171875, -0.0300750732421875, -0.27288818359375, 0.06986618041992188, -0.04917144775390625, -0.27333831787109375, -0.2161865234375, -0.037567138671875, -0.046199798583984375, -0.230743408203125, -0.238006591796875, 0.13322830200195312, 0.14502716064453125, -0.02077484130859375, 0.18889617919921875, 0.09489059448242188, 0.25335693359375, 0.552459716796875, 0.08419036865234375, 0.0289154052734375, 0.13988494873046875, 0.22600555419921875, 0.2879791259765625, -0.008331298828125, 0.07963943481445312, 0.0636138916015625, -0.128143310546875, 0.28050994873046875, -0.11520195007324219, 0.4122047424316406, -0.23202133178710938, 0.06203460693359375, 0.654876708984375, -0.43418121337890625, 0.258697509765625, -0.1044158935546875, -0.15058517456054688, 0.34745025634765625, -0.47785186767578125, -0.2688636779785156, 0.18692398071289062, -0.339569091796875, 0.0334320068359375, -0.009735107421875, 0.3154449462890625, 0.22133636474609375, -0.2858695983886719, -0.7691497802734375, 0.0738067626953125, 0.044189453125, -0.08156585693359375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000004.npy"} +{"epoch": 0.006046863189720333, "step": 5, "batch_size": 64, "mean": -0.043451666831970215, "std": 0.30981379747390747, "min": -1.0077362060546875, "p10": -0.5129764556884765, "median": -0.053882598876953125, "p90": 0.30394592285156263, "max": 0.694183349609375, "pos_frac": 0.421875, "sample": [-0.09662055969238281, -0.18099212646484375, -0.1827526092529297, -0.142730712890625, -0.1404571533203125, -0.5668487548828125, 0.07156562805175781, 0.2546539306640625, 0.33139801025390625, 0.0885162353515625, 0.1129913330078125, -0.565155029296875, -0.23888397216796875, 0.048641204833984375, -0.7220115661621094, -0.5600929260253906, -0.05425262451171875, -0.21500587463378906, -0.0235137939453125, -0.13640594482421875, -0.06752395629882812, -0.08025169372558594, 0.11359596252441406, 0.07106781005859375, -1.0077362060546875, -0.207000732421875, -0.40303802490234375, -0.09217071533203125, 0.1728973388671875, 0.13853836059570312, -0.0535125732421875, -0.11650848388671875, -0.1841583251953125, 0.173095703125, 0.694183349609375, -0.21235275268554688, -0.2887134552001953, 0.160858154296875, 0.048870086669921875, -0.0139312744140625, 0.23087692260742188, 0.0373687744140625, -0.15271759033203125, 0.10651397705078125, 0.53424072265625, -0.1541309356689453, -0.042083740234375, 0.3181915283203125, 0.5571517944335938, -0.570465087890625, 0.16139602661132812, -0.23996734619140625, 0.2707061767578125, 0.640228271484375, 0.159912109375, -0.013580322265625, -0.5809173583984375, -0.0915069580078125, -0.07631683349609375, 0.20147132873535156, -0.2611064910888672, -0.12371826171875, 0.047748565673828125, 0.3315467834472656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000005.npy"} +{"epoch": 0.007558578987150416, "step": 6, "batch_size": 64, "mean": -0.06396755576133728, "std": 0.271879106760025, "min": -0.7890625, "p10": -0.36733341217041016, "median": -0.076812744140625, "p90": 0.2984201431274415, "max": 0.583221435546875, "pos_frac": 0.421875, "sample": [-0.338165283203125, 0.0106201171875, -0.08860015869140625, 0.189544677734375, -0.08608245849609375, -0.3614788055419922, -0.09904861450195312, 0.05257415771484375, -0.2289886474609375, -0.05226898193359375, 0.038471221923828125, 0.364227294921875, -0.17060470581054688, 0.018585205078125, -0.3251953125, 0.3396148681640625, 0.3220062255859375, 0.32270050048828125, -0.19354248046875, -0.5346965789794922, 0.02748870849609375, -0.33274078369140625, 0.09450531005859375, 0.2871742248535156, 0.08797454833984375, -0.1553192138671875, -0.06754302978515625, -0.1655120849609375, -0.2256622314453125, 0.3032398223876953, 0.27200889587402344, -0.176910400390625, 0.3886566162109375, -0.20251083374023438, -0.7265853881835938, 0.08280181884765625, -0.23501205444335938, -0.49259185791015625, -0.27077484130859375, -0.01956939697265625, 0.09012603759765625, 0.07952117919921875, 0.066192626953125, 0.2450714111328125, -0.5121078491210938, -0.2880401611328125, 0.583221435546875, -0.02813720703125, -0.17931747436523438, -0.12440299987792969, 0.08063507080078125, 0.2512359619140625, -0.3171977996826172, -0.40761756896972656, -0.19710922241210938, -0.1668224334716797, -0.10699844360351562, -0.005096435546875, -0.369842529296875, -0.7890625, -0.1580047607421875, 0.1688671112060547, 0.2018260955810547, 0.13634681701660156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000006.npy"} +{"epoch": 0.009070294784580499, "step": 7, "batch_size": 64, "mean": -0.004343748092651367, "std": 0.2991655468940735, "min": -0.7390937805175781, "p10": -0.3599309921264648, "median": 0.03826427459716797, "p90": 0.35006732940673835, "max": 0.5846405029296875, "pos_frac": 0.546875, "sample": [0.031764984130859375, -0.7390937805175781, -0.181365966796875, -0.28308677673339844, 0.377899169921875, 0.33434295654296875, 0.15570640563964844, 0.43511962890625, -0.2527008056640625, 0.35497283935546875, 0.15949630737304688, 0.3386211395263672, 0.1456317901611328, -0.003925323486328125, 0.011249542236328125, -0.0006618499755859375, -0.036876678466796875, -0.10408782958984375, 0.06827163696289062, -0.6949234008789062, 0.060779571533203125, -0.2384796142578125, -0.143402099609375, 0.0579986572265625, 0.226409912109375, 0.04458045959472656, -0.189788818359375, 0.12189483642578125, 0.5846405029296875, 0.1779804229736328, -0.331085205078125, 0.3233795166015625, -0.37229347229003906, 0.5323295593261719, -0.6696853637695312, 0.29498291015625, -0.11354827880859375, 0.22333145141601562, 0.2027301788330078, 0.05087471008300781, -0.1044158935546875, -0.039386749267578125, -0.094696044921875, 0.3162384033203125, -0.322174072265625, 0.03464508056640625, -0.3109245300292969, -0.2894477844238281, 0.10874176025390625, -0.201904296875, 0.04188346862792969, -0.5976181030273438, 0.14584922790527344, -0.18697738647460938, 0.18901824951171875, -0.07962799072265625, -0.19184112548828125, -0.4927978515625, 0.5784759521484375, 0.0483245849609375, 0.048004150390625, 0.068695068359375, 0.4739990234375, -0.3800468444824219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000007.npy"} +{"epoch": 0.010582010582010581, "step": 8, "batch_size": 64, "mean": 0.024642616510391235, "std": 0.352443128824234, "min": -0.874237060546875, "p10": -0.3041717529296875, "median": -0.03726768493652344, "p90": 0.39086608886718754, "max": 1.142333984375, "pos_frac": 0.453125, "sample": [0.2988452911376953, 0.9765167236328125, -0.874237060546875, -0.138336181640625, -0.8180313110351562, 0.19239044189453125, 0.2508087158203125, 0.12615966796875, -0.20199012756347656, -0.2940216064453125, 0.138946533203125, -0.09970855712890625, -0.13245391845703125, -0.12129592895507812, 0.370849609375, 1.142333984375, 0.8131179809570312, 0.16967010498046875, -0.06316375732421875, -0.1042327880859375, 0.024484634399414062, -0.1923828125, -0.23999786376953125, -0.1626129150390625, 0.2302989959716797, -0.07460594177246094, -0.3413848876953125, -0.15283584594726562, 0.17314529418945312, 0.08873748779296875, 0.3931732177734375, -0.12885284423828125, 0.0193939208984375, -0.3070831298828125, -0.07708358764648438, -0.0536041259765625, 0.35785675048828125, 0.17076492309570312, 0.3292388916015625, 0.11693572998046875, 0.6328887939453125, -0.1679973602294922, -0.01293182373046875, -0.29717254638671875, -0.176483154296875, -0.5701828002929688, 0.2982215881347656, -0.2973785400390625, -0.36641502380371094, 0.4541778564453125, -0.18176841735839844, 0.26333045959472656, -0.3507881164550781, 0.04180145263671875, -0.0834808349609375, 0.3854827880859375, -0.23087692260742188, -0.01666259765625, -0.151458740234375, 0.048480987548828125, -0.06011962890625, 0.125030517578125, 0.5066070556640625, -0.020931243896484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000008.npy"} +{"epoch": 0.012093726379440665, "step": 9, "batch_size": 64, "mean": -0.04336252808570862, "std": 0.3272463083267212, "min": -1.0512428283691406, "p10": -0.41162338256835934, "median": -0.005809783935546875, "p90": 0.2795431137084961, "max": 0.87823486328125, "pos_frac": 0.484375, "sample": [-0.48473358154296875, -0.03017425537109375, -0.2949066162109375, 0.010284423828125, -0.1741924285888672, -0.12142562866210938, -0.1871795654296875, -0.657958984375, -0.1727752685546875, -0.348236083984375, -0.35904693603515625, -0.23862075805664062, 0.34465789794921875, 0.21097373962402344, -0.346588134765625, -0.1607208251953125, -0.18871307373046875, 0.560028076171875, 0.010265350341796875, 0.09906005859375, -0.0373382568359375, 0.03173065185546875, 0.87823486328125, 0.15509033203125, -0.2873191833496094, 0.10272979736328125, 0.2351551055908203, -0.074493408203125, 0.16239547729492188, -1.0512428283691406, -0.42153167724609375, -0.47515296936035156, 0.176971435546875, 0.330047607421875, 0.008052825927734375, -0.1783924102783203, 0.10608291625976562, -0.6476325988769531, -0.3885040283203125, 0.10224151611328125, -0.005645751953125, -0.3321342468261719, 0.242919921875, 0.125701904296875, 0.05614280700683594, 0.23783111572265625, 0.2750263214111328, 0.1526508331298828, -0.033294677734375, -0.23826980590820312, 0.049533843994140625, -0.02277374267578125, 0.023134231567382812, 0.2814788818359375, 0.3785247802734375, 0.7438812255859375, 0.08829879760742188, -0.27292633056640625, 0.1981048583984375, 0.135711669921875, -0.25469970703125, -0.697357177734375, -0.0981903076171875, -0.00597381591796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000009.npy"} +{"epoch": 0.013605442176870748, "step": 10, "batch_size": 64, "mean": 0.019409894943237305, "std": 0.3381289541721344, "min": -0.8375701904296875, "p10": -0.3992046356201172, "median": 0.03704833984375, "p90": 0.3601150512695313, "max": 1.111541748046875, "pos_frac": 0.546875, "sample": [-0.1129608154296875, -0.0860443115234375, -0.08916473388671875, 0.00188446044921875, -0.2246246337890625, -0.8375701904296875, -0.1435413360595703, 0.3529052734375, -0.48944091796875, 0.26802825927734375, 0.10845184326171875, 0.11957168579101562, -0.46993255615234375, 0.04681396484375, 0.195831298828125, -0.04119873046875, 0.1483173370361328, -0.01715087890625, 0.376708984375, -0.2831916809082031, 0.05576515197753906, -0.07813453674316406, 0.528594970703125, 0.5237579345703125, -0.08731842041015625, -0.19510269165039062, -0.395751953125, -0.353424072265625, 0.3249473571777344, -0.16251373291015625, -0.04685211181640625, 0.352569580078125, 0.09577178955078125, -0.10973358154296875, 0.21998214721679688, 0.21600341796875, -0.23913955688476562, 0.2774066925048828, 0.031707763671875, 0.23627853393554688, 0.002391815185546875, -0.4006843566894531, 0.0811004638671875, 0.23494720458984375, -0.17826080322265625, 0.10111618041992188, -0.633636474609375, -0.00228118896484375, 0.3326416015625, -0.7223968505859375, -0.0006103515625, 0.706695556640625, 0.042388916015625, 0.07421875, 0.2917976379394531, -0.02799224853515625, 1.111541748046875, 0.05002784729003906, 0.25037384033203125, 0.07891845703125, 0.3632049560546875, -0.38149261474609375, 0.4854583740234375, -0.6357421875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000010.npy"} +{"epoch": 0.015117157974300832, "step": 11, "batch_size": 64, "mean": 0.020615994930267334, "std": 0.3354145884513855, "min": -0.87548828125, "p10": -0.3877235412597656, "median": 0.08286285400390625, "p90": 0.40000534057617193, "max": 0.843292236328125, "pos_frac": 0.578125, "sample": [-0.35793304443359375, 0.037872314453125, -0.1992034912109375, 0.11615371704101562, -0.20163345336914062, 0.12691116333007812, -0.1767864227294922, 0.12452507019042969, 0.3114013671875, -0.5652923583984375, 0.5246963500976562, 0.27108001708984375, 0.38080596923828125, 0.12929153442382812, -0.08264732360839844, -0.16736984252929688, 0.4804840087890625, -0.268218994140625, 0.097015380859375, 0.00041961669921875, 0.2924690246582031, 0.0687103271484375, 0.35874176025390625, -0.033782958984375, -0.39411163330078125, -0.113525390625, -0.36810302734375, 0.2213916778564453, 0.147369384765625, 0.2972373962402344, -0.040264129638671875, 0.13144874572753906, -0.19587326049804688, 0.408233642578125, -0.12874984741210938, -0.00139617919921875, -0.3728179931640625, 0.843292236328125, 0.19774627685546875, 0.240081787109375, -0.55621337890625, 0.4857940673828125, -0.27599334716796875, 0.061275482177734375, -0.23402023315429688, -0.87548828125, 0.22509384155273438, 0.13301849365234375, 0.22092437744140625, 0.6900711059570312, 0.15554428100585938, -0.5411834716796875, -0.1485462188720703, 0.002193450927734375, 0.10039520263671875, 0.119781494140625, -0.047443389892578125, 0.1701202392578125, -0.5357437133789062, -0.7805938720703125, 0.412078857421875, 0.319793701171875, -0.26922607421875, 0.34812164306640625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000011.npy"} +{"epoch": 0.016628873771730914, "step": 12, "batch_size": 64, "mean": 0.051781415939331055, "std": 0.2990102767944336, "min": -0.4466094970703125, "p10": -0.29737167358398436, "median": -0.004532814025878906, "p90": 0.39180221557617195, "max": 0.909027099609375, "pos_frac": 0.5, "sample": [-0.14056777954101562, -0.17279052734375, 0.14368247985839844, 0.2694587707519531, -0.07523345947265625, -0.1941986083984375, 0.2027435302734375, 0.095947265625, 0.19960975646972656, -0.19939804077148438, -0.32428741455078125, 0.4373130798339844, -0.231536865234375, 0.10906982421875, 0.0360870361328125, -0.09310150146484375, -0.085052490234375, -0.42996978759765625, 0.19439697265625, 0.10242652893066406, -0.13724136352539062, -0.3349456787109375, -0.30731201171875, 0.3973388671875, 0.31307411193847656, -0.3939018249511719, -0.4451274871826172, -0.27417755126953125, -0.09087753295898438, 0.1399250030517578, -0.17314529418945312, -0.0371246337890625, -0.1430511474609375, -0.4466094970703125, -0.03893280029296875, 0.10553550720214844, -0.009380340576171875, 0.3671112060546875, 0.15744781494140625, -0.2315387725830078, 0.21073150634765625, 0.0003147125244140625, -0.09290313720703125, 0.19947242736816406, 0.7079620361328125, 0.6305522918701172, -0.2568511962890625, 0.250518798828125, 0.278289794921875, 0.6895408630371094, 0.37888336181640625, 0.3013744354248047, 0.2624683380126953, 0.909027099609375, 0.0485382080078125, 0.6390609741210938, -0.05643463134765625, 0.29642486572265625, -0.18575668334960938, -0.2516632080078125, -0.14163970947265625, -0.0513153076171875, 0.34821510314941406, -0.062465667724609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000012.npy"} +{"epoch": 0.018140589569160998, "step": 13, "batch_size": 64, "mean": -0.022946447134017944, "std": 0.30812835693359375, "min": -0.856781005859375, "p10": -0.40518875122070314, "median": -0.009311676025390625, "p90": 0.3406209945678711, "max": 0.6244449615478516, "pos_frac": 0.46875, "sample": [-0.856781005859375, 0.03649139404296875, 0.522796630859375, -0.0053253173828125, -0.07928466796875, -0.698699951171875, 0.2710533142089844, 0.2446746826171875, -0.16443634033203125, 0.09099578857421875, -0.06397628784179688, -0.11374092102050781, 0.14305877685546875, 0.2749481201171875, 0.15098953247070312, 0.3395500183105469, -0.087066650390625, -0.2541770935058594, 0.0458221435546875, 0.09832000732421875, 0.04178619384765625, -0.4949607849121094, -0.0037994384765625, -0.4476165771484375, -0.36476898193359375, 0.32135772705078125, 0.00283050537109375, -0.26648902893066406, -0.2801055908203125, -0.39463043212890625, -0.11033058166503906, 0.16449737548828125, 0.4351043701171875, -0.5693702697753906, -0.3221588134765625, 0.6244449615478516, -0.01329803466796875, -0.014019012451171875, 0.3149394989013672, -0.02593231201171875, 0.08579826354980469, -0.0286407470703125, -0.16580963134765625, -0.3440132141113281, -0.4097137451171875, 0.3409900665283203, -0.0557098388671875, 0.468902587890625, -0.238800048828125, 0.0155792236328125, 0.3318138122558594, 0.33975982666015625, -0.2087726593017578, 0.0047130584716796875, 0.4697113037109375, -0.34905242919921875, -0.6664276123046875, 0.09031486511230469, 0.1256866455078125, 0.38063621520996094, -0.0262298583984375, 0.0638885498046875, -0.05627250671386719, -0.12961769104003906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000013.npy"} +{"epoch": 0.019652305366591082, "step": 14, "batch_size": 64, "mean": 0.06008493900299072, "std": 0.3543643057346344, "min": -0.6910858154296875, "p10": -0.29991531372070307, "median": 0.030269622802734375, "p90": 0.46559753417968774, "max": 1.225372314453125, "pos_frac": 0.546875, "sample": [0.14774703979492188, -0.32098388671875, -0.471832275390625, 0.18935394287109375, 0.08307075500488281, 0.18294525146484375, 0.1099395751953125, 1.11700439453125, -0.14616012573242188, -0.09718894958496094, -0.14044952392578125, 0.14907455444335938, 0.2072010040283203, -0.22475433349609375, 0.04196929931640625, -0.04860877990722656, -0.028421401977539062, 0.30570220947265625, -0.24739837646484375, 0.07049179077148438, -0.21895217895507812, -0.4050407409667969, 0.15260887145996094, -0.23224639892578125, 0.16646575927734375, -0.18597412109375, -0.117431640625, 0.48842620849609375, 0.2508068084716797, 0.6795654296875, 0.41233062744140625, 1.0863418579101562, 0.07164764404296875, 1.225372314453125, 0.26997947692871094, -0.123138427734375, 0.22986221313476562, 0.0254364013671875, 0.12425041198730469, -0.6910858154296875, 0.254730224609375, 0.5450553894042969, -0.21963882446289062, 0.640380859375, -0.10102462768554688, -0.038562774658203125, -0.16613006591796875, -0.338775634765625, 0.07475471496582031, -0.06191444396972656, 0.010162353515625, -0.4939842224121094, 0.04631614685058594, -0.3367462158203125, 0.1250152587890625, 0.18604278564453125, 0.03510284423828125, -0.1817474365234375, -0.1298542022705078, -0.25075531005859375, -0.12557411193847656, -0.0565643310546875, 0.32659912109375, 0.014621734619140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000014.npy"} +{"epoch": 0.021164021164021163, "step": 15, "batch_size": 64, "mean": -0.029221028089523315, "std": 0.31245914101600647, "min": -0.8779754638671875, "p10": -0.3564990997314453, "median": -0.09288311004638672, "p90": 0.3515838623046875, "max": 1.1569976806640625, "pos_frac": 0.390625, "sample": [0.18373489379882812, -0.1577606201171875, -0.1848430633544922, -0.06588363647460938, -0.3653831481933594, -0.04378509521484375, -0.062591552734375, -0.30728912353515625, -0.470458984375, -0.3357696533203125, 0.29019927978515625, -0.18724822998046875, 0.0388946533203125, -0.14234352111816406, -0.039031982421875, 0.04933929443359375, 1.1569976806640625, -0.21475601196289062, 0.3247814178466797, -0.40129661560058594, 0.350921630859375, -0.16495513916015625, 0.021732330322265625, -0.24829483032226562, -0.11576461791992188, 0.24501800537109375, 0.48996734619140625, -0.2650299072265625, -0.3667755126953125, -0.30057525634765625, 0.1019439697265625, -0.207794189453125, -0.14226531982421875, -0.5839309692382812, 0.40073394775390625, -0.47151947021484375, 0.0455322265625, -0.1458587646484375, -0.09995079040527344, 0.1764984130859375, -0.10736083984375, -0.1351776123046875, -0.23438262939453125, 0.38031005859375, 0.2884178161621094, -0.8779754638671875, -0.32379913330078125, -0.1167755126953125, 0.27768516540527344, 0.4853363037109375, -0.14803314208984375, 0.16379356384277344, 0.05365562438964844, -0.0858154296875, 0.07592010498046875, 0.35186767578125, 0.0901947021484375, -0.12524032592773438, -0.036991119384765625, -0.018833160400390625, 0.5255126953125, -0.23902130126953125, 0.2644386291503906, -0.1630115509033203], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000015.npy"} +{"epoch": 0.022675736961451247, "step": 16, "batch_size": 64, "mean": 0.027941584587097168, "std": 0.25433027744293213, "min": -0.4372711181640625, "p10": -0.21688804626464842, "median": -0.0125274658203125, "p90": 0.3108978271484376, "max": 1.0721282958984375, "pos_frac": 0.46875, "sample": [0.1760997772216797, 0.22381591796875, -0.186248779296875, 0.012302398681640625, -0.01776123046875, -0.11184883117675781, 0.09255218505859375, -0.1600799560546875, 0.57635498046875, -0.1965484619140625, -0.1232147216796875, 0.00087738037109375, -0.014980316162109375, -0.08568572998046875, 0.2661628723144531, -0.2806968688964844, 0.3196296691894531, -0.09027671813964844, 0.22197723388671875, -0.04827880859375, 0.03318023681640625, -0.38962554931640625, 0.5804443359375, 0.2550926208496094, -0.0023345947265625, 0.1401519775390625, 0.0163421630859375, 0.0584564208984375, 0.2151947021484375, 1.0721282958984375, 0.56158447265625, -0.12945556640625, 0.374114990234375, 0.026424407958984375, -0.0751800537109375, -0.37175750732421875, 0.0786285400390625, -0.07159423828125, -0.4027900695800781, -0.15947341918945312, -0.22134780883789062, -0.010074615478515625, -0.01859283447265625, 0.0920562744140625, 0.12099456787109375, 0.2905235290527344, -0.114837646484375, -0.20648193359375, 0.03934478759765625, -0.31972694396972656, -0.05732154846191406, -0.12072372436523438, 0.06295013427734375, -0.017307281494140625, -0.0382080078125, -0.05158042907714844, -0.03826141357421875, -0.168121337890625, -0.4372711181640625, 0.09065818786621094, 0.1409168243408203, -0.08447265625, 0.1309814453125, 0.3404808044433594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000016.npy"} +{"epoch": 0.02418745275888133, "step": 17, "batch_size": 64, "mean": 0.06366986036300659, "std": 0.357475221157074, "min": -1.184112548828125, "p10": -0.2556148529052734, "median": 0.050568580627441406, "p90": 0.45443305969238296, "max": 1.1582183837890625, "pos_frac": 0.59375, "sample": [0.0873565673828125, 0.1313323974609375, 0.0020542144775390625, -0.03973960876464844, 1.01361083984375, 0.28847503662109375, 0.113555908203125, -0.150177001953125, 0.16538238525390625, -0.186187744140625, 0.2797088623046875, 0.16480636596679688, -0.2633533477783203, 0.08198928833007812, -0.24064254760742188, -0.13204574584960938, 0.0648345947265625, 0.013439178466796875, 0.19467735290527344, 0.21291351318359375, -0.2229461669921875, 0.009120941162109375, -1.184112548828125, -0.07321929931640625, -0.13005828857421875, -0.1410541534423828, 0.5154647827148438, -0.09707450866699219, 0.201324462890625, -0.6115608215332031, -0.48906707763671875, -0.5495834350585938, 0.08315277099609375, -0.11556625366210938, 1.1582183837890625, 0.6767730712890625, 0.06447219848632812, -0.011993408203125, 0.3491058349609375, 0.04156494140625, -0.0491485595703125, 0.021724700927734375, 0.2426433563232422, 0.40418243408203125, 0.1405487060546875, -0.030548095703125, 0.4700164794921875, 0.75079345703125, 0.6495437622070312, 0.353912353515625, 0.23602676391601562, -0.3849945068359375, -0.26203155517578125, 0.05957221984863281, 0.1215972900390625, -0.22636032104492188, 0.10623359680175781, 0.136260986328125, -0.00534820556640625, 0.0297698974609375, 0.4180717468261719, -0.04750823974609375, -0.1314411163330078, -0.2035980224609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000017.npy"} +{"epoch": 0.025699168556311415, "step": 18, "batch_size": 64, "mean": 0.051440656185150146, "std": 0.24022811651229858, "min": -0.5367355346679688, "p10": -0.22108993530273435, "median": 0.0330352783203125, "p90": 0.3614631652832031, "max": 0.553985595703125, "pos_frac": 0.5625, "sample": [0.2502021789550781, 0.10062789916992188, 0.16594886779785156, -0.07047080993652344, 0.022006988525390625, 0.09182357788085938, 0.061065673828125, 0.4899749755859375, 0.50482177734375, 0.01964569091796875, 0.044063568115234375, 0.3202972412109375, -0.0006656646728515625, -0.07827949523925781, 0.017364501953125, 0.3341064453125, 0.059474945068359375, -0.42404937744140625, 0.20194625854492188, 0.361602783203125, 0.30583953857421875, 0.553985595703125, 0.0768280029296875, 0.4828033447265625, 0.19252777099609375, -0.12376785278320312, 0.26108551025390625, 0.2609062194824219, 0.19157791137695312, -0.010972976684570312, -0.037075042724609375, -0.09140777587890625, -0.2705535888671875, -0.0919647216796875, -0.15679168701171875, -0.4173126220703125, 0.071380615234375, -0.15773963928222656, -0.5367355346679688, 0.26336669921875, -0.20767974853515625, -0.5193557739257812, -0.09226226806640625, -0.226837158203125, -0.039241790771484375, 0.3001556396484375, -0.04511260986328125, 0.1369342803955078, 0.061069488525390625, -0.27706146240234375, 0.36113739013671875, -0.017045974731445312, -0.09973526000976562, -0.0039348602294921875, -0.06565093994140625, -0.07245635986328125, 0.00438690185546875, -0.16149330139160156, 0.4289131164550781, 0.06557846069335938, 0.37116241455078125, -0.12215423583984375, 0.20373916625976562, 0.07165908813476562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000018.npy"} +{"epoch": 0.027210884353741496, "step": 19, "batch_size": 64, "mean": 0.053305551409721375, "std": 0.3574451804161072, "min": -1.48504638671875, "p10": -0.19431915283203124, "median": 0.07643604278564453, "p90": 0.428713607788086, "max": 0.8997344970703125, "pos_frac": 0.5625, "sample": [0.42315673828125, 0.1797637939453125, 0.14099884033203125, -0.13909912109375, 0.15715789794921875, 0.4310951232910156, 0.1028594970703125, -0.10912322998046875, -0.430389404296875, -0.09244155883789062, 0.177978515625, 0.2276153564453125, 0.388519287109375, 0.05001258850097656, 0.2453765869140625, -0.10874366760253906, 0.1254596710205078, -0.013994216918945312, -0.11019515991210938, 0.1907634735107422, 0.3574981689453125, -0.1838836669921875, -0.07673263549804688, -0.172576904296875, 0.6175079345703125, 0.6234817504882812, 0.3483734130859375, 0.1482086181640625, -0.27825164794921875, -0.19879150390625, 0.1921844482421875, 0.14036178588867188, -0.18369293212890625, 0.015384674072265625, -1.48504638671875, -1.0800628662109375, -0.243560791015625, -0.014177322387695312, 0.743560791015625, 0.15624046325683594, 0.16431236267089844, -0.1466693878173828, -0.02532958984375, -0.18280029296875, 0.122772216796875, 0.34414100646972656, 0.45238494873046875, 0.037384033203125, -0.15554046630859375, 0.49019622802734375, 0.8997344970703125, -0.07363128662109375, -0.15833282470703125, -0.17246723175048828, 0.11025238037109375, 0.10790634155273438, -0.37734222412109375, -0.08847808837890625, -0.04386711120605469, 0.255859375, 0.23505210876464844, -0.030826568603515625, 0.3554840087890625, 0.028564453125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000019.npy"} +{"epoch": 0.02872260015117158, "step": 20, "batch_size": 64, "mean": 0.03143279254436493, "std": 0.31017181277275085, "min": -0.76629638671875, "p10": -0.3445831298828125, "median": -0.0043888092041015625, "p90": 0.40684356689453127, "max": 0.9925384521484375, "pos_frac": 0.484375, "sample": [-0.06719970703125, -0.14977645874023438, -0.18285369873046875, -0.091033935546875, -0.11297988891601562, -0.03179168701171875, -0.24716949462890625, 0.13214111328125, 0.3703346252441406, -0.34850311279296875, 0.14498138427734375, 0.2672233581542969, 0.1021270751953125, 0.06261444091796875, -0.0653839111328125, -0.1918048858642578, -0.4976959228515625, -0.24495506286621094, 0.4218788146972656, -0.3447914123535156, 0.043399810791015625, 0.10161209106445312, -0.12838363647460938, 0.21646881103515625, -0.14717864990234375, 0.508148193359375, -0.059413909912109375, -0.010698318481445312, 0.498565673828125, -0.06562423706054688, -0.69622802734375, -0.5797271728515625, -0.07039642333984375, -0.15881729125976562, -0.76629638671875, 0.4947624206542969, 0.051639556884765625, 0.4028167724609375, -0.0086822509765625, -0.12938690185546875, 0.10400390625, -0.0126953125, 0.2194366455078125, -0.1081085205078125, 0.07143402099609375, 0.9925384521484375, 0.4085693359375, -0.0167236328125, 0.31276702880859375, 0.0985565185546875, -0.353851318359375, 0.30391693115234375, -0.3440971374511719, 0.7526779174804688, -9.5367431640625e-05, 0.21120643615722656, 0.3076667785644531, 0.26270294189453125, 0.22455596923828125, 0.045879364013671875, -0.1262054443359375, 0.22344970703125, 0.06402206420898438, -0.051850318908691406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000020.npy"} +{"epoch": 0.030234315948601664, "step": 21, "batch_size": 64, "mean": -0.045765221118927, "std": 0.2906523644924164, "min": -0.74090576171875, "p10": -0.3026935577392578, "median": -0.10069561004638672, "p90": 0.25765762329101566, "max": 0.9508285522460938, "pos_frac": 0.359375, "sample": [-0.15053558349609375, -0.2900524139404297, -0.14768218994140625, -0.0020294189453125, -0.11345672607421875, 0.1673431396484375, -0.00878143310546875, -0.2626953125, -0.22713088989257812, -0.2398357391357422, 0.04850006103515625, -0.337493896484375, 0.097320556640625, -0.27459716796875, 0.0811309814453125, 0.41031646728515625, -0.19008636474609375, 0.9508285522460938, -0.2330169677734375, -0.2505626678466797, 0.12805938720703125, -0.07076263427734375, -0.08005714416503906, -0.10750579833984375, 0.47100830078125, -0.74090576171875, -0.007640838623046875, 0.26152801513671875, 0.16866302490234375, 0.12261199951171875, -0.074554443359375, -0.30811119079589844, 0.21746826171875, -0.053302764892578125, -0.2569732666015625, 0.5451183319091797, 0.248626708984375, -0.2826385498046875, -0.338348388671875, -0.45267486572265625, -0.20420074462890625, -0.20227813720703125, 0.07708740234375, 0.10251426696777344, 0.125823974609375, -0.1668109893798828, -0.08621978759765625, 0.09705734252929688, -0.46657562255859375, 0.030361175537109375, -0.18556594848632812, -0.56597900390625, -0.1656665802001953, -0.256317138671875, -0.14267921447753906, -0.14747238159179688, 0.057292938232421875, -0.09388542175292969, 0.3199501037597656, 0.8441162109375, -0.23923492431640625, -0.10770416259765625, 0.23668670654296875, -0.20636558532714844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000021.npy"} +{"epoch": 0.031746031746031744, "step": 22, "batch_size": 64, "mean": -0.02719232439994812, "std": 0.3017886281013489, "min": -0.7225189208984375, "p10": -0.4063697814941406, "median": 0.006821632385253906, "p90": 0.3308160781860353, "max": 0.6414947509765625, "pos_frac": 0.53125, "sample": [-0.6598434448242188, -0.709014892578125, -0.31777191162109375, 0.009006500244140625, 0.17787551879882812, 0.11153411865234375, 0.10295486450195312, -0.4171295166015625, -0.08838844299316406, 0.2027435302734375, 0.029285430908203125, 0.21056365966796875, -0.1485271453857422, 0.0525665283203125, 0.21472930908203125, 0.0426025390625, -0.350128173828125, -0.24630355834960938, -0.12624359130859375, -0.38126373291015625, 0.530426025390625, -0.0684661865234375, 0.1977996826171875, 0.11606407165527344, 0.076904296875, 0.6414947509765625, 0.07976531982421875, 0.030506134033203125, 0.0046367645263671875, 0.002361297607421875, -0.7225189208984375, -0.5756378173828125, -0.3801383972167969, 0.2590484619140625, 0.2180156707763672, -0.284149169921875, 0.10008049011230469, -0.5370941162109375, -0.33559417724609375, -0.0579681396484375, 0.4363212585449219, -0.442138671875, 0.23297882080078125, 0.18402099609375, -0.004062652587890625, -0.181915283203125, -0.02947998046875, -0.1006011962890625, -0.04224395751953125, 0.3852386474609375, 0.041973114013671875, 0.4423828125, -0.1928863525390625, 0.472808837890625, -0.0130462646484375, 0.016843795776367188, 0.2907390594482422, 0.21769332885742188, 0.347991943359375, -0.367034912109375, -0.102783203125, -0.3295860290527344, 0.21021461486816406, -0.2185211181640625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000022.npy"} +{"epoch": 0.03325774754346183, "step": 23, "batch_size": 64, "mean": 0.02588629722595215, "std": 0.3233484625816345, "min": -0.970672607421875, "p10": -0.2834091186523437, "median": 0.009592056274414062, "p90": 0.44495315551757814, "max": 0.8207244873046875, "pos_frac": 0.53125, "sample": [-0.7049713134765625, 0.013519287109375, -0.092559814453125, 0.45062255859375, -0.12572288513183594, 0.37262535095214844, -0.00955963134765625, 0.8207244873046875, -0.1513519287109375, 0.0110321044921875, 0.38401031494140625, -0.13522911071777344, 0.08380889892578125, 0.09180068969726562, 0.2611732482910156, 0.01025390625, -0.40917205810546875, 0.22530364990234375, -0.197998046875, 0.004669189453125, 0.12850189208984375, 0.2552070617675781, -0.010824203491210938, -0.190277099609375, 0.008930206298828125, 0.261810302734375, -0.07413482666015625, 0.03020477294921875, 0.5322113037109375, 0.03542327880859375, -0.970672607421875, 0.17662811279296875, -0.2226104736328125, 0.435943603515625, 0.44881439208984375, -0.1860809326171875, -0.57177734375, 0.205902099609375, -0.11726760864257812, -0.14934921264648438, -0.2415924072265625, -0.435546875, 0.018131256103515625, -0.005279541015625, 0.6103553771972656, -0.089508056640625, -0.20426177978515625, 0.08638381958007812, -0.03951263427734375, -0.24053955078125, -0.5867462158203125, -0.040607452392578125, 0.11521530151367188, -0.13874244689941406, -0.14442825317382812, 0.062458038330078125, 0.6422882080078125, -0.30133056640625, 0.29932403564453125, 0.3950767517089844, 0.61163330078125, 0.11522674560546875, 0.24114036560058594, -0.00197601318359375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000023.npy"} +{"epoch": 0.03476946334089191, "step": 24, "batch_size": 64, "mean": -0.03844273090362549, "std": 0.26216158270835876, "min": -0.617767333984375, "p10": -0.36543292999267574, "median": -0.05375099182128906, "p90": 0.26255989074707037, "max": 0.578094482421875, "pos_frac": 0.421875, "sample": [-0.4184837341308594, -0.20508956909179688, -0.1900482177734375, 0.15815353393554688, 0.11945343017578125, -0.04859161376953125, 0.18297958374023438, 0.05084991455078125, -0.4038810729980469, -0.15781402587890625, 0.019029617309570312, -0.174774169921875, -0.14595603942871094, -0.097503662109375, 0.47747039794921875, -0.07269287109375, -0.11826705932617188, -0.21421051025390625, -0.2808036804199219, 0.15904617309570312, -0.33985137939453125, 0.12322616577148438, 0.3856201171875, -0.3901786804199219, 0.212249755859375, 0.0356292724609375, -0.15773773193359375, -0.2743034362792969, -0.617767333984375, -0.1141510009765625, 0.2384929656982422, -0.045623779296875, -0.2159576416015625, -0.3727703094482422, 0.00872039794921875, -0.1410980224609375, -0.24636077880859375, -0.11902999877929688, 0.07331085205078125, -0.051403045654296875, 0.527252197265625, 0.36163330078125, 0.2692718505859375, 0.22236251831054688, 0.5691680908203125, -0.1862640380859375, -0.05609893798828125, -0.5142669677734375, 0.10333061218261719, -0.44769287109375, 0.0917816162109375, -0.2824363708496094, -0.0152435302734375, -0.01586151123046875, 0.0989990234375, 0.06884765625, 0.13130950927734375, -0.3133544921875, -0.25003814697265625, 0.24689865112304688, -0.08055877685546875, -0.3483123779296875, 0.578094482421875, 0.15096092224121094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000024.npy"} +{"epoch": 0.036281179138321996, "step": 25, "batch_size": 64, "mean": 0.06195506453514099, "std": 0.30696606636047363, "min": -0.9359130859375, "p10": -0.2854103088378906, "median": 0.08290863037109375, "p90": 0.34499511718750003, "max": 1.2019805908203125, "pos_frac": 0.671875, "sample": [-0.10469818115234375, -0.20440673828125, -0.026689529418945312, 0.07466888427734375, 0.23430633544921875, 0.08723258972167969, 0.19769287109375, 0.01857757568359375, 0.1200408935546875, 0.3466682434082031, -0.395111083984375, 0.08047866821289062, -0.290557861328125, -0.427215576171875, 0.770477294921875, 0.0633087158203125, -0.27339935302734375, 0.08533859252929688, 0.15015792846679688, 0.3413848876953125, -0.056549072265625, 0.21759414672851562, -0.15139007568359375, 1.2019805908203125, 0.4197731018066406, 0.06278610229492188, 0.2764472961425781, -0.46356201171875, 0.13145065307617188, -0.18106460571289062, 0.09218978881835938, 0.1662425994873047, 0.28200531005859375, 0.2138671875, 0.23486328125, 0.11457443237304688, 0.05413818359375, 0.10794830322265625, -0.07400131225585938, -0.2605438232421875, -0.9359130859375, -0.16971969604492188, 0.15246963500976562, 0.07788276672363281, -0.06114959716796875, 0.06574249267578125, 0.3465423583984375, -0.10548782348632812, 0.1966705322265625, -0.5830078125, 0.18473052978515625, 0.13566017150878906, 0.20902252197265625, -0.037578582763671875, -0.32349395751953125, 0.06952285766601562, 0.0502777099609375, 0.19736862182617188, 0.48722076416015625, 0.0178985595703125, 0.10720062255859375, 0.5618133544921875, -0.18813705444335938, 0.2725830078125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000025.npy"} +{"epoch": 0.03779289493575208, "step": 26, "batch_size": 64, "mean": 0.029800832271575928, "std": 0.29926609992980957, "min": -0.8420257568359375, "p10": -0.2704889297485351, "median": -0.0026397705078125, "p90": 0.41131286621093754, "max": 0.7847900390625, "pos_frac": 0.484375, "sample": [0.4037933349609375, 0.3265380859375, -0.14723968505859375, 0.0621337890625, 0.09585952758789062, -0.15991783142089844, -0.0425567626953125, -0.24853515625, -0.16318893432617188, 0.2760276794433594, -0.042751312255859375, 0.7847900390625, 0.537200927734375, -0.2349395751953125, -0.6038970947265625, -0.01122283935546875, 0.056842803955078125, 0.5875492095947266, -0.03374481201171875, 0.0703125, -0.1116485595703125, -0.021856307983398438, -0.40906524658203125, 0.1949939727783203, 0.2205657958984375, -0.13924407958984375, 0.23647308349609375, -0.18337249755859375, 0.22662925720214844, -0.0572357177734375, 0.12171745300292969, 0.6623764038085938, 0.0179901123046875, 0.16838836669921875, -0.0751953125, 0.12249755859375, -0.22748565673828125, 0.16364097595214844, -0.00067138671875, 0.19781494140625, 0.13062095642089844, -0.004608154296875, -0.04548454284667969, -0.08933258056640625, 0.5095405578613281, -0.22762298583984375, -0.8420257568359375, -0.04185676574707031, -0.610015869140625, -0.1301136016845703, 0.4145355224609375, -0.45882415771484375, 0.3914909362792969, 0.47084808349609375, -0.27989768981933594, 0.212005615234375, -0.30542755126953125, -0.18959617614746094, -0.13915252685546875, 0.20157814025878906, 0.170196533203125, 0.12354850769042969, -0.04830741882324219, 0.07478713989257812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000026.npy"} +{"epoch": 0.039304610733182165, "step": 27, "batch_size": 64, "mean": 0.007359504699707031, "std": 0.26162222027778625, "min": -0.53204345703125, "p10": -0.2994827270507812, "median": 0.015827178955078125, "p90": 0.3674528121948243, "max": 0.900634765625, "pos_frac": 0.546875, "sample": [-0.16038131713867188, 0.2852611541748047, -0.26934814453125, 0.04386329650878906, 0.017513275146484375, -0.184417724609375, 0.1556243896484375, -0.27178955078125, 0.13681793212890625, -0.006317138671875, -0.3566131591796875, 0.0516815185546875, 0.3921318054199219, 0.059726715087890625, -0.07156181335449219, -0.46331024169921875, 0.06818580627441406, 0.143310546875, 0.0454559326171875, -0.2748870849609375, 0.4959869384765625, -0.2858428955078125, -0.059478759765625, -0.114349365234375, 0.169342041015625, -0.2209014892578125, -0.11260986328125, 0.040248870849609375, 0.34603118896484375, -0.2484111785888672, -0.38883209228515625, -0.0566253662109375, 0.14307212829589844, 0.0223236083984375, 0.3844947814941406, -0.305328369140625, 0.37325096130371094, 0.4301910400390625, 0.151458740234375, 0.0656280517578125, 0.008270263671875, -0.11808013916015625, 0.06742668151855469, 0.014141082763671875, -0.109649658203125, 0.34059906005859375, -0.41728973388671875, 0.3539237976074219, 0.1424102783203125, -0.057559967041015625, 0.039306640625, -0.53204345703125, 0.002956390380859375, 0.900634765625, 0.3946819305419922, -0.16124343872070312, 0.1694793701171875, -0.2858409881591797, -0.1116790771484375, -0.13444137573242188, 0.17803192138671875, -0.32025909423828125, 0.09354019165039062, -0.15690231323242188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000027.npy"} +{"epoch": 0.04081632653061224, "step": 28, "batch_size": 64, "mean": -0.0014629065990447998, "std": 0.3271964490413666, "min": -1.1375579833984375, "p10": -0.36187686920166007, "median": 0.027330398559570312, "p90": 0.4008281707763672, "max": 0.8732376098632812, "pos_frac": 0.546875, "sample": [0.09465789794921875, 0.16046142578125, -0.639068603515625, 0.4018592834472656, 0.133941650390625, -0.053173065185546875, -0.150970458984375, 0.11547088623046875, 0.276641845703125, 0.4169464111328125, -0.042755126953125, 0.08896636962890625, 0.07605743408203125, -0.00716400146484375, -0.541748046875, -0.20821380615234375, -0.23908615112304688, -0.28531837463378906, 0.11183547973632812, 0.3984222412109375, 0.45072174072265625, -0.26908111572265625, -0.020341873168945312, 0.08852386474609375, -0.0066070556640625, 0.060993194580078125, -0.16768264770507812, -0.00856781005859375, -1.1375579833984375, 0.0240325927734375, -0.6459579467773438, 0.022457122802734375, 0.015445709228515625, 0.2602081298828125, 0.222808837890625, 0.43735504150390625, -0.006832122802734375, -0.2476348876953125, -0.4028778076171875, -0.2837371826171875, 0.03963279724121094, -0.25559234619140625, -0.3946876525878906, 0.18059539794921875, 0.31740570068359375, -0.16085243225097656, 0.21374893188476562, -0.7603530883789062, -0.07771492004394531, 0.030628204345703125, 0.469085693359375, 0.8732376098632812, 0.10520362854003906, 0.1489715576171875, 0.415771484375, 0.3800506591796875, -0.17039108276367188, -0.14987945556640625, -0.27967071533203125, 0.1575641632080078, 0.037109375, 0.2933235168457031, 0.1558990478515625, -0.1561431884765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000028.npy"} +{"epoch": 0.042328042328042326, "step": 29, "batch_size": 64, "mean": 0.07004186511039734, "std": 0.29630810022354126, "min": -0.726959228515625, "p10": -0.2664455413818359, "median": 0.059894561767578125, "p90": 0.46548271179199224, "max": 0.6992034912109375, "pos_frac": 0.625, "sample": [-0.01448822021484375, -0.425262451171875, 0.643096923828125, -0.2716217041015625, 0.07647705078125, -0.2307262420654297, 0.3783721923828125, -0.0067005157470703125, -0.6902122497558594, -0.058746337890625, 0.09349250793457031, 0.4710502624511719, 0.07118988037109375, 0.17753219604492188, 0.45249176025390625, -0.19488525390625, -0.233306884765625, -0.18641281127929688, 0.39788818359375, 0.05582427978515625, 0.05847930908203125, 0.223480224609375, 0.30164337158203125, -0.07727622985839844, 0.2787017822265625, 0.561553955078125, 0.05260467529296875, -0.726959228515625, 0.414642333984375, 0.27890586853027344, 0.08177566528320312, -0.15069580078125, 0.1981201171875, 0.12291145324707031, 0.0482177734375, 0.1960010528564453, 0.09810638427734375, 0.05565643310546875, 0.23864173889160156, 0.6992034912109375, -0.15141677856445312, 0.022678375244140625, -0.30306053161621094, 0.4228477478027344, -0.10304450988769531, 0.21414947509765625, -0.2543678283691406, -0.0590972900390625, 0.041839599609375, 0.24493789672851562, 0.541595458984375, -0.1623382568359375, 0.5084114074707031, 0.1452350616455078, -0.2884521484375, -0.03845977783203125, -0.10182952880859375, 0.06581878662109375, 0.23819732666015625, 0.5395050048828125, -0.526397705078125, -0.0729217529296875, 0.061309814453125, 0.0387725830078125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000029.npy"} +{"epoch": 0.04383975812547241, "step": 30, "batch_size": 64, "mean": -0.049675971269607544, "std": 0.2572989761829376, "min": -0.598785400390625, "p10": -0.3749996185302734, "median": -0.06646156311035156, "p90": 0.2457496643066407, "max": 0.8201904296875, "pos_frac": 0.390625, "sample": [-0.17055892944335938, -0.06609725952148438, -0.39760589599609375, -0.38265228271484375, 0.025510787963867188, 0.2326812744140625, 0.08306312561035156, 0.10614776611328125, -0.25318145751953125, -0.4415435791015625, 0.08875274658203125, -0.395843505859375, -0.026828765869140625, -0.01023101806640625, -0.27362060546875, -0.103790283203125, -0.19570159912109375, 0.8201904296875, -0.15807723999023438, 0.15502166748046875, -0.01729583740234375, -0.061763763427734375, -0.18532180786132812, 0.03684043884277344, -0.22234344482421875, -0.143402099609375, 0.08754348754882812, -0.3571434020996094, 0.1627044677734375, 0.25135040283203125, -0.2857208251953125, -0.27166175842285156, -0.273193359375, 0.5926666259765625, -0.138336181640625, -0.08135223388671875, -0.1196441650390625, -0.1848621368408203, 0.31081390380859375, -0.24654769897460938, -0.08167266845703125, -0.036952972412109375, 0.457489013671875, -0.13646697998046875, -0.14365386962890625, -0.14713287353515625, 0.013671875, -0.19166183471679688, 0.07639503479003906, -0.598785400390625, -0.489166259765625, 0.28984832763671875, 0.32779884338378906, 0.16181182861328125, 0.13532257080078125, -0.11884307861328125, 0.221710205078125, 0.12714767456054688, -0.5670166015625, 0.03696441650390625, 0.049713134765625, -0.026340484619140625, -0.06682586669921875, 0.038417816162109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000030.npy"} +{"epoch": 0.045351473922902494, "step": 31, "batch_size": 64, "mean": 0.0262012779712677, "std": 0.30501872301101685, "min": -0.8401336669921875, "p10": -0.34798202514648435, "median": 0.029781341552734375, "p90": 0.4360298156738282, "max": 0.712158203125, "pos_frac": 0.53125, "sample": [0.2236480712890625, 0.46114349365234375, 0.04412841796875, 0.26598167419433594, -0.20290184020996094, -0.526123046875, -0.226898193359375, 0.061595916748046875, 0.712158203125, 0.39933013916015625, -0.12321281433105469, 0.6176986694335938, 0.3242168426513672, 0.366668701171875, 0.42359161376953125, 0.120941162109375, 0.46072959899902344, 0.02127838134765625, 0.4413604736328125, -0.04608154296875, -0.0858306884765625, -0.066070556640625, 0.08474159240722656, -0.07370948791503906, 0.18589019775390625, -0.40435791015625, 0.521697998046875, -0.11389923095703125, -0.18541717529296875, -0.168182373046875, 0.2407989501953125, -0.15191650390625, -0.47718048095703125, -0.2896232604980469, -0.019550323486328125, -0.004367828369140625, -0.32346343994140625, -0.17060089111328125, -0.11499595642089844, -0.2950572967529297, 0.13088226318359375, -0.4937896728515625, -0.22977447509765625, 0.0089569091796875, 0.153472900390625, 0.1404266357421875, -0.07374382019042969, -0.358489990234375, 0.06693649291992188, 0.11627197265625, -0.8401336669921875, -0.1325225830078125, 0.3868408203125, 0.04302215576171875, 0.14776611328125, 0.15410614013671875, 0.21824073791503906, 0.0382843017578125, -0.0018978118896484375, -0.02452850341796875, 0.6301651000976562, 0.15920448303222656, 0.058750152587890625, -0.52972412109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000031.npy"} +{"epoch": 0.04686318972033258, "step": 32, "batch_size": 64, "mean": 0.027545809745788574, "std": 0.29064273834228516, "min": -0.6551284790039062, "p10": -0.3900234222412109, "median": 0.06524181365966797, "p90": 0.3334106445312501, "max": 0.60699462890625, "pos_frac": 0.609375, "sample": [-0.0499267578125, 0.1609649658203125, -0.6551284790039062, 0.2733917236328125, -0.362335205078125, -0.07727432250976562, -0.108428955078125, -0.40683746337890625, 0.2833709716796875, 0.0973358154296875, 0.43463897705078125, 0.60699462890625, 0.13994216918945312, -0.2797698974609375, 0.28414154052734375, 0.147918701171875, 0.2243804931640625, 0.06940841674804688, -0.4018898010253906, 0.12909317016601562, 0.05453681945800781, -0.10507965087890625, 0.12519454956054688, 0.2939300537109375, 0.4456291198730469, -0.22505569458007812, 0.31247711181640625, 0.35524749755859375, -0.0067596435546875, 0.5631523132324219, 0.06107521057128906, 0.320465087890625, 0.084228515625, -0.0235137939453125, 0.25861358642578125, 0.29065704345703125, -0.25244903564453125, -0.3305931091308594, -0.078857421875, 0.338958740234375, 0.058269500732421875, 0.30499267578125, 0.22217559814453125, 0.01985931396484375, 0.07130241394042969, -0.11240386962890625, 0.08774375915527344, -0.5110702514648438, -0.493499755859375, 0.08559036254882812, 0.275604248046875, 0.20383834838867188, -0.229217529296875, 0.03293418884277344, 0.08623123168945312, -0.1771869659423828, -0.6021194458007812, 0.5986404418945312, -0.11630058288574219, 0.011987686157226562, -0.20037841796875, 0.01367950439453125, -0.537322998046875, -0.322265625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000032.npy"} +{"epoch": 0.04837490551776266, "step": 33, "batch_size": 64, "mean": 0.032418325543403625, "std": 0.37006300687789917, "min": -1.0313949584960938, "p10": -0.36003627777099606, "median": 0.03457355499267578, "p90": 0.49918212890625013, "max": 0.909271240234375, "pos_frac": 0.59375, "sample": [-0.1780853271484375, -0.62127685546875, 0.32627105712890625, -0.566162109375, -0.10111236572265625, -0.2368621826171875, 0.08296966552734375, 0.07081794738769531, 0.46759796142578125, 0.9014511108398438, 0.0921478271484375, 0.2895317077636719, -0.19060420989990234, -0.147430419921875, 0.7280807495117188, -0.70928955078125, -0.2462615966796875, 0.4295616149902344, 0.12602996826171875, 0.655181884765625, 0.01894378662109375, 0.909271240234375, 0.327880859375, 0.03373146057128906, -1.0313949584960938, 0.02764892578125, 0.6258544921875, 0.027782440185546875, 0.2064666748046875, -0.0506134033203125, 0.11191177368164062, -0.0659942626953125, 0.5227432250976562, -0.03558349609375, 0.0354156494140625, -0.012723922729492188, 0.11032295227050781, -0.2918853759765625, -0.25519561767578125, -0.5650157928466797, -0.3384246826171875, -0.20564651489257812, -0.08742904663085938, 0.1142578125, -0.3660736083984375, -0.2992095947265625, 0.4135284423828125, 0.09741592407226562, -0.10672187805175781, 0.11419296264648438, -0.3459491729736328, 0.124481201171875, 0.0080108642578125, 0.0903472900390625, 0.15750503540039062, 0.11320114135742188, 0.027935028076171875, 0.5127182006835938, -0.531402587890625, -0.3292236328125, 0.07693862915039062, 0.3185272216796875, 0.31661033630371094, 0.3770599365234375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000033.npy"} +{"epoch": 0.049886621315192746, "step": 34, "batch_size": 64, "mean": 0.07393822073936462, "std": 0.29819947481155396, "min": -0.7526397705078125, "p10": -0.2496221542358398, "median": 0.03618907928466797, "p90": 0.4594360351562501, "max": 0.7834014892578125, "pos_frac": 0.59375, "sample": [-0.09128952026367188, 0.6821441650390625, -0.2609100341796875, -0.05878448486328125, 0.3698844909667969, -0.02138519287109375, -0.020198822021484375, 0.4793434143066406, 0.3797588348388672, 0.23184967041015625, 0.20541763305664062, 0.470428466796875, 0.22217559814453125, -0.1390380859375, 0.0176239013671875, -0.3268585205078125, 0.1348876953125, 0.12547683715820312, 0.3161277770996094, 0.05264854431152344, -0.28708648681640625, -0.2232837677001953, -0.04023933410644531, 0.00995635986328125, 0.1498870849609375, 0.02770233154296875, 0.7834014892578125, 0.4305000305175781, -0.0588836669921875, -0.1678466796875, 0.1628265380859375, 0.3192634582519531, 0.13983917236328125, 0.12944984436035156, -0.10126876831054688, 0.437347412109375, -0.021484375, 0.19845199584960938, 0.09677886962890625, 0.2503395080566406, -0.4517059326171875, 0.04456329345703125, 0.11732864379882812, 0.2584705352783203, 0.7185821533203125, 0.2165985107421875, -0.7526397705078125, 0.4096641540527344, 0.009307861328125, 0.22208786010742188, 0.007335662841796875, -0.6559906005859375, 0.468902587890625, -0.1220245361328125, -0.20263290405273438, -0.3521766662597656, -0.14410400390625, -0.08852577209472656, -0.22324562072753906, 0.027814865112304688, 0.5438232421875, -0.0525054931640625, -0.20597076416015625, -0.06586456298828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000034.npy"} +{"epoch": 0.05139833711262283, "step": 35, "batch_size": 64, "mean": 0.00705409049987793, "std": 0.35035452246665955, "min": -0.6241912841796875, "p10": -0.47769393920898434, "median": 0.06374931335449219, "p90": 0.3938940048217774, "max": 1.1309814453125, "pos_frac": 0.5625, "sample": [0.2500762939453125, -0.49938201904296875, 0.38579368591308594, -0.19503021240234375, -0.33704376220703125, 0.13275146484375, 0.0113525390625, 0.2699756622314453, -0.17946624755859375, -0.4339122772216797, 0.300323486328125, 0.1275653839111328, 0.032085418701171875, 0.09852027893066406, -0.01018524169921875, 0.09389114379882812, 1.1309814453125, 0.209564208984375, 0.2122650146484375, 0.41888427734375, 0.13559913635253906, 0.049407958984375, 0.3973655700683594, 0.07809066772460938, 0.2546730041503906, 0.4116554260253906, -0.5807952880859375, -0.20165252685546875, 0.16421890258789062, -0.16646575927734375, -0.6142120361328125, 0.10242462158203125, -0.372528076171875, -0.36853790283203125, -0.20765304565429688, -0.31280517578125, -0.24708175659179688, -0.5640106201171875, 0.15793991088867188, -0.487396240234375, 0.13082504272460938, 0.24870872497558594, 0.7468490600585938, -0.5485916137695312, -0.20225906372070312, 0.31414031982421875, 0.37252044677734375, 0.3228912353515625, -0.07317733764648438, 0.2442493438720703, -0.323150634765625, -0.1927947998046875, 0.2198638916015625, -0.170745849609375, -0.45505523681640625, 0.22388458251953125, -0.1231689453125, -0.6241912841796875, 0.045421600341796875, 0.6246337890625, -0.19710350036621094, 0.4033966064453125, -0.3061027526855469, 0.12317085266113281], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000035.npy"} +{"epoch": 0.05291005291005291, "step": 36, "batch_size": 64, "mean": -0.0037604570388793945, "std": 0.32554805278778076, "min": -0.6224632263183594, "p10": -0.35969886779785154, "median": -0.032909393310546875, "p90": 0.3657419204711915, "max": 0.9949569702148438, "pos_frac": 0.46875, "sample": [-0.3119049072265625, 0.825469970703125, 0.0236053466796875, -0.3279991149902344, -0.17600250244140625, -0.3673057556152344, 0.26663970947265625, 0.10781478881835938, 0.3430004119873047, 0.25344085693359375, -0.1578521728515625, -0.3046836853027344, 0.1678924560546875, -0.5272216796875, -0.05256462097167969, -0.17998504638671875, 0.37548828125, -0.14632797241210938, 0.10362815856933594, 0.5955085754394531, -0.04969978332519531, -0.04720306396484375, -0.11956024169921875, 0.0072536468505859375, -0.07393646240234375, -0.47676849365234375, -0.17527389526367188, 0.23149871826171875, 0.0234222412109375, -0.008270263671875, 0.07318878173828125, 0.021266937255859375, -0.166839599609375, 0.379669189453125, -0.602691650390625, -0.6224632263183594, 0.07196807861328125, -0.0260772705078125, -0.2601890563964844, -0.4737281799316406, 0.14860153198242188, 0.094207763671875, 0.9949569702148438, -0.22957992553710938, 0.00386810302734375, 0.10256576538085938, 0.13321304321289062, 0.2661094665527344, -0.206939697265625, 0.9120101928710938, 0.39910888671875, -0.14152145385742188, 0.031414031982421875, -0.162078857421875, -0.21974563598632812, -0.27042388916015625, -0.03974151611328125, 0.319732666015625, -0.4676971435546875, -0.09242630004882812, -0.06530952453613281, 0.28375244140625, -0.341949462890625, 0.09099578857421875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000036.npy"} +{"epoch": 0.05442176870748299, "step": 37, "batch_size": 64, "mean": 0.14793086051940918, "std": 0.34940940141677856, "min": -0.778289794921875, "p10": -0.2674240112304687, "median": 0.1704559326171875, "p90": 0.6230422973632813, "max": 1.20269775390625, "pos_frac": 0.75, "sample": [0.050048828125, 0.7100296020507812, 0.2147216796875, 0.39614105224609375, 0.709228515625, 0.003612518310546875, 0.033191680908203125, 0.04087066650390625, 0.11700439453125, 0.19181442260742188, 0.03375244140625, 0.2279815673828125, 0.46173095703125, 0.4847259521484375, -0.24993896484375, -0.539031982421875, 0.05478858947753906, 0.43720245361328125, 0.2553138732910156, 0.2432861328125, -0.1446208953857422, -0.2942924499511719, -0.5398406982421875, 0.25344085693359375, 0.227691650390625, 0.19372940063476562, 0.08937835693359375, -0.026668548583984375, 0.02509307861328125, 0.16251373291015625, -0.778289794921875, -0.41037750244140625, 0.344512939453125, 0.673858642578125, 0.8802490234375, 0.23339080810546875, 0.20987701416015625, 0.024019241333007812, -0.40482521057128906, 0.028350830078125, 1.20269775390625, -0.2277984619140625, 0.2659149169921875, 0.2230224609375, 0.03882598876953125, -0.05142784118652344, 0.190460205078125, 0.633392333984375, 0.5988922119140625, 0.83154296875, 0.0101470947265625, 0.04755401611328125, -0.06694793701171875, -0.09216499328613281, 0.17839813232421875, 0.11185455322265625, 0.36495208740234375, 0.2522735595703125, 0.190338134765625, -0.2749176025390625, 0.443939208984375, -0.03002166748046875, -0.24813079833984375, 0.2511138916015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000037.npy"} +{"epoch": 0.055933484504913075, "step": 38, "batch_size": 64, "mean": 0.0001119077205657959, "std": 0.37784868478775024, "min": -0.756134033203125, "p10": -0.4995227813720703, "median": -0.0031118392944335938, "p90": 0.5136001586914063, "max": 0.9199485778808594, "pos_frac": 0.5, "sample": [0.012470245361328125, 0.14210891723632812, 0.6531143188476562, 0.9199485778808594, -0.18443679809570312, 0.49625396728515625, 0.09549903869628906, 0.7384300231933594, -0.5071868896484375, -0.2642364501953125, -0.16999053955078125, 0.00457000732421875, 0.22286033630371094, 0.08946418762207031, -0.23476409912109375, -0.1468048095703125, -0.12451934814453125, 0.0037937164306640625, -0.38072967529296875, -0.07024383544921875, -0.14653778076171875, 0.0716552734375, -0.2420654296875, -0.7007980346679688, 0.304229736328125, 0.1356658935546875, 0.44475555419921875, -0.5916290283203125, -0.37177276611328125, 0.0595703125, -0.1661968231201172, 0.27532958984375, 0.1658191680908203, 0.16719436645507812, 0.6361160278320312, 0.5210342407226562, 0.1133880615234375, -0.6398544311523438, 0.10378646850585938, 0.13185882568359375, 0.32154083251953125, -0.34763336181640625, -0.17063140869140625, -0.07941055297851562, 0.042316436767578125, -0.4816398620605469, -0.20279693603515625, -0.3766899108886719, 0.8021736145019531, 0.39361572265625, -0.756134033203125, -0.21335601806640625, 0.7589874267578125, -0.6551513671875, -0.04543113708496094, 0.2648029327392578, -0.0144500732421875, -0.106964111328125, -0.6385498046875, -0.01001739501953125, 0.09572219848632812, -0.2459716796875, 0.16901397705078125, -0.06333351135253906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000038.npy"} +{"epoch": 0.05744520030234316, "step": 39, "batch_size": 64, "mean": 0.007851779460906982, "std": 0.326423317193985, "min": -0.7481708526611328, "p10": -0.39921607971191403, "median": 0.03482532501220703, "p90": 0.38047504425048834, "max": 0.729461669921875, "pos_frac": 0.53125, "sample": [0.236358642578125, -0.07099533081054688, -0.197662353515625, 0.12405967712402344, -0.4034423828125, -0.7226104736328125, 0.41211700439453125, 0.3242607116699219, -0.0932464599609375, 0.15235137939453125, 0.226104736328125, -0.2432537078857422, 0.13091659545898438, 0.025293350219726562, -0.14892578125, 0.3871498107910156, -0.2255535125732422, 0.20594215393066406, 0.3649005889892578, 0.122833251953125, -0.7481708526611328, -0.307373046875, -0.12688827514648438, -0.038516998291015625, 0.493072509765625, 0.07571029663085938, -0.56463623046875, 0.2675018310546875, -0.12665557861328125, -0.3893547058105469, 0.14899826049804688, 0.3622589111328125, 0.3277435302734375, -0.24402618408203125, 0.058319091796875, 0.3601570129394531, 0.09539031982421875, 0.35150146484375, -0.5871162414550781, -0.5596847534179688, 0.2062530517578125, -0.666412353515625, -0.18646240234375, 0.2342987060546875, 0.063720703125, -0.054164886474609375, 0.0443572998046875, -0.16937255859375, 0.4569358825683594, 0.01398468017578125, 0.729461669921875, -0.252716064453125, -0.047725677490234375, -0.06528472900390625, -0.22768402099609375, -0.276336669921875, 0.5252857208251953, 0.591094970703125, 0.34362030029296875, -0.15768051147460938, 0.08982467651367188, 0.2230243682861328, -0.14439964294433594, -0.2259368896484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000039.npy"} +{"epoch": 0.05895691609977324, "step": 40, "batch_size": 64, "mean": -0.020780310034751892, "std": 0.31510892510414124, "min": -0.7749862670898438, "p10": -0.43318824768066405, "median": -0.0017423629760742188, "p90": 0.32824134826660156, "max": 0.6095428466796875, "pos_frac": 0.5, "sample": [0.26937103271484375, 0.6095428466796875, -0.06254959106445312, 0.01432037353515625, 0.22247314453125, 0.12001609802246094, 0.31403350830078125, -0.04929351806640625, -0.4003143310546875, 0.11700439453125, 0.33484649658203125, 0.12783241271972656, -0.21691131591796875, -0.10539627075195312, -0.142791748046875, -0.1998748779296875, 0.09710693359375, 0.13379669189453125, 0.24271583557128906, -0.04304695129394531, -0.06995773315429688, -0.0430450439453125, 0.3117790222167969, 0.3307533264160156, 0.1149444580078125, -0.09674072265625, 0.12070083618164062, -0.28421783447265625, -0.6461639404296875, -0.017805099487304688, 0.07439422607421875, -0.7440414428710938, 0.380889892578125, -0.32297515869140625, 0.108062744140625, 0.19343090057373047, 0.31488037109375, 0.29340553283691406, -0.39299774169921875, 0.3056793212890625, -0.10942268371582031, 0.387908935546875, 0.29413604736328125, -0.568756103515625, -0.7749862670898438, 0.3704643249511719, -0.07401084899902344, -0.21966934204101562, -0.3839912414550781, -0.1440277099609375, 0.41278076171875, 0.089385986328125, -0.3126106262207031, 0.210968017578125, -0.15227508544921875, -0.4472770690917969, -0.608551025390625, -0.18773651123046875, -0.6768798828125, -0.30522918701171875, 0.12196922302246094, 0.32238006591796875, 0.2324371337890625, -0.1208038330078125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000040.npy"} +{"epoch": 0.06046863189720333, "step": 41, "batch_size": 64, "mean": 0.09139147400856018, "std": 0.3836233615875244, "min": -0.786285400390625, "p10": -0.3840232849121093, "median": 0.07900047302246094, "p90": 0.5670700073242191, "max": 1.4370269775390625, "pos_frac": 0.625, "sample": [0.37361907958984375, -0.03537750244140625, 0.05524444580078125, -0.4899444580078125, -0.21905517578125, 0.605926513671875, -0.23998260498046875, 0.7570114135742188, 0.01702880859375, -0.4284019470214844, 0.187896728515625, 0.16183090209960938, 0.09568023681640625, 0.4912872314453125, 0.128753662109375, 0.4627532958984375, 0.10240936279296875, 0.1291046142578125, -0.07451629638671875, -0.16602134704589844, 0.59954833984375, -0.0527801513671875, -0.037303924560546875, 0.21497344970703125, -0.037395477294921875, -0.2640533447265625, -0.4710540771484375, 0.1780548095703125, 0.01056671142578125, -0.1439208984375, 0.018121719360351562, 0.869873046875, 1.4370269775390625, 0.37087249755859375, -0.07119178771972656, -0.5125198364257812, 0.2792015075683594, -0.32617950439453125, 0.6397476196289062, 0.0033245086669921875, -0.13876724243164062, -0.786285400390625, 0.062320709228515625, 0.12575531005859375, 0.1807098388671875, -0.2277965545654297, 0.046001434326171875, 0.1477508544921875, 0.9378280639648438, 0.22409820556640625, -0.4088134765625, 0.21124267578125, -0.3196258544921875, -0.661376953125, -0.032527923583984375, 0.108673095703125, 0.28403472900390625, 0.2464752197265625, 0.34851646423339844, 0.0253448486328125, 0.1789703369140625, 0.466583251953125, 0.39247703552246094, -0.1826934814453125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000041.npy"} +{"epoch": 0.06198034769463341, "step": 42, "batch_size": 64, "mean": 0.010489404201507568, "std": 0.4226493239402771, "min": -1.0410842895507812, "p10": -0.43574676513671873, "median": -0.0031671524047851562, "p90": 0.5303871154785157, "max": 1.405181884765625, "pos_frac": 0.5, "sample": [1.405181884765625, 0.716156005859375, -0.3023223876953125, -0.178466796875, -0.16999053955078125, -0.8917236328125, -0.06153297424316406, -0.13006210327148438, -0.3481597900390625, 0.0391845703125, -0.5691261291503906, -0.0984649658203125, -0.21509933471679688, -0.27478790283203125, 0.14162445068359375, 0.16372299194335938, 0.4653778076171875, 0.5139007568359375, 0.029760360717773438, 0.3246269226074219, -0.07390975952148438, 0.4483184814453125, 0.39971923828125, 0.13529205322265625, -0.6187057495117188, -0.41439056396484375, 0.30954742431640625, -0.13224029541015625, -0.26910400390625, -0.14455604553222656, -0.22412490844726562, 0.2171001434326172, -0.30115699768066406, -0.31172943115234375, 0.6735038757324219, 0.11907958984375, 0.5374526977539062, 0.2743072509765625, -1.0410842895507812, 0.14865875244140625, -0.3258018493652344, -0.31777191162109375, -0.421295166015625, -0.7883758544921875, -0.23155975341796875, 0.0475311279296875, 0.11641693115234375, 0.0691375732421875, 0.061908721923828125, -0.4419403076171875, 0.1430683135986328, 0.36917877197265625, 0.24727630615234375, -0.03609466552734375, 0.5634098052978516, -0.0689239501953125, -0.58538818359375, -0.039043426513671875, 0.865264892578125, -0.036228179931640625, 0.3651237487792969, 0.2539653778076172, 0.03163909912109375, 0.5380477905273438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000042.npy"} +{"epoch": 0.06349206349206349, "step": 43, "batch_size": 64, "mean": 0.07060915231704712, "std": 0.42092418670654297, "min": -1.2113037109375, "p10": -0.4433650970458984, "median": 0.11067485809326172, "p90": 0.6535800933837891, "max": 0.819976806640625, "pos_frac": 0.578125, "sample": [0.36472320556640625, 0.08939361572265625, -1.2113037109375, -0.08522796630859375, 0.01331329345703125, -0.5099849700927734, -0.04974365234375, 0.07254600524902344, -0.2551727294921875, -0.4560279846191406, 0.2609367370605469, 0.120513916015625, -0.04876708984375, -0.18011474609375, 0.819976806640625, 0.170166015625, 0.6715507507324219, 0.17917633056640625, 0.1361217498779297, 0.09272003173828125, 0.3509807586669922, -0.16248321533203125, -0.3160247802734375, -0.3277549743652344, 0.7270584106445312, -0.03567695617675781, 0.2532787322998047, 0.13518524169921875, 0.17392349243164062, 0.401092529296875, 0.6654052734375, -0.413818359375, 0.2516632080078125, -0.390289306640625, 0.10083580017089844, 0.280517578125, 0.6381378173828125, -0.30982208251953125, 0.7686080932617188, 0.5055618286132812, 0.135345458984375, -0.19076156616210938, -0.07570648193359375, -1.017852783203125, 0.1345653533935547, 0.7721405029296875, -0.08530426025390625, 0.2569007873535156, -0.06826400756835938, 0.5606956481933594, 0.29367828369140625, 0.6274337768554688, 0.162261962890625, -0.23517608642578125, 0.3712120056152344, 0.29624176025390625, -0.4740772247314453, 0.6601982116699219, 0.5711669921875, -0.2369384765625, -0.704742431640625, -0.02114105224609375, -0.1699657440185547, -0.5340995788574219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000043.npy"} +{"epoch": 0.06500377928949358, "step": 44, "batch_size": 64, "mean": 0.04925870895385742, "std": 0.43301987648010254, "min": -1.1612625122070312, "p10": -0.4908187866210937, "median": 0.08185291290283203, "p90": 0.49897842407226567, "max": 1.2504196166992188, "pos_frac": 0.578125, "sample": [-0.5381908416748047, -0.14547348022460938, -0.6384353637695312, -0.08871841430664062, 0.4069061279296875, 0.1549072265625, 0.597076416015625, -0.2860565185546875, -0.33038330078125, -0.5195388793945312, -0.21776962280273438, 0.6877899169921875, -0.7180328369140625, 0.1806793212890625, 0.23886871337890625, -0.5593643188476562, -0.2742443084716797, 0.20519065856933594, 0.06453514099121094, 0.03302955627441406, -0.07856369018554688, 0.8590583801269531, 0.45989418029785156, 0.12917327880859375, 0.1492290496826172, 0.586822509765625, -0.09381103515625, -0.2613067626953125, 0.2716827392578125, -0.390594482421875, 0.2626800537109375, 0.4111976623535156, 0.37090301513671875, 0.0244293212890625, 0.019727706909179688, 0.24645042419433594, 1.2504196166992188, 0.34439659118652344, -0.264251708984375, -0.1728515625, -0.029138565063476562, -0.23979568481445312, 0.3128204345703125, 0.01421356201171875, 0.40921783447265625, 0.50335693359375, -0.160797119140625, 0.2377166748046875, -0.22100830078125, 0.13957977294921875, -1.1612625122070312, 0.09917068481445312, 0.48876190185546875, -0.349212646484375, -0.10702133178710938, 0.24694061279296875, 0.18704986572265625, 1.0385894775390625, 0.3598194122314453, 0.46869659423828125, 0.1668548583984375, -0.42380523681640625, -0.3991851806640625, -0.8064651489257812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000044.npy"} +{"epoch": 0.06651549508692366, "step": 45, "batch_size": 64, "mean": 0.10806754231452942, "std": 0.417008638381958, "min": -0.8307571411132812, "p10": -0.4434761047363281, "median": 0.11849212646484375, "p90": 0.6176582336425782, "max": 1.06134033203125, "pos_frac": 0.59375, "sample": [-0.1641998291015625, -0.49602508544921875, 0.44477081298828125, 0.0411224365234375, -0.0013561248779296875, -0.8146743774414062, -0.0057430267333984375, 0.13067626953125, 0.3208160400390625, -0.6856842041015625, 0.163543701171875, 0.7042922973632812, 0.3300514221191406, 0.32604217529296875, 0.047588348388671875, 0.26743316650390625, 0.1814899444580078, -0.462310791015625, -0.5621566772460938, 0.6279373168945312, 0.3808746337890625, -0.348236083984375, 0.30420875549316406, -0.1250896453857422, -0.05307769775390625, 1.005035400390625, -0.148223876953125, -0.026882171630859375, 0.6619796752929688, 0.5767936706542969, -0.094207763671875, 1.06134033203125, -0.47783660888671875, 0.4253349304199219, 0.208740234375, 1.0293121337890625, -0.29875755310058594, 0.21820068359375, -0.39952850341796875, 0.285491943359375, -0.8307571411132812, 0.2469635009765625, -0.0323486328125, -0.23435592651367188, 0.223968505859375, 0.06885528564453125, 0.2137908935546875, -0.049785614013671875, -0.22216796875, 0.56982421875, -0.27732086181640625, 0.38361358642578125, 0.24028778076171875, 0.00266265869140625, -0.24459075927734375, 0.489166259765625, 0.8035125732421875, 0.19936370849609375, 0.1063079833984375, 0.0010662078857421875, -0.18299102783203125, 0.443359375, 0.5936737060546875, -0.17486190795898438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000045.npy"} +{"epoch": 0.06802721088435375, "step": 46, "batch_size": 64, "mean": 0.1649779975414276, "std": 0.3971222937107086, "min": -0.7170791625976562, "p10": -0.2717355728149414, "median": 0.14553165435791016, "p90": 0.6864753723144532, "max": 1.0256500244140625, "pos_frac": 0.625, "sample": [0.48644256591796875, -0.612457275390625, -0.7170791625976562, 0.16158294677734375, 0.318145751953125, 0.08087158203125, -0.0097503662109375, 0.14409255981445312, 0.0710296630859375, -0.4210205078125, 0.6916160583496094, 0.22211837768554688, 0.4884490966796875, 0.38519287109375, -0.10350799560546875, -0.1760101318359375, -0.188232421875, 0.13418960571289062, 0.2983722686767578, 0.4406890869140625, 0.08522224426269531, 0.9649658203125, -0.01085662841796875, 0.4838104248046875, 0.1805267333984375, -0.037506103515625, 0.5995407104492188, 0.9329376220703125, 0.15522003173828125, 0.17523193359375, -0.6215667724609375, 0.23748016357421875, -0.008056640625, -0.11437225341796875, -0.2802448272705078, 0.651641845703125, 0.13765907287597656, 0.21187782287597656, -0.49620819091796875, 0.9341583251953125, 0.20931243896484375, -0.1129302978515625, 0.29293060302734375, 0.18648529052734375, 0.6744804382324219, -0.03984832763671875, -0.05657958984375, -0.036312103271484375, -0.29892730712890625, 0.22667694091796875, 0.3847942352294922, 0.02399444580078125, -0.2518806457519531, 0.048954010009765625, 0.2604827880859375, 0.9677886962890625, -0.2206268310546875, -0.1413421630859375, -0.12855148315429688, 1.0058746337890625, 0.5269088745117188, 0.1469707489013672, -0.01190948486328125, 1.0256500244140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000046.npy"} +{"epoch": 0.06953892668178382, "step": 47, "batch_size": 64, "mean": 0.13176396489143372, "std": 0.3814322352409363, "min": -0.8818130493164062, "p10": -0.2871948242187499, "median": 0.1335601806640625, "p90": 0.5525650024414063, "max": 0.858642578125, "pos_frac": 0.6875, "sample": [0.4273109436035156, -0.10222625732421875, 0.3675193786621094, 0.01978302001953125, 0.8494491577148438, 0.1917438507080078, 0.015539169311523438, 0.19654083251953125, -0.13844680786132812, 0.5556869506835938, 0.10949897766113281, -0.07408905029296875, -0.0767669677734375, -0.731842041015625, -0.13665008544921875, 0.23408889770507812, 0.4663276672363281, 0.0788116455078125, 0.1335296630859375, -0.20003890991210938, 0.19826126098632812, 0.45015716552734375, 0.0083160400390625, 0.110260009765625, -0.21304702758789062, 0.1335906982421875, 0.07400703430175781, 0.20024681091308594, -0.0438232421875, 0.033538818359375, -0.31330108642578125, 0.5346622467041016, -0.21543121337890625, 0.64453125, -0.83282470703125, 0.19549560546875, 0.3938140869140625, 0.322357177734375, 0.5199413299560547, 0.5316848754882812, -0.4163818359375, 0.05699920654296875, -0.10338592529296875, 0.413818359375, 0.4223518371582031, 0.21809005737304688, 0.858642578125, 0.16841888427734375, 0.4415454864501953, 0.6046581268310547, -0.22628021240234375, 0.5452804565429688, -0.6833953857421875, -0.8818130493164062, -0.41957855224609375, 0.689605712890625, 0.08485603332519531, 0.8133468627929688, 0.5274200439453125, 0.06365966796875, 0.31418609619140625, 0.25412750244140625, -0.15240478515625, -0.07908058166503906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000047.npy"} +{"epoch": 0.0710506424792139, "step": 48, "batch_size": 64, "mean": 0.02435573935508728, "std": 0.465448260307312, "min": -1.0857086181640625, "p10": -0.4718841552734375, "median": -0.003101348876953125, "p90": 0.605232620239258, "max": 1.3580398559570312, "pos_frac": 0.484375, "sample": [0.07063674926757812, -0.37641143798828125, 0.26184844970703125, 0.4282951354980469, 0.0435943603515625, 0.5659446716308594, 0.07501220703125, -0.0282135009765625, -0.467803955078125, 0.116363525390625, 0.27899932861328125, 0.2613658905029297, -0.32762908935546875, -0.4757843017578125, 0.30518341064453125, 0.926849365234375, 0.6220703125, 0.12786102294921875, -0.726531982421875, 0.47734832763671875, -0.07450485229492188, -0.2845916748046875, -0.45323944091796875, 0.6532058715820312, 0.177001953125, 0.27048492431640625, 0.2801361083984375, 0.3063850402832031, -0.327056884765625, 1.0075912475585938, -0.25829315185546875, 0.0500030517578125, -0.4736328125, 0.06584930419921875, 0.47783660888671875, -0.03008270263671875, -0.3105926513671875, -0.10651016235351562, 0.5167980194091797, -0.3248767852783203, -0.36986732482910156, -0.3655242919921875, -0.001739501953125, 0.04147911071777344, -0.8974075317382812, -0.00446319580078125, 0.4722003936767578, 0.6555099487304688, -0.1693115234375, -0.4289588928222656, -0.120025634765625, -0.2538604736328125, -0.4078960418701172, 0.4197101593017578, -0.38951873779296875, 0.3609638214111328, 1.3580398559570312, -0.07215309143066406, -0.6141204833984375, -0.22555923461914062, -0.01361083984375, 0.903961181640625, -0.5542812347412109, -1.0857086181640625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000048.npy"} +{"epoch": 0.07256235827664399, "step": 49, "batch_size": 64, "mean": 0.13957056403160095, "std": 0.470011830329895, "min": -1.1416168212890625, "p10": -0.4132041931152342, "median": 0.15933895111083984, "p90": 0.5788078308105469, "max": 1.998199462890625, "pos_frac": 0.671875, "sample": [0.0090179443359375, -0.159149169921875, 0.22216033935546875, -0.0871734619140625, 0.17024993896484375, -0.1651458740234375, -0.14385414123535156, 0.5602169036865234, 0.2798004150390625, 0.2746925354003906, 0.14864349365234375, -0.23391342163085938, 0.511138916015625, 0.579071044921875, -0.23019981384277344, -0.26145172119140625, -0.4870471954345703, 0.33621978759765625, -0.016269683837890625, -0.94940185546875, 0.40712547302246094, 0.03966712951660156, 0.1529521942138672, 0.2512359619140625, 0.14783477783203125, 0.35802459716796875, 0.2138824462890625, 0.34554481506347656, 0.13234710693359375, -0.5058746337890625, 0.2478656768798828, 0.13437652587890625, 0.27042388916015625, 0.873199462890625, 0.34539222717285156, 0.381500244140625, 0.219146728515625, -0.1504058837890625, 0.5964508056640625, 1.196136474609375, 0.203704833984375, -0.15709304809570312, -0.0795745849609375, -0.2155609130859375, -0.5404129028320312, 0.41616058349609375, 0.1657257080078125, 0.4048118591308594, 0.07291412353515625, 0.055881500244140625, 0.7413406372070312, 0.7390365600585938, -1.1416168212890625, -0.16927337646484375, -0.24628829956054688, -0.478240966796875, 0.4863929748535156, 1.998199462890625, 0.5781936645507812, 0.11612510681152344, 0.3254852294921875, 0.09175872802734375, 0.29400634765625, -0.74359130859375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000049.npy"} +{"epoch": 0.07407407407407407, "step": 50, "batch_size": 64, "mean": 0.11145466566085815, "std": 0.41129276156425476, "min": -0.68853759765625, "p10": -0.3435249328613281, "median": 0.07257270812988281, "p90": 0.5606197357177737, "max": 1.1772537231445312, "pos_frac": 0.625, "sample": [0.5019454956054688, 0.358489990234375, -0.59423828125, 0.057064056396484375, 0.14488983154296875, 0.224578857421875, 0.0152587890625, -0.32686614990234375, 1.0926742553710938, 0.4355735778808594, 0.1897563934326172, 0.9945831298828125, -0.33367919921875, -0.15093612670898438, -0.07531356811523438, -0.4766674041748047, 0.169677734375, 0.2779197692871094, 0.5857658386230469, 0.2886962890625, 0.0218048095703125, 0.12233734130859375, -0.05390739440917969, -0.34360504150390625, 0.02315521240234375, 0.978515625, -0.0375518798828125, 0.1464691162109375, 0.09662628173828125, 0.0354461669921875, 0.3387031555175781, 0.1549091339111328, 0.4293384552001953, 0.3226947784423828, -0.38887786865234375, -0.056182861328125, 0.42938232421875, 1.1772537231445312, 0.03692436218261719, -0.17852783203125, 1.0552978515625, 1.00762939453125, -0.1880340576171875, -0.41130828857421875, -0.2204723358154297, 0.3051910400390625, -0.31587982177734375, 0.08808135986328125, -0.28095245361328125, 0.3187255859375, 0.3185462951660156, -0.1172332763671875, 0.00850677490234375, 0.0944671630859375, 0.4596385955810547, -0.68853759765625, -0.414764404296875, -0.0296783447265625, -0.22103118896484375, -0.3128814697265625, 0.16859817504882812, -0.3433380126953125, 0.2140216827392578, 0.004425048828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000050.npy"} +{"epoch": 0.07558578987150416, "step": 51, "batch_size": 64, "mean": 0.19032499194145203, "std": 0.5450688004493713, "min": -1.11004638671875, "p10": -0.34324798583984373, "median": 0.12278366088867188, "p90": 0.7856891632080079, "max": 2.24749755859375, "pos_frac": 0.59375, "sample": [0.7772216796875, 0.20092201232910156, -0.04407501220703125, -0.2955322265625, -0.20458221435546875, 0.7731246948242188, 0.067352294921875, 0.4930458068847656, -0.41463279724121094, -0.11502838134765625, 0.10432815551757812, 0.4913673400878906, -0.30870819091796875, 0.9446792602539062, -0.01513671875, 0.331298828125, 0.31884002685546875, -0.0885009765625, 0.13654327392578125, 2.24749755859375, 0.27246856689453125, 0.45909690856933594, 0.4612846374511719, 0.1090240478515625, 0.5155868530273438, -0.3333892822265625, -0.34747314453125, -0.574676513671875, -0.07543182373046875, 0.3439369201660156, 0.08050537109375, 0.6794586181640625, -0.01575469970703125, 0.5435333251953125, -1.11004638671875, -0.2784690856933594, 0.18953323364257812, -0.15340042114257812, -0.305389404296875, 0.015350341796875, -0.143310546875, -0.5829925537109375, 0.7893180847167969, 0.992462158203125, 0.5519943237304688, -0.20844650268554688, -0.5039482116699219, 1.1885986328125, 0.2315216064453125, 1.3882980346679688, 0.39720726013183594, 0.37432861328125, 0.4919891357421875, -0.123260498046875, 0.0618743896484375, -0.1746807098388672, -0.10666656494140625, 1.3154296875, 0.23865318298339844, 0.184783935546875, -0.7447128295898438, 0.4575347900390625, 0.37172508239746094, -0.14267349243164062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000051.npy"} +{"epoch": 0.07709750566893424, "step": 52, "batch_size": 64, "mean": 0.19649244844913483, "std": 0.5858774781227112, "min": -0.9342269897460938, "p10": -0.4411275863647461, "median": 0.124481201171875, "p90": 0.876451110839844, "max": 2.3634490966796875, "pos_frac": 0.609375, "sample": [1.206390380859375, 0.447418212890625, 0.72833251953125, 0.6167144775390625, 0.6194839477539062, 0.32708740234375, 0.4668159484863281, -0.16039657592773438, -0.234893798828125, 1.4072265625, 1.5089569091796875, 0.47846221923828125, -0.268829345703125, 0.814788818359375, 0.9242401123046875, -0.8448486328125, 0.46967315673828125, -0.21549224853515625, -0.08443450927734375, -0.2868175506591797, -0.2995033264160156, -0.17405319213867188, 0.3850059509277344, -0.014234542846679688, 0.4093017578125, 0.707763671875, -0.5562286376953125, 0.07971763610839844, 0.2361297607421875, 0.12240219116210938, 0.21686172485351562, -0.728729248046875, 0.04544830322265625, -0.4388751983642578, 0.13373184204101562, 0.9028778076171875, 0.036224365234375, 0.21688079833984375, 0.0522308349609375, -0.1968231201171875, -0.2350139617919922, 0.377227783203125, 0.18201637268066406, 0.36807823181152344, -0.11381912231445312, 0.41010284423828125, -0.06288433074951172, -0.23621368408203125, 2.3634490966796875, -0.4420928955078125, 0.7038612365722656, -0.8301773071289062, -0.6938438415527344, 0.6348495483398438, 0.28322601318359375, -0.9342269897460938, 1.0113677978515625, -0.023464202880859375, 0.67315673828125, 0.011461257934570312, 0.12656021118164062, 0.055637359619140625, -0.10596466064453125, -0.0037841796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000052.npy"} +{"epoch": 0.07860922146636433, "step": 53, "batch_size": 64, "mean": 0.18445560336112976, "std": 0.46792739629745483, "min": -1.22607421875, "p10": -0.3811729431152343, "median": 0.1915273666381836, "p90": 0.7845436096191407, "max": 1.17919921875, "pos_frac": 0.640625, "sample": [0.3186149597167969, 0.8519020080566406, 1.085906982421875, 0.088653564453125, 0.3496856689453125, 0.3317985534667969, 0.390777587890625, 0.4029083251953125, 0.14948654174804688, -0.4121742248535156, 0.18012237548828125, -0.400909423828125, 0.003509521484375, 0.6129837036132812, -0.0760650634765625, 0.25691986083984375, 0.223480224609375, 1.17919921875, -0.07911872863769531, -0.29436492919921875, 0.2582225799560547, 0.05345916748046875, 0.5111618041992188, 0.10325241088867188, -1.22607421875, 0.7295913696289062, -0.2311382293701172, 0.5032424926757812, 0.7246952056884766, 0.2790641784667969, 0.2688274383544922, -0.5275115966796875, -0.3313026428222656, -0.33512115478515625, 0.3400230407714844, 0.80712890625, 0.46175384521484375, 1.0138015747070312, -0.16397666931152344, -0.18673133850097656, -0.0015811920166015625, -0.248199462890625, 0.6800098419189453, -0.8761138916015625, 0.7503585815429688, 0.613372802734375, -0.05466461181640625, 0.26204681396484375, 0.5370750427246094, 0.7991943359375, -0.1125335693359375, 0.49790191650390625, -0.21867942810058594, 0.6578521728515625, -0.14214324951171875, -0.4058647155761719, 0.9575042724609375, -0.4490509033203125, 0.1195220947265625, -0.019376754760742188, -0.0279998779296875, 0.04579925537109375, 0.022111892700195312, 0.20293235778808594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000053.npy"} +{"epoch": 0.0801209372637944, "step": 54, "batch_size": 64, "mean": 0.15835073590278625, "std": 0.5420072674751282, "min": -1.5352516174316406, "p10": -0.3925331115722656, "median": 0.1025238037109375, "p90": 0.7600374221801759, "max": 2.4225006103515625, "pos_frac": 0.625, "sample": [0.9503631591796875, 1.5955963134765625, -0.00861358642578125, 0.2561664581298828, -0.06778335571289062, -0.4234771728515625, 0.7309513092041016, 0.45932769775390625, 0.6626777648925781, -0.5636329650878906, -0.3458404541015625, -0.053592681884765625, 0.282928466796875, -1.5352516174316406, -0.12606048583984375, -0.03816795349121094, 0.678314208984375, 0.3905487060546875, 0.3312339782714844, -0.0284423828125, 0.018768310546875, 2.4225006103515625, 0.12093544006347656, 0.6445579528808594, 0.2218780517578125, 0.8569126129150391, 0.3090553283691406, 0.087677001953125, 0.0732421875, -0.0638580322265625, 0.05077362060546875, 0.07165908813476562, -0.48528289794921875, -0.3810882568359375, 0.2803668975830078, 0.11737060546875, 0.0379638671875, -0.01372528076171875, 0.8730201721191406, 0.7725028991699219, 0.18519973754882812, -0.0111541748046875, -0.0121917724609375, 0.2412109375, -0.3110809326171875, 0.48229217529296875, 0.5865554809570312, 0.17376327514648438, -0.09702301025390625, 0.11792755126953125, -0.075103759765625, -0.697021484375, 0.186279296875, 0.17456436157226562, 0.363983154296875, -0.3561515808105469, 0.13307762145996094, -0.3448963165283203, 0.7883949279785156, 0.03054046630859375, -0.39743804931640625, 0.0386199951171875, 0.265594482421875, -0.4939708709716797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000054.npy"} +{"epoch": 0.08163265306122448, "step": 55, "batch_size": 64, "mean": 0.27443674206733704, "std": 0.7423748970031738, "min": -1.79083251953125, "p10": -0.4484128952026367, "median": 0.2318859100341797, "p90": 0.965884780883789, "max": 2.534271240234375, "pos_frac": 0.6875, "sample": [1.6875076293945312, 0.37007904052734375, 0.14284896850585938, -0.03680419921875, -0.17086029052734375, 0.617034912109375, 0.969085693359375, -0.16522979736328125, -0.4522895812988281, -0.20417022705078125, 0.18207168579101562, 0.4319305419921875, -1.5031814575195312, 0.15338134765625, 0.24579238891601562, 1.9034423828125, 0.9394340515136719, 0.4052581787109375, -0.0648345947265625, -0.0655975341796875, 0.045795440673828125, -1.79083251953125, 0.4493865966796875, 0.43897438049316406, 2.534271240234375, 0.42266082763671875, 0.2774219512939453, 0.82000732421875, 0.095123291015625, 0.227020263671875, 0.2707862854003906, 0.769378662109375, 0.34393310546875, -0.43936729431152344, -0.992889404296875, -0.325927734375, 0.3379554748535156, 0.2221221923828125, 0.441864013671875, -0.0734710693359375, 0.23675155639648438, 0.9584159851074219, 0.28722381591796875, 0.8603973388671875, 0.156951904296875, 0.15839004516601562, 1.81195068359375, -0.254241943359375, -0.4159698486328125, -0.7142486572265625, -0.07575607299804688, 0.4817790985107422, 0.08086395263671875, 0.0638275146484375, -0.16978073120117188, 0.8349990844726562, 1.02984619140625, 0.2940788269042969, 0.7819232940673828, 2.08880615234375, 0.0682220458984375, -0.530059814453125, 0.9044914245605469, -0.8340225219726562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000055.npy"} +{"epoch": 0.08314436885865457, "step": 56, "batch_size": 64, "mean": 0.15546634793281555, "std": 0.6684150099754333, "min": -2.6973114013671875, "p10": -0.5643566131591796, "median": 0.242706298828125, "p90": 0.9604156494140631, "max": 1.6248397827148438, "pos_frac": 0.59375, "sample": [-0.1551971435546875, 0.5188217163085938, -0.03510093688964844, -0.09032440185546875, 0.6029815673828125, -0.14191436767578125, 0.649322509765625, -0.8329010009765625, -0.4649391174316406, -0.05691337585449219, 0.3183746337890625, -1.268463134765625, 0.2524566650390625, -0.059539794921875, 0.069488525390625, 1.2195892333984375, 0.29381561279296875, -0.6059284210205078, 0.289215087890625, 1.0184898376464844, -0.31253814697265625, 1.5108108520507812, 0.7031211853027344, 0.45660400390625, 0.26336097717285156, 0.7455234527587891, -0.04911041259765625, 0.43242645263671875, 0.09358787536621094, 0.4645957946777344, -0.52178955078125, -0.05145263671875, 1.0522613525390625, 0.4834728240966797, 0.5489578247070312, -0.7112350463867188, -2.6973114013671875, 0.21076011657714844, -0.0112457275390625, 0.258636474609375, 0.2947063446044922, 0.6575088500976562, -0.3846588134765625, -0.5825996398925781, 0.33568382263183594, 0.04120635986328125, 0.2329559326171875, 1.2450942993164062, -0.06374931335449219, 0.13957595825195312, 0.5118064880371094, 0.5216941833496094, 0.8249092102050781, 1.0752143859863281, 0.292022705078125, -0.34683990478515625, -0.817169189453125, 0.2579193115234375, 0.5909309387207031, -0.08493804931640625, -0.3322601318359375, 1.6248397827148438, -0.058826446533203125, -0.4159507751464844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000056.npy"} +{"epoch": 0.08465608465608465, "step": 57, "batch_size": 64, "mean": 0.39299964904785156, "std": 0.68541419506073, "min": -0.8373565673828125, "p10": -0.5355854034423828, "median": 0.4466114044189453, "p90": 1.105838775634766, "max": 2.1488265991210938, "pos_frac": 0.71875, "sample": [-0.2680625915527344, -0.4253406524658203, 0.39888572692871094, 1.90716552734375, -0.22179222106933594, 1.2596282958984375, 0.4360389709472656, -0.11962127685546875, 0.57843017578125, 0.9505462646484375, 1.836456298828125, 0.6240520477294922, -0.8373565673828125, 0.33886146545410156, 0.8805160522460938, -0.75457763671875, 0.7282180786132812, 0.650238037109375, 2.1488265991210938, 0.315277099609375, 0.6040725708007812, -0.4238433837890625, 0.4706001281738281, 2.0494384765625, -0.04189300537109375, -0.6843032836914062, 0.22573089599609375, 0.457183837890625, -0.18921852111816406, -0.5970458984375, 0.7456283569335938, 0.6159839630126953, 0.32275390625, 0.5397415161132812, -0.1975860595703125, 0.2536468505859375, 0.487762451171875, 0.1380176544189453, -0.8074111938476562, 0.4844512939453125, 0.2990875244140625, -0.28833770751953125, -0.5915756225585938, 0.7497806549072266, -0.5375595092773438, 0.586273193359375, 0.5403671264648438, 0.7345123291015625, 1.1518096923828125, 0.7437515258789062, 0.8596839904785156, 0.7168197631835938, 0.0668487548828125, 1.8844146728515625, 0.17547035217285156, 0.9985733032226562, 0.0884246826171875, 0.7810859680175781, 0.19747543334960938, 0.6924057006835938, -0.04878997802734375, 0.0670928955078125, 0.93524169921875, -0.5309791564941406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000057.npy"} +{"epoch": 0.08616780045351474, "step": 58, "batch_size": 64, "mean": 0.21979853510856628, "std": 0.9964690208435059, "min": -1.3160934448242188, "p10": -0.642724609375, "median": 0.009464263916015625, "p90": 1.0815887451171875, "max": 4.578033447265625, "pos_frac": 0.5, "sample": [-1.3160934448242188, 0.8334274291992188, 0.9622802734375, -0.3194770812988281, 1.0826873779296875, -0.5652389526367188, -0.04640960693359375, 0.2486114501953125, 0.12656402587890625, -0.44968414306640625, 1.3241806030273438, -0.4199504852294922, 0.814422607421875, -0.6303176879882812, -0.8095417022705078, 0.5235633850097656, 1.4886970520019531, -0.44268035888671875, -0.642852783203125, 0.65850830078125, 0.05493927001953125, 0.033313751220703125, 0.6620330810546875, 0.07830810546875, -0.6930770874023438, 0.0322113037109375, -1.27679443359375, 0.1584625244140625, -0.6616935729980469, 0.8889198303222656, -0.01328277587890625, -1.0975914001464844, 0.6844749450683594, -0.14960479736328125, 4.578033447265625, -0.10886383056640625, -0.60052490234375, 3.4256591796875, 1.7943038940429688, 0.4450874328613281, -0.421661376953125, -0.031818389892578125, -0.2457275390625, -0.33487701416015625, -0.642425537109375, 2.507598876953125, -0.3371238708496094, -0.5187225341796875, 0.17547607421875, 0.7381401062011719, 0.3577728271484375, 1.023956298828125, -0.3504180908203125, -0.16420745849609375, -0.026645660400390625, 1.0790252685546875, 0.25008392333984375, -0.47554779052734375, -0.42757415771484375, 1.013702392578125, -0.23537445068359375, -0.100982666015625, 0.23415565490722656, 0.3452911376953125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000058.npy"} +{"epoch": 0.08767951625094482, "step": 59, "batch_size": 64, "mean": 0.2514455020427704, "std": 0.831771194934845, "min": -1.4849929809570312, "p10": -0.5891313552856445, "median": 0.21755218505859375, "p90": 1.0565628051757814, "max": 2.832244873046875, "pos_frac": 0.5625, "sample": [-0.2672233581542969, 0.5373992919921875, 0.25731658935546875, -0.9608802795410156, -0.21635055541992188, -0.5904903411865234, 0.8502197265625, -1.4849929809570312, 0.4454345703125, 0.61199951171875, 1.80511474609375, 0.40380859375, 0.8007354736328125, 1.2814826965332031, 0.4888591766357422, -0.1738300323486328, 1.482452392578125, -0.9573040008544922, -0.503997802734375, 0.49465179443359375, 0.35245513916015625, -0.3036041259765625, -0.22283172607421875, 0.7387161254882812, -0.44317626953125, 0.6633415222167969, -0.21821975708007812, 1.0076065063476562, 2.825927734375, 0.17778778076171875, -0.035858154296875, 1.0607833862304688, 0.6201667785644531, -0.15439605712890625, -0.439361572265625, 0.11636161804199219, -0.038005828857421875, 0.558868408203125, -0.2174224853515625, -0.4157829284667969, 2.832244873046875, 0.32320404052734375, 1.0467147827148438, 0.8313617706298828, -0.5859603881835938, 0.5149269104003906, -0.4888877868652344, 0.8833847045898438, 0.08413505554199219, 0.8363800048828125, -1.0332069396972656, 0.8623275756835938, -0.010135650634765625, -1.458343505859375, 0.698333740234375, -0.2422943115234375, -1.0753021240234375, 0.1049041748046875, -0.2623023986816406, -0.0128021240234375, 0.499603271484375, 1.521087646484375, 0.38272857666015625, -0.09735107421875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000059.npy"} +{"epoch": 0.08919123204837491, "step": 60, "batch_size": 64, "mean": 0.07426166534423828, "std": 0.8363189697265625, "min": -2.2081146240234375, "p10": -1.0402454376220702, "median": 0.2582721710205078, "p90": 0.9341352462768555, "max": 1.6619110107421875, "pos_frac": 0.625, "sample": [0.6920890808105469, 0.39113616943359375, 0.9207344055175781, 0.01360321044921875, -0.32747650146484375, 1.2174491882324219, -1.7433624267578125, -1.0098762512207031, 0.036205291748046875, -2.2081146240234375, 0.47585296630859375, 0.0281219482421875, -0.25353240966796875, -0.22067642211914062, -1.0626907348632812, 0.6716270446777344, -0.2503776550292969, 0.9398784637451172, 1.3406181335449219, 0.5826988220214844, -0.4944915771484375, 0.027111053466796875, -0.11749267578125, -1.0532608032226562, 0.33036041259765625, -0.10840606689453125, 0.6301956176757812, 0.3169059753417969, 0.9512252807617188, -0.9433174133300781, 0.4146747589111328, 0.01740264892578125, 1.28814697265625, 0.6331253051757812, -0.10106658935546875, 0.7147140502929688, 0.6929416656494141, -0.7448883056640625, 0.2854156494140625, -0.7178192138671875, -0.9533233642578125, 0.8576030731201172, 0.6202392578125, -1.7135200500488281, 0.3192272186279297, 1.1945953369140625, -0.2830543518066406, -1.423797607421875, 0.8288497924804688, 0.020900726318359375, 0.8631210327148438, 0.2963409423828125, 0.5706920623779297, 0.6859664916992188, 1.6619110107421875, -0.2685680389404297, 0.5406608581542969, 0.188140869140625, 0.37335205078125, 0.23112869262695312, -2.001434326171875, -0.9283962249755859, 0.8915500640869141, -0.07482337951660156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000060.npy"} +{"epoch": 0.09070294784580499, "step": 61, "batch_size": 64, "mean": 0.10098138451576233, "std": 1.000292420387268, "min": -2.7902755737304688, "p10": -1.2415443420410155, "median": 0.025379180908203125, "p90": 1.1810745239257814, "max": 2.077667236328125, "pos_frac": 0.515625, "sample": [1.149169921875, 0.8672027587890625, 1.5864105224609375, 2.044219970703125, -0.012882232666015625, 0.6273708343505859, 0.5098342895507812, 2.002391815185547, 0.94134521484375, -0.3205108642578125, -0.0759429931640625, -0.18745040893554688, -0.14943695068359375, -0.2664031982421875, 0.4832115173339844, -0.3456306457519531, 1.0766983032226562, -0.37404823303222656, 0.03690338134765625, 0.5734596252441406, -0.13105010986328125, 0.1922454833984375, 0.9619903564453125, 0.01385498046875, -0.16029739379882812, -0.11937141418457031, -1.0771026611328125, -2.1100921630859375, 0.04216766357421875, -0.34014129638671875, 0.9876003265380859, -0.34522247314453125, -0.8764533996582031, 0.9528656005859375, -0.5444183349609375, 0.6411514282226562, 0.2708320617675781, -0.4171257019042969, -0.32564544677734375, 1.033905029296875, 2.077667236328125, -2.09246826171875, -0.138824462890625, -1.6699600219726562, 0.5209197998046875, 1.3718986511230469, 0.37950897216796875, 0.19367218017578125, -0.42822265625, -0.2183666229248047, 1.1466789245605469, -1.4816360473632812, -0.045806884765625, -0.0561370849609375, 0.87371826171875, -2.7902755737304688, 1.1947479248046875, 0.5392303466796875, 0.13739013671875, -0.34223175048828125, 1.2948455810546875, 0.6573562622070312, -2.1644821166992188, -1.3120193481445312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000061.npy"} +{"epoch": 0.09221466364323508, "step": 62, "batch_size": 64, "mean": 0.25477129220962524, "std": 0.865344226360321, "min": -1.8827667236328125, "p10": -0.6472923278808593, "median": 0.20161151885986328, "p90": 1.3239845275878908, "max": 2.4447479248046875, "pos_frac": 0.65625, "sample": [1.22332763671875, -1.5298290252685547, -0.7667694091796875, 0.5202255249023438, 0.7224273681640625, 0.26085662841796875, 1.3646736145019531, -0.42843055725097656, -1.3854904174804688, -0.18120574951171875, 1.7654151916503906, 0.015550613403320312, 1.2422103881835938, -1.51678466796875, 1.3367767333984375, 0.39697265625, 0.5135574340820312, 0.56591796875, -0.1978473663330078, 0.6047286987304688, -0.3256683349609375, -0.6140899658203125, -0.603759765625, 0.07237052917480469, 0.09573745727539062, 0.0457305908203125, -0.5648994445800781, 0.2746124267578125, 0.8891067504882812, 1.2941360473632812, -0.21502685546875, 0.05436515808105469, 0.03250694274902344, 0.19720458984375, 1.4070510864257812, -1.8827667236328125, -0.581085205078125, 1.6324996948242188, -0.1391925811767578, -0.12540435791015625, 0.18707275390625, 1.1659927368164062, 0.0877532958984375, 0.607391357421875, 0.8098716735839844, 0.7164115905761719, -0.114013671875, -0.5135307312011719, 0.20831298828125, 1.1995849609375, -0.2896881103515625, 0.7610435485839844, 0.8014011383056641, 0.2798290252685547, -0.6615219116210938, 0.04799652099609375, 2.4447479248046875, 2.36456298828125, 0.20601844787597656, 0.45877838134765625, 0.7623291015625, -0.22653961181640625, -1.082427978515625, 0.6142749786376953], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000062.npy"} +{"epoch": 0.09372637944066516, "step": 63, "batch_size": 64, "mean": 0.569621205329895, "std": 0.8622504472732544, "min": -2.7677459716796875, "p10": -0.29421920776367183, "median": 0.46799373626708984, "p90": 1.5765550613403323, "max": 2.800537109375, "pos_frac": 0.84375, "sample": [0.8937606811523438, 0.24556732177734375, 0.0464019775390625, 0.2537841796875, 2.6307373046875, -0.30352783203125, -0.32636260986328125, 2.0491943359375, 1.01385498046875, 0.5932083129882812, -2.7677459716796875, -0.36301422119140625, 0.3446540832519531, -0.6314239501953125, 1.1202392578125, -0.1119232177734375, 2.09918212890625, 0.1627197265625, 0.2832908630371094, 0.8229923248291016, -0.9531173706054688, 0.19393348693847656, 0.7030982971191406, 2.33026123046875, 0.6853179931640625, 0.8290557861328125, 1.3846893310546875, 0.17151641845703125, 0.4403820037841797, 0.31919097900390625, 0.3818855285644531, 0.6842880249023438, 1.3760490417480469, 0.7718505859375, 0.075836181640625, 0.0075225830078125, 0.53948974609375, -0.27249908447265625, 0.47617530822753906, 0.9799289703369141, 0.8313522338867188, 2.800537109375, 0.3807239532470703, 1.4882259368896484, 0.7437839508056641, 0.9680633544921875, 0.80908203125, 1.4256019592285156, 0.7158966064453125, -0.19495010375976562, 0.19382476806640625, 0.32678985595703125, 0.000324249267578125, 0.0296173095703125, 0.9006271362304688, 0.25634765625, 0.9347381591796875, 0.4598121643066406, -0.48146629333496094, 0.12309646606445312, 1.0994110107421875, 1.7975921630859375, 1.614410400390625, 0.05187225341796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000063.npy"} +{"epoch": 0.09523809523809523, "step": 64, "batch_size": 64, "mean": 0.08646336197853088, "std": 0.8720651865005493, "min": -3.161590576171875, "p10": -0.6949203491210937, "median": 0.18042755126953125, "p90": 0.9491264343261722, "max": 2.333038330078125, "pos_frac": 0.5625, "sample": [1.8232192993164062, 2.030120849609375, -0.9599437713623047, -0.5177841186523438, -0.25330352783203125, -0.46508026123046875, 0.7674064636230469, 0.2554168701171875, 0.28772926330566406, 2.333038330078125, 0.463714599609375, 0.48412322998046875, 1.0209293365478516, -0.3406562805175781, 0.47408294677734375, -0.21117401123046875, -0.3355255126953125, 0.3881378173828125, 0.23015213012695312, 0.6419048309326172, 0.982147216796875, -0.16418838500976562, -0.16288375854492188, -0.2917919158935547, -0.7391815185546875, -0.27062416076660156, -0.07817459106445312, -3.161590576171875, -0.6539688110351562, 0.4040870666503906, 0.105377197265625, 0.3545989990234375, -0.24452972412109375, -0.5446243286132812, 0.09844970703125, 0.3600311279296875, 0.4840507507324219, -2.677764892578125, -1.1802978515625, 0.6953392028808594, 0.30738067626953125, 0.27904510498046875, 0.8720779418945312, -0.4150238037109375, 0.20894622802734375, 0.003021240234375, -0.06601524353027344, 0.2382049560546875, -0.28668975830078125, 1.8125381469726562, -0.7585105895996094, -0.3640098571777344, 1.3336563110351562, 0.32964324951171875, 0.19525527954101562, 0.3621864318847656, 0.6979866027832031, 0.16559982299804688, -0.7124710083007812, -0.4071044921875, 0.32440948486328125, -0.43470001220703125, -0.18434524536132812, 0.6016044616699219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000064.npy"} +{"epoch": 0.09674981103552532, "step": 65, "batch_size": 64, "mean": 0.515876054763794, "std": 1.219058632850647, "min": -2.665496826171875, "p10": -0.873748779296875, "median": 0.4864778518676758, "p90": 1.8953302383422854, "max": 4.17254638671875, "pos_frac": 0.71875, "sample": [0.18703937530517578, 0.7629165649414062, 1.517364501953125, 0.182769775390625, 0.020772933959960938, 0.63055419921875, -1.4543914794921875, -0.4731292724609375, -0.6344184875488281, 1.8179092407226562, -0.8873443603515625, 0.7030372619628906, 1.325296401977539, 0.29662322998046875, 0.8959922790527344, 0.5479297637939453, 0.6323471069335938, 0.22374725341796875, -0.8361663818359375, 2.3655242919921875, 1.0385284423828125, 0.1256103515625, -1.684112548828125, 2.5362167358398438, 1.9285106658935547, 0.12725448608398438, -2.665496826171875, 0.3143768310546875, -0.1424713134765625, 0.72381591796875, 0.12549972534179688, 0.6168594360351562, -0.8052139282226562, -1.0546989440917969, 0.7836990356445312, 2.9727706909179688, 0.6808891296386719, 2.9557952880859375, 1.4086151123046875, 1.2347412109375, 1.6476917266845703, 0.08747291564941406, 1.7422866821289062, 0.8088188171386719, -0.6049346923828125, 0.13724517822265625, 0.7607612609863281, -0.04726409912109375, -1.0558605194091797, -0.8420257568359375, 0.42502593994140625, 0.92486572265625, -0.275299072265625, 0.9319648742675781, 0.12709808349609375, 0.7829742431640625, 2.8852310180664062, -0.28510093688964844, 1.44500732421875, 1.7351303100585938, -0.031982421875, -1.6870269775390625, 4.17254638671875, 0.18587684631347656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000065.npy"} +{"epoch": 0.0982615268329554, "step": 66, "batch_size": 64, "mean": 0.38975614309310913, "std": 1.1121292114257812, "min": -2.74554443359375, "p10": -1.0713481903076172, "median": 0.3004570007324219, "p90": 1.7776916503906253, "max": 3.5006103515625, "pos_frac": 0.71875, "sample": [0.24657821655273438, 3.4921722412109375, 1.0518035888671875, 0.6490917205810547, 0.2617321014404297, 0.7761383056640625, 0.38411903381347656, 0.2226715087890625, -0.2649974822998047, 0.1803607940673828, -0.6755180358886719, 0.8734664916992188, 2.3466644287109375, -0.051265716552734375, -1.104278564453125, -0.985137939453125, 0.6356048583984375, 0.7067222595214844, 1.701385498046875, 1.9928207397460938, 0.5063934326171875, 1.7161521911621094, -1.4074249267578125, 0.0075836181640625, 0.05722808837890625, 0.7892684936523438, 0.7231826782226562, 1.2528839111328125, 0.8295745849609375, 0.39832305908203125, 0.7985305786132812, 0.3795604705810547, 0.22895050048828125, -0.17481422424316406, 0.11736106872558594, -0.11783599853515625, 0.8157310485839844, 0.31275177001953125, -0.9945106506347656, -0.00022125244140625, -2.74554443359375, -2.2093467712402344, 0.085052490234375, -0.1737823486328125, 0.10915374755859375, -1.1199874877929688, 1.8040657043457031, 0.24338531494140625, 1.23406982421875, 0.9485988616943359, 0.07155799865722656, 0.197601318359375, 0.3212623596191406, 3.5006103515625, 2.2508544921875, -1.1151809692382812, 0.2881622314453125, -1.3843269348144531, -0.0911865234375, 1.830474853515625, 1.1651535034179688, -0.2998237609863281, 0.9504547119140625, 0.4043121337890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000066.npy"} +{"epoch": 0.09977324263038549, "step": 67, "batch_size": 64, "mean": 0.32035303115844727, "std": 0.9184228777885437, "min": -2.10833740234375, "p10": -0.7311441421508789, "median": 0.2754364013671875, "p90": 1.4441055297851566, "max": 3.0619964599609375, "pos_frac": 0.671875, "sample": [0.3763275146484375, -1.2891845703125, -0.6390285491943359, -0.42486000061035156, -0.7706222534179688, 0.39021873474121094, 1.7707576751708984, 0.9664764404296875, 0.41754913330078125, -0.5498428344726562, 1.4833450317382812, 0.13468170166015625, -0.3615875244140625, -1.01751708984375, 1.0610122680664062, 0.9731521606445312, -0.39806175231933594, 0.8261871337890625, -0.4023284912109375, 0.9518890380859375, -0.26715087890625, 1.1234664916992188, -2.10833740234375, 3.0619964599609375, 0.5105247497558594, 0.752685546875, 0.8504447937011719, 0.1618804931640625, 1.3525466918945312, -0.8291893005371094, 0.20713043212890625, 0.5196933746337891, 0.58294677734375, 1.6450576782226562, 0.5821037292480469, 0.2400684356689453, 0.27081298828125, 0.2411632537841797, -0.3631019592285156, 1.0595016479492188, 2.360687255859375, 0.183868408203125, 0.9120101928710938, 1.0541610717773438, 0.4618377685546875, 0.09965133666992188, -0.3536224365234375, -0.09742546081542969, 0.09174346923828125, -0.4753570556640625, 0.6177139282226562, 1.7169189453125, 0.3477020263671875, 0.1399078369140625, -0.5034675598144531, -0.23821258544921875, 0.875823974609375, -0.0986175537109375, -1.0996952056884766, -1.69586181640625, 1.9478340148925781, 0.25952911376953125, 0.280059814453125, 0.6225967407226562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000067.npy"} +{"epoch": 0.10128495842781557, "step": 68, "batch_size": 64, "mean": 0.3158555328845978, "std": 1.263443112373352, "min": -4.003265380859375, "p10": -1.156245422363281, "median": 0.4177703857421875, "p90": 1.4872001647949225, "max": 4.072021484375, "pos_frac": 0.734375, "sample": [4.072021484375, 1.553619384765625, 0.15522193908691406, 1.2933502197265625, -0.7252731323242188, 2.3156814575195312, 0.42095947265625, 0.09686660766601562, 1.0969982147216797, -0.0631866455078125, 1.8922042846679688, -4.003265380859375, 1.3322219848632812, 1.0865097045898438, 0.791351318359375, 0.995147705078125, -0.191558837890625, -0.25278472900390625, 0.3838348388671875, 0.46331024169921875, 0.785003662109375, 0.3296527862548828, 0.414581298828125, 1.0999488830566406, 0.4902381896972656, 0.5565547943115234, 0.6091728210449219, -0.95062255859375, 0.9048995971679688, -0.880462646484375, 0.05497550964355469, 0.6479606628417969, 0.7167930603027344, 0.5619964599609375, -1.2443695068359375, 0.14781951904296875, 3.5490570068359375, 0.09363555908203125, 0.188140869140625, 0.05415153503417969, -1.99224853515625, -1.396636962890625, 0.3861236572265625, 0.7470932006835938, -1.9389114379882812, -2.6358566284179688, 0.08425140380859375, 0.14867782592773438, -0.6895256042480469, -0.14485931396484375, 1.102386474609375, 0.44219207763671875, 0.02629852294921875, 1.6155471801757812, 0.9685211181640625, -0.07367706298828125, 0.45252227783203125, 1.3127365112304688, 2.1235809326171875, 0.49971580505371094, 1.0515098571777344, -0.8785400390625, 0.045436859130859375, -1.883941650390625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000068.npy"} +{"epoch": 0.10279667422524566, "step": 69, "batch_size": 64, "mean": 0.6287362575531006, "std": 1.256372094154358, "min": -2.23614501953125, "p10": -0.8013250350952148, "median": 0.4043140411376953, "p90": 2.2839324951171887, "max": 5.198333740234375, "pos_frac": 0.78125, "sample": [0.0089874267578125, 0.101593017578125, 2.6906471252441406, 0.237152099609375, 0.4903411865234375, -0.15279006958007812, -0.4105987548828125, -0.19332504272460938, 1.0823974609375, 1.1091766357421875, 0.8059406280517578, 0.2951011657714844, 0.338897705078125, 1.651824951171875, 1.584381103515625, 2.047515869140625, 0.5142955780029297, 1.719024658203125, 3.1915740966796875, -1.4703140258789062, 3.16064453125, -2.23614501953125, 2.44842529296875, 0.059482574462890625, 2.38525390625, 0.00634002685546875, 0.38720703125, 0.5510025024414062, 0.1631927490234375, 0.54400634765625, 0.48178863525390625, -0.972625732421875, 0.39853477478027344, 1.0255813598632812, 0.3244361877441406, -0.75030517578125, 1.7222862243652344, 0.5411853790283203, 0.024688720703125, 1.1186141967773438, 0.3146209716796875, 0.47052955627441406, 0.0699310302734375, 0.22010040283203125, 1.7079391479492188, -0.7418136596679688, 1.5326461791992188, 0.7040729522705078, -0.044586181640625, -1.3212509155273438, 0.2452850341796875, 1.0808963775634766, -1.8527870178222656, -0.8231906890869141, 0.9168128967285156, -0.14710617065429688, 1.2592620849609375, 0.17433547973632812, 2.039306640625, -0.9134922027587891, 5.198333740234375, 0.4100933074951172, 2.61285400390625, 0.10091018676757812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000069.npy"} +{"epoch": 0.10430839002267574, "step": 70, "batch_size": 64, "mean": 0.37581607699394226, "std": 1.162222146987915, "min": -3.083831787109375, "p10": -1.0137407302856445, "median": 0.47175025939941406, "p90": 1.8032127380371108, "max": 3.21771240234375, "pos_frac": 0.65625, "sample": [0.49465179443359375, -1.1881599426269531, 1.1775970458984375, -1.024871826171875, 0.4882678985595703, -0.9877681732177734, -0.44830322265625, 1.2617568969726562, 1.4107437133789062, -0.24939918518066406, 1.1133499145507812, 1.4071464538574219, -3.083831787109375, 1.1977691650390625, 0.08077239990234375, -0.5535717010498047, 2.2182464599609375, -1.6490478515625, -0.8371315002441406, -0.467926025390625, 3.0078048706054688, 0.7044086456298828, 1.0862483978271484, 0.7593116760253906, -1.5065040588378906, 0.8334770202636719, 0.6420631408691406, 2.1722946166992188, -0.9653091430664062, 3.21771240234375, 0.03225517272949219, 0.7009201049804688, -0.6462020874023438, -0.6018943786621094, 0.3680572509765625, 2.2628555297851562, 1.9535675048828125, 0.4522247314453125, 0.5929470062255859, 1.381866455078125, 0.4552326202392578, -1.065317153930664, -0.3947486877441406, 0.5144271850585938, 1.4523849487304688, 0.4398765563964844, -0.46913909912109375, 2.251800537109375, 0.033000946044921875, 1.1259536743164062, 0.18239593505859375, 1.2970123291015625, 0.618804931640625, -0.391876220703125, 0.37908172607421875, 0.04790687561035156, -0.2575531005859375, -1.5358715057373047, 1.3137283325195312, 0.7368412017822266, -0.5376739501953125, 0.8574104309082031, -0.6287384033203125, 0.8188934326171875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000070.npy"} +{"epoch": 0.10582010582010581, "step": 71, "batch_size": 64, "mean": 0.2483464628458023, "std": 1.5239101648330688, "min": -4.701080322265625, "p10": -1.5161952972412107, "median": 0.31485652923583984, "p90": 2.002921295166016, "max": 3.2950973510742188, "pos_frac": 0.578125, "sample": [-0.2174053192138672, 1.4105873107910156, 0.9137496948242188, 0.3372669219970703, -0.09765625, -0.6652374267578125, 1.1468677520751953, -1.2607955932617188, -0.37110137939453125, 2.75677490234375, 0.5554466247558594, -2.349700927734375, -0.447418212890625, 1.054840087890625, -2.8036346435546875, 0.0054779052734375, 0.646881103515625, 2.9429244995117188, 0.8262805938720703, 1.6749114990234375, -3.7229766845703125, 2.5982589721679688, 0.12114715576171875, -0.6031227111816406, 1.4957809448242188, 2.7581787109375, 0.04000091552734375, -0.1464405059814453, 0.7410602569580078, 0.5276870727539062, -4.701080322265625, -0.641510009765625, -1.6256523132324219, -0.9083480834960938, -0.06897163391113281, 0.34091949462890625, 0.3671989440917969, 0.88775634765625, 1.4940948486328125, -0.822418212890625, -0.51995849609375, -2.9059600830078125, 0.797943115234375, 1.8055267333984375, -0.32904815673828125, -0.25231075286865234, -1.631805419921875, 1.9448318481445312, -0.43476104736328125, -0.08956718444824219, 1.2618141174316406, 2.4083900451660156, -0.7936248779296875, 2.0278167724609375, 1.0791091918945312, 1.4028358459472656, 0.6569938659667969, 0.04242706298828125, 0.6008529663085938, 0.2924461364746094, 1.6351776123046875, -0.176971435546875, 3.2950973510742188, -0.41370391845703125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000071.npy"} +{"epoch": 0.1073318216175359, "step": 72, "batch_size": 64, "mean": 0.7564687728881836, "std": 1.3514184951782227, "min": -3.2237091064453125, "p10": -0.7837268829345703, "median": 0.8011436462402344, "p90": 2.0021152496337895, "max": 4.986873626708984, "pos_frac": 0.75, "sample": [1.7545242309570312, 1.3472366333007812, 0.8473358154296875, 1.9140357971191406, -2.999908447265625, 0.3736763000488281, 0.4252166748046875, 4.986873626708984, -1.5907974243164062, -0.31053924560546875, 1.6559791564941406, 1.7526702880859375, -0.03050994873046875, 2.0367603302001953, 0.06924057006835938, -0.5248298645019531, -0.3127117156982422, 0.8373641967773438, 1.7925186157226562, 0.0904693603515625, 3.276519775390625, 1.0762386322021484, 1.9287223815917969, 0.4223651885986328, 0.6882171630859375, 0.764923095703125, 0.2151317596435547, -0.7967262268066406, -0.958892822265625, -0.7533950805664062, 2.6908493041992188, 1.315164566040039, 1.3078765869140625, 2.0335693359375, 1.7592697143554688, 0.5223045349121094, 0.7647571563720703, 1.4837055206298828, 0.9693717956542969, -0.0795135498046875, 1.2635231018066406, 1.3580760955810547, 1.57958984375, 0.20705604553222656, 0.8426361083984375, -0.12503433227539062, 1.7408599853515625, 1.1901092529296875, -1.1882286071777344, 0.996612548828125, -0.89410400390625, 1.4687042236328125, 3.2089385986328125, -0.6393451690673828, 2.9828720092773438, -0.20059967041015625, 1.7092361450195312, 0.6198387145996094, -3.2237091064453125, 0.03491401672363281, 0.49176788330078125, 1.2899169921875, 0.494659423828125, 0.4606475830078125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000072.npy"} +{"epoch": 0.10884353741496598, "step": 73, "batch_size": 64, "mean": 0.1308615803718567, "std": 1.612172245979309, "min": -3.9698333740234375, "p10": -1.4412124633789063, "median": -0.07537269592285156, "p90": 1.4895238876342776, "max": 7.09124755859375, "pos_frac": 0.484375, "sample": [1.1232070922851562, 0.6114540100097656, -0.7355117797851562, -0.8804130554199219, -1.2950687408447266, -1.48638916015625, -1.9505157470703125, -0.7746772766113281, -3.9698333740234375, 1.4482879638671875, -1.1481094360351562, 0.7797393798828125, 0.28287506103515625, -0.9854736328125, -1.0183448791503906, 0.7255458831787109, -1.9123611450195312, -0.18959426879882812, -0.267364501953125, 0.919525146484375, -0.6572113037109375, -0.022769927978515625, -0.8280220031738281, -0.3931884765625, 7.09124755859375, 2.314849853515625, -0.1279754638671875, -0.9756069183349609, 0.09177207946777344, 0.8976631164550781, 0.571929931640625, -0.17193031311035156, 0.9625835418701172, -0.3874244689941406, -1.428619384765625, 0.2346515655517578, 1.5071964263916016, 2.6893310546875, -1.9008808135986328, -1.3949813842773438, -0.722625732421875, 2.8387908935546875, 0.237701416015625, -1.4466094970703125, -0.9305000305175781, 1.2854690551757812, 0.8098220825195312, -0.8896579742431641, 0.079437255859375, -0.5690994262695312, -1.69061279296875, 0.6191177368164062, 1.1826553344726562, 0.3954429626464844, 1.1610298156738281, 1.134796142578125, 0.9710731506347656, 0.8189239501953125, -0.398681640625, -0.4219245910644531, 0.14597129821777344, 3.0272216796875, 4.200164794921875, -0.8123569488525391], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000073.npy"} +{"epoch": 0.11035525321239607, "step": 74, "batch_size": 64, "mean": 0.6733803749084473, "std": 1.39522385597229, "min": -3.1580352783203125, "p10": -0.8496105194091796, "median": 0.7450008392333984, "p90": 2.1684890747070327, "max": 6.059967041015625, "pos_frac": 0.6875, "sample": [-0.6336822509765625, 1.2256927490234375, -0.052703857421875, 0.5626144409179688, 1.7957687377929688, -0.7137413024902344, 2.3386077880859375, 6.059967041015625, 1.4352798461914062, 2.4061222076416016, 1.2497749328613281, 0.2042083740234375, 1.571746826171875, 1.3737106323242188, -0.7680835723876953, 1.3795051574707031, 0.91961669921875, 0.864288330078125, -0.2852764129638672, -3.1580352783203125, 0.5828971862792969, 2.3013916015625, 0.8661041259765625, 0.9160423278808594, 0.7351722717285156, -0.06527328491210938, -0.7309513092041016, 1.3094215393066406, 2.3783950805664062, -1.0394973754882812, 0.39363861083984375, 0.8790531158447266, 1.5998649597167969, -1.1194076538085938, -0.8743400573730469, 1.0121803283691406, -0.6375617980957031, 0.7548294067382812, -1.68865966796875, -0.2523002624511719, 0.6221942901611328, -1.1076183319091797, 1.287689208984375, 0.851470947265625, 0.9108047485351562, 2.7342071533203125, 1.5651779174804688, -0.5599861145019531, 1.5315170288085938, 1.8244857788085938, -2.0129852294921875, -0.3793525695800781, 0.7280845642089844, -0.2718353271484375, -0.7919082641601562, 0.36559486389160156, 0.43963623046875, 3.860443115234375, 1.8583831787109375, 1.5405044555664062, 1.5292739868164062, 0.3267478942871094, 0.5601253509521484, 0.587310791015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000074.npy"} +{"epoch": 0.11186696900982615, "step": 75, "batch_size": 64, "mean": 0.7894306182861328, "std": 1.349428415298462, "min": -2.8599586486816406, "p10": -0.6761844635009764, "median": 0.5343170166015625, "p90": 2.7303056716918963, "max": 4.687744140625, "pos_frac": 0.75, "sample": [-0.4111652374267578, -0.5399703979492188, -0.19181442260742188, 1.3294448852539062, 3.3711318969726562, 0.055850982666015625, 0.35608673095703125, 1.3534202575683594, 1.2713165283203125, 3.1672210693359375, -0.14633941650390625, -0.11722946166992188, -1.1533870697021484, 0.5526275634765625, 0.3136444091796875, 1.3800468444824219, 2.1522979736328125, -1.4059104919433594, 0.43184852600097656, 0.43876075744628906, 3.94927978515625, 1.2021636962890625, 1.2850341796875, 2.0516815185546875, 1.2312984466552734, 0.4973564147949219, 1.2388801574707031, -1.0706634521484375, 2.33209228515625, 0.483642578125, 0.9424057006835938, 2.900968551635742, 0.0990447998046875, 2.015972137451172, 1.1426773071289062, 0.42351722717285156, 4.687744140625, 0.974700927734375, 0.7354660034179688, 0.3401050567626953, 0.26847076416015625, 1.0025653839111328, -2.8599586486816406, 0.7341995239257812, 1.4704093933105469, -0.09377288818359375, -0.7345619201660156, 0.45793914794921875, 0.5251750946044922, 0.05490875244140625, 0.5434589385986328, 2.2747535705566406, -1.2464637756347656, -0.11252975463867188, 0.7013359069824219, -0.273590087890625, 3.079803466796875, -0.29462623596191406, -0.8862876892089844, 0.13444137573242188, 0.65673828125, 0.06103706359863281, 3.4472503662109375, 1.9416122436523438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000075.npy"} +{"epoch": 0.11337868480725624, "step": 76, "batch_size": 64, "mean": 0.33148977160453796, "std": 1.5809109210968018, "min": -4.362266540527344, "p10": -1.5409076690673826, "median": 0.2889137268066406, "p90": 2.226250457763672, "max": 4.406608581542969, "pos_frac": 0.578125, "sample": [-4.362266540527344, 1.1635398864746094, -2.6450042724609375, -0.099700927734375, 0.8156814575195312, -0.9173831939697266, -0.4400005340576172, 1.0179443359375, 0.4595222473144531, 3.39215087890625, 2.2835865020751953, 4.406608581542969, -0.33550453186035156, -3.6392669677734375, 0.852935791015625, -1.3918991088867188, 0.6060104370117188, 1.0204238891601562, 0.650726318359375, 0.2979621887207031, 0.354766845703125, 2.8189926147460938, -1.8619384765625, 3.0661239624023438, -1.8784942626953125, 1.6541595458984375, 0.8941459655761719, 1.2179794311523438, 0.11174201965332031, -0.26642799377441406, -0.05871009826660156, -0.7564163208007812, -1.5844879150390625, -0.4329071044921875, -0.3813610076904297, -0.06037139892578125, 2.1162490844726562, 0.894012451171875, -0.6712398529052734, 1.2828750610351562, -0.2937583923339844, 0.21990203857421875, 0.2926216125488281, -0.22830581665039062, 2.1938705444335938, 0.7346019744873047, 0.6918373107910156, -1.4392204284667969, 0.2852058410644531, -0.298583984375, -0.12091827392578125, 0.831573486328125, 0.16004562377929688, 2.2401275634765625, 3.787200927734375, 0.9602222442626953, -0.28496360778808594, -0.9406356811523438, -1.8968505859375, 1.7728271484375, 1.4878082275390625, 0.011386871337890625, 1.691558837890625, -0.2369670867919922], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000076.npy"} +{"epoch": 0.11489040060468632, "step": 77, "batch_size": 64, "mean": 0.7387731075286865, "std": 1.474638819694519, "min": -3.1195526123046875, "p10": -1.2691188812255858, "median": 0.48543453216552734, "p90": 2.648730850219727, "max": 4.9232025146484375, "pos_frac": 0.734375, "sample": [-0.39266014099121094, 1.3716354370117188, -1.3016395568847656, -1.4175491333007812, 2.008974075317383, 1.6629524230957031, -1.672698974609375, -0.11261177062988281, -3.1195526123046875, 0.22945404052734375, 2.108123779296875, 1.1646232604980469, 0.2560253143310547, -1.5337562561035156, 0.8526458740234375, 2.955402374267578, 0.2272491455078125, 1.1741943359375, 0.8080978393554688, 3.5502548217773438, -0.36012840270996094, 0.13500022888183594, 2.463714599609375, 2.4446678161621094, 0.372039794921875, 0.5529747009277344, 0.07716941833496094, 2.7280235290527344, 0.18938064575195312, 0.4862213134765625, -0.6862640380859375, -0.7665214538574219, -0.2522087097167969, 0.4436988830566406, 1.3084068298339844, 2.15484619140625, 1.05682373046875, 1.219045639038086, 0.9416542053222656, 1.7013320922851562, 1.972564697265625, 0.06078338623046875, 0.863006591796875, -0.08915519714355469, 0.07196426391601562, 4.9232025146484375, 0.2848529815673828, -0.010747909545898438, 2.9564971923828125, 0.9563980102539062, 4.132568359375, 0.25160980224609375, 0.4846477508544922, 1.6711845397949219, 2.3209152221679688, 0.35999298095703125, -1.38800048828125, -1.1932373046875, 1.4032058715820312, -0.2993431091308594, 0.29634857177734375, 3.1570968627929688, 0.5252170562744141, -1.459136962890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000077.npy"} +{"epoch": 0.1164021164021164, "step": 78, "batch_size": 64, "mean": 0.4390455484390259, "std": 1.4534575939178467, "min": -3.9903335571289062, "p10": -1.0647705078124998, "median": 0.38290977478027344, "p90": 2.091961288452149, "max": 4.147132873535156, "pos_frac": 0.640625, "sample": [2.6414623260498047, -2.95635986328125, 0.7653179168701172, 1.9414634704589844, 0.65374755859375, 2.486480712890625, 0.7694206237792969, -0.3345184326171875, 0.5092849731445312, 0.569549560546875, 1.19085693359375, -1.239288330078125, -0.24477767944335938, 1.7109756469726562, 0.3712921142578125, -0.34720611572265625, -1.6561698913574219, 3.654266357421875, -1.2527618408203125, 0.6546554565429688, -0.9588775634765625, -0.481658935546875, 0.1053466796875, -0.9507484436035156, 0.9763946533203125, 0.32465362548828125, 0.1332855224609375, -3.9903335571289062, 2.1310577392578125, -3.0204925537109375, 1.8915176391601562, 1.2956771850585938, -0.20146942138671875, 1.7545623779296875, 0.155517578125, -0.277099609375, -0.8847885131835938, -0.10529327392578125, 1.7624073028564453, 1.7075614929199219, 0.613739013671875, 0.16906356811523438, 1.457244873046875, 1.5632896423339844, -0.360137939453125, 1.3022613525390625, -1.1101531982421875, 0.3945274353027344, 0.2604522705078125, 1.0130691528320312, -0.5627822875976562, 2.643951416015625, 0.21910858154296875, -0.6937255859375, -0.004058837890625, -0.7161750793457031, 0.09647178649902344, -0.5164031982421875, 1.2426719665527344, 2.3843154907226562, 0.83807373046875, 0.4613304138183594, 4.147132873535156, 2.0007362365722656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000078.npy"} +{"epoch": 0.11791383219954649, "step": 79, "batch_size": 64, "mean": 1.1672492027282715, "std": 2.0240259170532227, "min": -3.0674514770507812, "p10": -0.5760848999023438, "median": 0.6685504913330078, "p90": 3.2078861236572283, "max": 8.059417724609375, "pos_frac": 0.71875, "sample": [-0.07511711120605469, 0.2720489501953125, -1.2310523986816406, 1.7906951904296875, 0.0263824462890625, 1.3686599731445312, -3.0674514770507812, -0.23629379272460938, 0.44753265380859375, 0.31854248046875, -0.8136062622070312, 0.4979400634765625, 1.9058189392089844, 8.059417724609375, -1.7506103515625, 0.5972824096679688, 2.3574485778808594, 0.46764373779296875, -0.4424419403076172, -0.20886993408203125, 1.2513599395751953, 6.5101165771484375, 1.6090240478515625, 3.605865478515625, 1.1129875183105469, -1.4051628112792969, 4.524600982666016, 2.4472198486328125, 1.9611358642578125, 1.9981613159179688, -1.2086639404296875, -0.23090362548828125, 2.5463409423828125, 2.1599884033203125, 1.8773555755615234, 0.5098075866699219, 1.1500205993652344, 1.842203140258789, -0.5684051513671875, 2.1607818603515625, -0.4942665100097656, 2.8086700439453125, 0.3248748779296875, -0.2907600402832031, 0.7701282501220703, 0.9780426025390625, 2.2840728759765625, 0.2659893035888672, 0.7398185729980469, 0.152496337890625, 1.1606426239013672, -0.0325927734375, 5.33367919921875, -0.1719207763671875, 0.5916328430175781, 8.048309326171875, 0.4428253173828125, 1.4773635864257812, 0.3643035888671875, 2.0928306579589844, -0.579376220703125, 1.1853981018066406, 3.378978729248047, -0.26499176025390625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000079.npy"} +{"epoch": 0.11942554799697656, "step": 80, "batch_size": 64, "mean": 0.5562411546707153, "std": 1.9760124683380127, "min": -4.5836181640625, "p10": -1.5239288330078125, "median": 0.1878490447998047, "p90": 3.127659606933594, "max": 5.474639892578125, "pos_frac": 0.53125, "sample": [-0.5489406585693359, 3.1454620361328125, 0.1019134521484375, 2.001556396484375, 1.2495155334472656, -0.784027099609375, -0.5607757568359375, -0.3222827911376953, -1.5619049072265625, -1.815093994140625, 2.1700668334960938, 3.3876266479492188, -0.29697418212890625, -1.1065597534179688, -0.23830413818359375, 4.652435302734375, -1.34893798828125, -0.10589599609375, 0.6338977813720703, -0.05616569519042969, 0.2677955627441406, -1.4353179931640625, 0.35042381286621094, 1.4327011108398438, 4.6071014404296875, 2.954641342163086, 2.9001693725585938, -0.7372055053710938, 2.8413543701171875, 4.1387481689453125, -1.7671661376953125, 1.8689727783203125, 0.6630096435546875, 0.67657470703125, 0.9211273193359375, 2.178131103515625, -0.7704849243164062, 0.10790252685546875, 4.41583251953125, -4.5836181640625, 3.08612060546875, -0.22338104248046875, -3.1146163940429688, 1.7824935913085938, -0.14497756958007812, 0.8591804504394531, 1.391754150390625, 0.46926116943359375, -2.1073532104492188, -1.4105606079101562, 2.676055908203125, -0.17298507690429688, -0.562591552734375, -0.269073486328125, -0.30319976806640625, -0.12369346618652344, 0.8271484375, -1.2264385223388672, 1.3748703002929688, -2.9561920166015625, 0.37030792236328125, -0.424041748046875, 5.474639892578125, 0.69940185546875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000080.npy"} +{"epoch": 0.12093726379440665, "step": 81, "batch_size": 64, "mean": 0.8704346418380737, "std": 1.852181077003479, "min": -2.5418243408203125, "p10": -1.0956283569335936, "median": 0.6477737426757812, "p90": 2.8413894653320315, "max": 7.9740753173828125, "pos_frac": 0.65625, "sample": [1.0381813049316406, 1.9865703582763672, 1.2289161682128906, -1.31829833984375, 1.4504585266113281, -2.5418243408203125, 0.3020057678222656, 0.381744384765625, -0.5611152648925781, -0.7833900451660156, 4.704833984375, -0.1648101806640625, 0.6469802856445312, 2.3249740600585938, 0.6485671997070312, -0.2262725830078125, 0.5046634674072266, -0.053714752197265625, 3.4786300659179688, 2.189699172973633, 0.9036369323730469, -0.5785484313964844, 1.7673797607421875, 2.1041259765625, 2.8596038818359375, 1.7635002136230469, 0.1306304931640625, -0.42264556884765625, -0.08964157104492188, -1.4518280029296875, 0.8740806579589844, -2.1587295532226562, 1.7127304077148438, 0.2667579650878906, -0.9417877197265625, 3.648040771484375, 0.1864776611328125, 7.9740753173828125, 1.282440185546875, 5.58148193359375, -0.5025711059570312, 1.2617988586425781, 0.53814697265625, -0.3665924072265625, 1.2831039428710938, 0.14260292053222656, 2.028108596801758, 0.8900527954101562, 2.4271011352539062, 2.2754974365234375, 3.6749114990234375, -0.8724365234375, 2.5244712829589844, -0.911895751953125, -0.2857799530029297, 1.006072998046875, -1.6135997772216797, 0.3027610778808594, 1.0626907348632812, 2.79888916015625, -0.6193580627441406, 1.4438209533691406, -2.266998291015625, -1.16156005859375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000081.npy"} +{"epoch": 0.12244897959183673, "step": 82, "batch_size": 64, "mean": 1.0469751358032227, "std": 1.5333313941955566, "min": -4.034271240234375, "p10": -0.5807218551635742, "median": 1.0396509170532227, "p90": 3.114344024658205, "max": 5.590278625488281, "pos_frac": 0.765625, "sample": [0.8003559112548828, 1.2377433776855469, 0.470184326171875, -0.8061199188232422, 2.144622802734375, 0.1974811553955078, 0.7573699951171875, 2.3317642211914062, 3.525360107421875, 1.3626995086669922, 1.2677726745605469, 0.5803451538085938, 1.832366943359375, 2.7377853393554688, 0.7517433166503906, 1.8121490478515625, 1.0614471435546875, 0.5112228393554688, 1.2992496490478516, 0.636810302734375, 0.2747230529785156, -0.4895515441894531, 1.0456409454345703, -0.23849105834960938, -0.33405303955078125, 3.275726318359375, 1.782308578491211, 1.062835693359375, 1.716115951538086, 1.0152130126953125, 0.5076789855957031, -0.06869888305664062, 5.590278625488281, -0.0265350341796875, 1.6174774169921875, 3.5176544189453125, 2.5683670043945312, 1.324066162109375, 1.5029144287109375, 3.7926712036132812, 0.45905303955078125, -1.9494400024414062, 2.6559677124023438, -1.3459587097167969, 1.8609142303466797, 0.5282974243164062, 2.155733108520508, 0.07718086242675781, 4.060356140136719, 1.033660888671875, -0.66070556640625, -0.012912750244140625, 1.65673828125, 3.3991928100585938, -0.22418212890625, -0.5889530181884766, 1.5557594299316406, 1.3461189270019531, 1.9334239959716797, 0.6389274597167969, -1.1959152221679688, -4.034271240234375, -0.5615158081054688, 0.2702445983886719], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000082.npy"} +{"epoch": 0.12396069538926682, "step": 83, "batch_size": 64, "mean": 1.1476980447769165, "std": 1.8273438215255737, "min": -3.6911792755126953, "p10": -0.6866079330444332, "median": 0.9790611267089844, "p90": 2.902433395385742, "max": 8.108726501464844, "pos_frac": 0.78125, "sample": [2.05084228515625, 1.463104248046875, -1.1475639343261719, 0.3421649932861328, 0.7381496429443359, -0.03308868408203125, 1.3052978515625, 1.4200210571289062, 2.0505142211914062, 5.10308837890625, 0.54296875, 1.3484420776367188, -2.0363807678222656, 1.0449943542480469, 1.8540706634521484, 0.8949966430664062, 1.5577850341796875, 2.6236648559570312, 2.1843605041503906, 0.9119834899902344, 1.9052505493164062, -0.39737701416015625, 3.5962066650390625, 0.28745079040527344, -1.559722900390625, 1.6677169799804688, 3.862396240234375, 0.3845672607421875, 0.46157264709472656, -0.05690956115722656, -0.32623291015625, 0.5942249298095703, 2.8882408142089844, -3.6911792755126953, -0.8105640411376953, 2.3327713012695312, 1.4951972961425781, 0.30224609375, 1.465200424194336, -2.392181396484375, 0.4159107208251953, 0.43935394287109375, 0.6290130615234375, 0.3050689697265625, -0.20660400390625, -0.1332855224609375, 0.2515735626220703, 2.082122802734375, 3.5899429321289062, 1.7335281372070312, 8.108726501464844, 1.7301807403564453, 2.9085159301757812, 0.9131278991699219, -0.01860809326171875, 1.731405258178711, 1.2001018524169922, 1.9027385711669922, 2.0184555053710938, 6.26080322265625, 1.134307861328125, 0.6437835693359375, 0.4357433319091797, -0.8515243530273438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000083.npy"} +{"epoch": 0.1254724111866969, "step": 84, "batch_size": 64, "mean": 0.9099798202514648, "std": 1.8950119018554688, "min": -2.927001953125, "p10": -1.6559640884399414, "median": 0.7940635681152344, "p90": 3.6635864257812503, "max": 5.39056396484375, "pos_frac": 0.75, "sample": [1.1292343139648438, 2.081279754638672, 0.8820610046386719, 2.168323516845703, 5.363609313964844, 1.785919189453125, 3.9455718994140625, -0.18450927734375, -0.35025787353515625, -2.375152587890625, 0.16365814208984375, 2.2178077697753906, 2.8012046813964844, 0.11771392822265625, 0.870513916015625, 0.4674034118652344, 0.2902984619140625, -0.7055282592773438, 4.205909729003906, -1.3852577209472656, 0.9746932983398438, 2.1471099853515625, 1.1802959442138672, 2.3707962036132812, 0.41562843322753906, 0.600860595703125, -1.6890449523925781, 3.6042633056640625, 0.21904563903808594, 0.7833023071289062, 0.6952590942382812, 0.8048248291015625, -0.4577980041503906, 5.39056396484375, -2.4305953979492188, 1.2237281799316406, 1.6383495330810547, 2.2801055908203125, 1.2486610412597656, -2.1353302001953125, -2.927001953125, 4.3316802978515625, 1.880615234375, 0.3717632293701172, 3.6890106201171875, 0.4733448028564453, 0.14326095581054688, 2.9420127868652344, 1.3555946350097656, -2.6132278442382812, 0.46405792236328125, -0.8518524169921875, 2.0763988494873047, 1.2319717407226562, 1.1206016540527344, -1.26507568359375, 4.004364013671875, 0.30223846435546875, 0.22206878662109375, -1.634490966796875, 2.9617233276367188, 0.1630096435546875, -1.6651668548583984, -0.8927154541015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000084.npy"} +{"epoch": 0.12698412698412698, "step": 85, "batch_size": 64, "mean": 1.2924078702926636, "std": 2.0140769481658936, "min": -4.069866180419922, "p10": -1.4360519409179686, "median": 1.0604619979858398, "p90": 3.544819259643555, "max": 6.7323150634765625, "pos_frac": 0.78125, "sample": [2.9548587799072266, -1.2593803405761719, 1.2010250091552734, 2.442117691040039, 1.0304336547851562, 1.3074111938476562, 1.7911834716796875, 0.7498836517333984, 0.10869026184082031, 3.476184844970703, 3.4584121704101562, 1.258880615234375, 2.214902877807617, 0.606048583984375, 1.4016075134277344, 1.6973495483398438, 1.8922615051269531, 2.9066162109375, 2.885204315185547, 2.5649337768554688, -1.5117683410644531, 2.58648681640625, -2.37127685546875, 2.668468475341797, 0.34115028381347656, 3.5742340087890625, 0.6153564453125, 1.5009689331054688, 5.081684112548828, -0.032466888427734375, -1.5773429870605469, 1.8334884643554688, 2.4834136962890625, 0.8442840576171875, 0.5170078277587891, 0.2210540771484375, 4.315086364746094, 2.523408889770508, 0.3500480651855469, -0.078338623046875, -4.069866180419922, 1.549896240234375, -0.8649673461914062, 2.1833229064941406, 6.7323150634765625, 3.14361572265625, 5.0868377685546875, 0.41481971740722656, 1.0275001525878906, 0.824737548828125, 1.0406074523925781, -2.298980712890625, 0.90728759765625, -0.3421630859375, 0.8083305358886719, 0.8927764892578125, -2.005908966064453, -1.5924072265625, 4.378959655761719, 0.6344413757324219, 5.8104705810546875, -0.996002197265625, -0.20540618896484375, 1.0803165435791016], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000085.npy"} +{"epoch": 0.12849584278155707, "step": 86, "batch_size": 64, "mean": 0.9739255309104919, "std": 2.0345981121063232, "min": -3.8279647827148438, "p10": -1.4832504272460934, "median": 0.8419170379638672, "p90": 3.8140174865722667, "max": 6.146537780761719, "pos_frac": 0.6875, "sample": [6.146537780761719, 0.11419105529785156, -2.1407012939453125, 0.09087371826171875, 1.978668212890625, -0.42836952209472656, 0.29862213134765625, 0.7771072387695312, -3.8279647827148438, 1.5158100128173828, -0.5247898101806641, -1.9001617431640625, 4.448822021484375, 4.952781677246094, -0.4712677001953125, 3.6016387939453125, 1.659097671508789, -0.6008758544921875, -3.1277847290039062, 0.09514236450195312, 4.51373291015625, -0.03865814208984375, -0.20467376708984375, 2.477994918823242, 4.1219024658203125, 0.24565696716308594, 0.886749267578125, 1.1425666809082031, 2.039886474609375, 0.38497161865234375, 2.6363487243652344, 4.6552886962890625, 2.2458343505859375, -2.2150726318359375, 3.111541748046875, 1.6914749145507812, -1.0963363647460938, 0.9281787872314453, -0.8697166442871094, 0.35555267333984375, -1.6157341003417969, 2.6467933654785156, 2.047840118408203, -0.4749927520751953, 1.9909095764160156, 0.19416427612304688, 3.2192325592041016, -1.1741218566894531, 1.8173866271972656, -0.7446842193603516, 1.810211181640625, 3.3756637573242188, 0.1270904541015625, -0.21648025512695312, 2.392852783203125, 3.9050369262695312, -2.205629348754883, 2.1446990966796875, 0.9709548950195312, -0.6707229614257812, 0.9521026611328125, 0.21129989624023438, 1.1596755981445312, 0.7970848083496094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000086.npy"} +{"epoch": 0.13000755857898716, "step": 87, "batch_size": 64, "mean": 1.0779623985290527, "std": 2.5056161880493164, "min": -6.708251953125, "p10": -2.1207695007324214, "median": 1.044332504272461, "p90": 4.526567840576172, "max": 6.662971496582031, "pos_frac": 0.703125, "sample": [1.1609840393066406, 5.295684814453125, 6.662971496582031, 0.02423858642578125, 1.6320152282714844, 0.64263916015625, 3.269989013671875, -1.3874053955078125, 3.82470703125, 2.817079544067383, -2.318981170654297, -1.3169631958007812, 1.4678058624267578, -2.241436004638672, -6.708251953125, 5.4741668701171875, -2.6262130737304688, 4.578590393066406, 0.7011833190917969, 1.4110260009765625, -3.070831298828125, 0.2063140869140625, 1.6237239837646484, -0.8021354675292969, 3.8123855590820312, -4.276344299316406, -0.3699493408203125, -0.09139633178710938, 1.7180023193359375, -1.334451675415039, -0.9195709228515625, 0.820098876953125, 4.405181884765625, -2.252288818359375, 1.58880615234375, -1.44012451171875, 1.0835342407226562, 1.7492713928222656, 2.7919998168945312, 0.5641098022460938, 0.7029876708984375, 2.9942398071289062, 0.72174072265625, -1.8392143249511719, 1.4391250610351562, 1.2023200988769531, 1.0051307678222656, 2.8646621704101562, -0.33194923400878906, 3.385162353515625, 3.16552734375, 1.520599365234375, 5.710052490234375, 0.15836334228515625, -0.105743408203125, 1.8127670288085938, 0.6975975036621094, -0.064453125, 5.568939208984375, 5.1241455078125, 1.54315185546875, 0.8358497619628906, 0.766021728515625, 1.9424057006835938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000087.npy"} +{"epoch": 0.13151927437641722, "step": 88, "batch_size": 64, "mean": 0.8290235996246338, "std": 3.027784824371338, "min": -8.073501586914062, "p10": -2.403634643554687, "median": 0.7219009399414062, "p90": 3.834303283691407, "max": 10.966018676757812, "pos_frac": 0.671875, "sample": [6.588531494140625, 0.90460205078125, -2.258646011352539, -0.79058837890625, 6.865486145019531, 3.6815948486328125, 5.8812713623046875, 0.4000740051269531, 1.1740341186523438, -0.0046863555908203125, 3.5245018005371094, 3.618560791015625, 1.5868473052978516, 1.7406673431396484, -0.9796371459960938, 1.7402191162109375, 4.6559600830078125, -1.0706405639648438, -2.821197509765625, 0.9989013671875, 2.759756088256836, 0.8922786712646484, 0.3899421691894531, -0.48756980895996094, -2.2312240600585938, 1.6939773559570312, 0.08464813232421875, 10.966018676757812, -1.2125091552734375, -2.6467666625976562, -7.611335754394531, -2.7872467041015625, 3.4742889404296875, -0.1720733642578125, 1.0385665893554688, 0.1708526611328125, -0.9908676147460938, 2.207378387451172, 1.3928718566894531, 1.1291751861572266, 0.3120613098144531, 2.5153045654296875, 2.2453155517578125, 0.9402503967285156, -3.149627685546875, -0.1732635498046875, 0.01474761962890625, 0.5515232086181641, 0.3411979675292969, 0.19012832641601562, 2.3517589569091797, 1.1348953247070312, 6.3065643310546875, 3.899749755859375, 2.2707290649414062, -2.045633316040039, 1.6325912475585938, 0.21390724182128906, 0.37802886962890625, 3.262714385986328, -1.1606483459472656, -8.073501586914062, -1.9315261840820312, -2.4657726287841797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000088.npy"} +{"epoch": 0.1330309901738473, "step": 89, "batch_size": 64, "mean": 1.3838995695114136, "std": 2.663546085357666, "min": -4.092193603515625, "p10": -0.9051488876342774, "median": 1.0014543533325195, "p90": 4.3167774200439455, "max": 11.81512451171875, "pos_frac": 0.75, "sample": [0.3788414001464844, 1.9550743103027344, -0.39879798889160156, 1.7664794921875, 3.5948944091796875, 4.020788192749023, -0.36830902099609375, 0.4337005615234375, 1.8146171569824219, 3.885223388671875, 2.076202392578125, 4.352081298828125, 1.867523193359375, 0.2715301513671875, 0.290283203125, 0.3680896759033203, 0.029354095458984375, 1.57427978515625, -0.390625, -2.850099563598633, 2.6178054809570312, -0.9185905456542969, 0.42679595947265625, 3.8402252197265625, -0.7138252258300781, 11.81512451171875, 2.3765335083007812, 1.2576179504394531, -0.8737850189208984, 4.598785400390625, 0.12943267822265625, 2.009490966796875, 1.016336441040039, 0.812286376953125, 4.4296722412109375, -0.32377052307128906, 3.6313705444335938, 0.8701934814453125, -1.97442626953125, 2.618804931640625, 2.681539535522461, 2.944774627685547, 6.922454833984375, 7.407835006713867, 0.986572265625, 0.04096031188964844, 0.21099853515625, 3.26495361328125, 4.234401702880859, -3.464935302734375, -0.854949951171875, 2.5451297760009766, -0.0749969482421875, 0.13192367553710938, 0.4628257751464844, -4.028221130371094, 1.8119449615478516, -0.4205131530761719, -3.1705150604248047, -4.092193603515625, 4.6407012939453125, 0.8481330871582031, 1.4138450622558594, 1.8096942901611328], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000089.npy"} +{"epoch": 0.1345427059712774, "step": 90, "batch_size": 64, "mean": 1.2766653299331665, "std": 2.5911195278167725, "min": -5.8450927734375, "p10": -1.8805053710937498, "median": 1.0194940567016602, "p90": 4.1011207580566404, "max": 6.8856658935546875, "pos_frac": 0.734375, "sample": [-0.9784336090087891, 3.0704593658447266, 0.9577903747558594, 2.299365997314453, 3.72723388671875, 0.2428760528564453, 3.0805110931396484, 6.8125457763671875, -3.44219970703125, -5.8450927734375, 3.4293594360351562, 3.523571014404297, 3.285593032836914, 0.9359512329101562, 2.919769287109375, -0.94683837890625, 1.5301971435546875, 5.9805450439453125, -1.9149932861328125, 0.9281349182128906, 4.060569763183594, -1.0675582885742188, 6.8856658935546875, 3.8660354614257812, 6.2433013916015625, 1.0957164764404297, 0.6933822631835938, 3.771514892578125, 0.5324325561523438, 0.646697998046875, 0.6739425659179688, -0.4766845703125, 1.8468303680419922, 6.8568115234375, 1.3228302001953125, 4.118499755859375, -2.8056411743164062, -1.1083450317382812, 4.154777526855469, 1.8438873291015625, -1.6039657592773438, 1.0837249755859375, 2.25933837890625, -1.8000335693359375, 4.032989501953125, 0.17098617553710938, 0.8355140686035156, 0.4187602996826172, 0.039081573486328125, -0.14879226684570312, -3.2316017150878906, 1.5113372802734375, 2.620208740234375, -0.069091796875, 0.4413337707519531, 1.081197738647461, 0.5003128051757812, -3.1385955810546875, -2.0460891723632812, 2.2645492553710938, 1.8906021118164062, 2.173614501953125, -0.6507854461669922, 0.32097434997558594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000090.npy"} +{"epoch": 0.1360544217687075, "step": 91, "batch_size": 64, "mean": 1.169396162033081, "std": 2.821866512298584, "min": -6.123172760009766, "p10": -1.7575971603393554, "median": 0.9079208374023438, "p90": 4.282357025146484, "max": 12.16522216796875, "pos_frac": 0.640625, "sample": [3.629180908203125, 4.100898742675781, 1.2392349243164062, -1.707986831665039, 0.36922454833984375, 6.49835205078125, 0.3733406066894531, 2.0164718627929688, 3.1577720642089844, 6.712425231933594, 12.16522216796875, -0.8190155029296875, 1.3313312530517578, -1.286001205444336, 1.9052734375, -1.5169353485107422, -0.7111968994140625, -0.49383544921875, 2.5279541015625, -3.5096511840820312, 1.9420623779296875, 3.487621307373047, 0.899444580078125, 0.24493026733398438, 2.0263519287109375, 2.158140182495117, 3.242136001586914, -1.7659530639648438, -2.659393310546875, 3.427459716796875, 1.0798416137695312, -1.7902488708496094, -2.5545501708984375, 1.2966346740722656, 4.76069450378418, -0.5517082214355469, -0.727691650390625, 2.7611923217773438, -0.8601608276367188, -6.123172760009766, 2.6857070922851562, 0.9163970947265625, -2.1646499633789062, -1.56939697265625, 0.4055309295654297, 0.5548591613769531, 0.584442138671875, 5.170738220214844, 2.3618125915527344, 1.4632949829101562, -0.42626190185546875, -1.7381000518798828, -0.07196998596191406, 0.022504806518554688, 4.298831939697266, 3.37060546875, 5.6443023681640625, -0.010028839111328125, 4.243915557861328, 2.129596710205078, -1.5321807861328125, -0.0028057098388671875, 1.7930068969726562, 0.43551063537597656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000091.npy"} +{"epoch": 0.13756613756613756, "step": 92, "batch_size": 64, "mean": 1.5875178575515747, "std": 3.1924126148223877, "min": -4.975597381591797, "p10": -1.5001630783081055, "median": 0.8249931335449219, "p90": 5.796308326721192, "max": 11.5400390625, "pos_frac": 0.65625, "sample": [2.8046951293945312, -0.7543430328369141, -3.4070205688476562, 0.09283447265625, -0.828948974609375, -0.8525772094726562, 0.08077621459960938, 0.6145534515380859, 1.0416030883789062, -0.9854354858398438, -1.4250907897949219, 1.4979934692382812, 3.6979217529296875, -2.1887969970703125, 5.04163932800293, 2.5085296630859375, 2.10064697265625, -0.1339893341064453, 5.622556686401367, 0.5456504821777344, 3.430419921875, -0.453643798828125, 1.4972610473632812, 0.9468231201171875, 4.7283172607421875, -0.3521919250488281, -3.5347747802734375, 1.3707504272460938, -4.085319519042969, 2.9640579223632812, -1.4793949127197266, 2.7294235229492188, 6.444244384765625, 0.6426010131835938, 3.7839202880859375, 0.7031631469726562, 0.08341217041015625, 4.0948486328125, -3.7627105712890625, 2.814228057861328, -0.08889007568359375, -0.12104415893554688, 5.8707733154296875, 2.8791427612304688, 2.2178211212158203, -1.509063720703125, 4.733612060546875, 6.439666748046875, 4.062416076660156, -1.25286865234375, -0.2802467346191406, 10.09478759765625, 1.2651290893554688, -0.013048171997070312, 4.4222412109375, -4.975597381591797, 11.5400390625, 4.230155944824219, 0.4937114715576172, 6.8985595703125, 6.059352874755859, 0.6964607238769531, 0.46417236328125, -0.1647796630859375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000092.npy"} +{"epoch": 0.13907785336356765, "step": 93, "batch_size": 64, "mean": 0.9775991439819336, "std": 3.2234745025634766, "min": -5.372093200683594, "p10": -2.5484851837158202, "median": 0.33251380920410156, "p90": 4.847383880615235, "max": 13.516357421875, "pos_frac": 0.625, "sample": [0.9146251678466797, 3.2082862854003906, 4.7377471923828125, 3.8365821838378906, -2.3106536865234375, 3.5188446044921875, -2.031585693359375, -1.1616287231445312, -0.29305458068847656, 2.6035003662109375, 1.1191864013671875, 2.4875621795654297, 13.516357421875, 0.34814453125, -0.22920989990234375, 0.14214515686035156, 0.20440673828125, 3.2342681884765625, -0.7621326446533203, -5.372093200683594, 2.3387603759765625, 7.8469696044921875, -2.2976913452148438, 0.069091796875, 2.4841079711914062, -0.19291114807128906, 4.1400146484375, -0.09701728820800781, -1.9218311309814453, 1.609954833984375, -0.818328857421875, 0.06943702697753906, -0.5784626007080078, 5.487213134765625, -1.1013565063476562, -1.7099990844726562, 0.25229644775390625, 0.18346786499023438, -5.3426055908203125, -0.350677490234375, 1.0188560485839844, 0.2563667297363281, 2.069967269897461, 1.6693363189697266, 1.4467964172363281, -2.7429580688476562, 0.5845928192138672, 0.3168830871582031, 5.6102294921875, 1.1795425415039062, 4.705879211425781, 1.6392250061035156, 4.894371032714844, 2.36627197265625, -2.351837158203125, -2.632762908935547, 5.2552032470703125, -5.2469940185546875, -3.5571517944335938, 5.331825256347656, 4.118255615234375, -3.541778564453125, -0.3851165771484375, 2.7796096801757812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000093.npy"} +{"epoch": 0.14058956916099774, "step": 94, "batch_size": 64, "mean": 1.8636175394058228, "std": 4.0619306564331055, "min": -10.477210998535156, "p10": -1.3188224792480465, "median": 1.902017593383789, "p90": 5.873636627197267, "max": 14.723617553710938, "pos_frac": 0.765625, "sample": [3.9861373901367188, 0.4071197509765625, 1.1085586547851562, 3.442596435546875, 1.3061561584472656, -8.512069702148438, 0.10937690734863281, 0.6629238128662109, 1.654205322265625, 2.526641845703125, 0.6429119110107422, 6.079620361328125, 2.173553466796875, -8.659477233886719, 2.228546142578125, 5.038265228271484, -1.8366813659667969, -0.4215984344482422, 5.50140380859375, 2.1167373657226562, 2.5924606323242188, 2.60284423828125, 3.2546768188476562, 1.9585533142089844, 2.3878173828125, 0.8909168243408203, 0.42257118225097656, 0.8502578735351562, -3.2086257934570312, 3.7148971557617188, 3.4965572357177734, -0.9266681671142578, 0.3373298645019531, -0.0575714111328125, 3.2156829833984375, 3.243255615234375, 3.927154541015625, 2.6083984375, 3.5292091369628906, 0.239501953125, 6.302925109863281, 6.033164978027344, -0.012256622314453125, 13.004913330078125, 4.408527374267578, 4.276153564453125, -1.04046630859375, 10.637664794921875, 4.0709228515625, 2.460855484008789, 14.723617553710938, 0.8186359405517578, -0.36829376220703125, -0.8787574768066406, 1.9345760345458984, 0.5172023773193359, -10.477210998535156, 1.8694591522216797, 9.162918090820312, 1.740457534790039, 0.12013626098632812, -1.4381179809570312, -2.5202693939208984, -0.7093887329101562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000094.npy"} +{"epoch": 0.1421012849584278, "step": 95, "batch_size": 64, "mean": 1.5943739414215088, "std": 3.4581985473632812, "min": -5.9072723388671875, "p10": -2.7065475463867186, "median": 1.230173110961914, "p90": 6.4127143859863285, "max": 8.943618774414062, "pos_frac": 0.609375, "sample": [5.908111572265625, -2.7916183471679688, 1.4975738525390625, -0.6040992736816406, -2.5080490112304688, -0.2733268737792969, 8.943618774414062, 0.687103271484375, 2.8069534301757812, 1.523590087890625, -0.8708648681640625, 1.368927001953125, 1.274017333984375, -0.2961540222167969, -0.32967376708984375, 0.773956298828125, -3.6398468017578125, -2.1317062377929688, -0.3536052703857422, 1.5550956726074219, 7.93695068359375, 6.391838073730469, -0.17929840087890625, 1.0900039672851562, -5.31494140625, -0.9918975830078125, 8.24169921875, 7.136962890625, -3.2425079345703125, -5.9072723388671875, 2.2764129638671875, 6.594062805175781, 1.1863288879394531, 2.6711196899414062, -0.8314838409423828, 1.0964279174804688, 5.915283203125, -1.7644500732421875, -3.2883834838867188, 2.3196258544921875, 3.2910003662109375, 0.4881591796875, 5.853584289550781, 2.7771224975585938, -2.8415985107421875, 5.0101165771484375, 4.6644287109375, -0.11115074157714844, 2.120555877685547, 6.33660888671875, -0.47016143798828125, 4.427734375, -0.6175365447998047, 3.6053085327148438, 5.013580322265625, 8.294891357421875, -1.6527938842773438, -0.068817138671875, 1.3703136444091797, 3.6982345581054688, 0.4797935485839844, 2.137868881225586, 6.421661376953125, -2.065458297729492], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000095.npy"} +{"epoch": 0.1436130007558579, "step": 96, "batch_size": 64, "mean": 1.87106192111969, "std": 4.5902509689331055, "min": -7.760040283203125, "p10": -2.3937103271484372, "median": 1.2171096801757812, "p90": 7.995709228515626, "max": 15.927825927734375, "pos_frac": 0.65625, "sample": [3.1235618591308594, -2.5241775512695312, 8.050262451171875, -0.50726318359375, 12.357162475585938, -7.760040283203125, 3.971038818359375, 0.03275299072265625, 2.7071151733398438, 0.78582763671875, 5.1302947998046875, -0.6101322174072266, 1.2855911254882812, 10.54156494140625, 2.9048538208007812, 2.009429931640625, -5.5122222900390625, -0.0128021240234375, 0.9464225769042969, -0.6854972839355469, 1.9904365539550781, 2.7436065673828125, 7.8695220947265625, -5.539054870605469, 0.8336029052734375, 0.7106742858886719, 5.283660888671875, -0.42337799072265625, -1.8587799072265625, -0.04192352294921875, 2.2433738708496094, 8.049789428710938, 15.927825927734375, 5.640625, -1.0285835266113281, -2.0892868041992188, -7.44683837890625, 0.34754180908203125, -3.2205963134765625, 1.7100028991699219, 3.458160400390625, 1.1486282348632812, 1.7750492095947266, -0.15508651733398438, 13.243209838867188, -1.871337890625, 3.7672863006591797, 0.0198822021484375, 1.5869712829589844, -0.5827865600585938, 3.9555282592773438, -1.5084724426269531, 0.5976696014404297, 7.127433776855469, 10.479415893554688, 2.8953933715820312, -1.2763423919677734, 0.5222244262695312, 1.438720703125, 3.6819915771484375, 7.07916259765625, 1.7342605590820312, -1.7100868225097656, -5.594871520996094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000096.npy"} +{"epoch": 0.14512471655328799, "step": 97, "batch_size": 64, "mean": 1.045839548110962, "std": 5.064228534698486, "min": -17.4052734375, "p10": -2.909008026123047, "median": 0.8999090194702148, "p90": 6.244076919555669, "max": 17.957611083984375, "pos_frac": 0.640625, "sample": [-10.226959228515625, -1.5615119934082031, 0.2846794128417969, 7.293079376220703, 0.8898143768310547, 13.005424499511719, -2.9242401123046875, -3.58990478515625, -2.43096923828125, -17.4052734375, -2.844766616821289, -0.876708984375, 0.7191696166992188, 2.7758140563964844, -3.7906875610351562, -8.941688537597656, 0.11376571655273438, 1.0743274688720703, 3.2939300537109375, 0.37793731689453125, 1.0932788848876953, 3.283294677734375, 1.4883899688720703, -2.3862571716308594, 3.38018798828125, -1.0683364868164062, -0.9678077697753906, 5.110862731933594, -1.5043449401855469, 10.781425476074219, 0.7985382080078125, -2.7703399658203125, 3.3030319213867188, 0.4446544647216797, 0.910003662109375, 4.436470031738281, 7.872337341308594, 6.729740142822266, -0.9628868103027344, 4.15948486328125, 3.1210250854492188, -5.318511962890625, 17.957611083984375, 2.4318580627441406, 3.2027053833007812, -1.6304988861083984, 3.2224254608154297, 4.1353607177734375, 10.20526123046875, -2.8734664916992188, 0.0939483642578125, 2.2752914428710938, 1.28607177734375, -1.794830322265625, -1.5370407104492188, 3.5360794067382812, 3.855813980102539, -2.0232696533203125, 2.7524795532226562, 1.9717178344726562, 1.0111274719238281, 0.11392974853515625, 2.657093048095703, -1.085409164428711], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000097.npy"} +{"epoch": 0.14663643235071808, "step": 98, "batch_size": 64, "mean": 0.7058207988739014, "std": 3.2831475734710693, "min": -9.230621337890625, "p10": -2.8356441497802733, "median": 1.1394624710083008, "p90": 5.128139495849611, "max": 6.86993408203125, "pos_frac": 0.65625, "sample": [0.11029815673828125, 1.5134258270263672, 5.432146072387695, 1.1428451538085938, 2.128692626953125, 2.223926544189453, 1.9545745849609375, 1.8244667053222656, -1.0188751220703125, 6.633888244628906, -9.040695190429688, -3.1966800689697266, -1.65771484375, -1.4462051391601562, -2.6466064453125, 0.4438018798828125, -0.44315338134765625, 2.1633033752441406, 1.1360797882080078, -0.6615447998046875, 3.4724388122558594, 5.885780334472656, -3.6289825439453125, 5.32208251953125, 0.7209186553955078, -2.2413272857666016, 3.7767562866210938, 0.6473045349121094, 1.5967464447021484, 1.1481742858886719, 2.3037796020507812, 1.3984527587890625, 5.7364654541015625, 2.518035888671875, -2.9166603088378906, 1.4302291870117188, 1.3370590209960938, 2.8791046142578125, 0.6545124053955078, -0.28868865966796875, 2.4272689819335938, 0.489471435546875, -7.959541320800781, 1.4619102478027344, -0.8874969482421875, -3.4388294219970703, 1.8366222381591797, 1.0707149505615234, -1.7480316162109375, 5.459999084472656, -1.9233207702636719, 4.675605773925781, -1.4270591735839844, -2.024066925048828, -9.230621337890625, 3.411651611328125, 2.1413307189941406, 0.21646499633789062, 0.7931861877441406, 6.86993408203125, 3.1522560119628906, 4.1782379150390625, -0.1986846923828125, -2.522624969482422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000098.npy"} +{"epoch": 0.14814814814814814, "step": 99, "batch_size": 64, "mean": 1.009109377861023, "std": 4.642709732055664, "min": -12.619537353515625, "p10": -3.8707000732421872, "median": 0.865081787109375, "p90": 6.596235656738282, "max": 14.79449462890625, "pos_frac": 0.625, "sample": [8.893165588378906, 7.798376083374023, 6.4443817138671875, 11.138298034667969, 0.21377182006835938, -4.055355072021484, -0.6283683776855469, -1.7186355590820312, 1.4207534790039062, 6.7859039306640625, 2.65948486328125, 1.257568359375, 2.1368370056152344, 4.781551361083984, -0.4382801055908203, 0.9433441162109375, 1.1450309753417969, 0.0016803741455078125, -1.2159233093261719, 1.5629291534423828, 6.26776123046875, -0.07501602172851562, -5.7080841064453125, -2.3772506713867188, -5.6427764892578125, -3.439838409423828, 14.79449462890625, -9.522445678710938, -2.4228286743164062, 6.66131591796875, 1.8756141662597656, -2.665252685546875, -0.5927467346191406, 0.5213241577148438, 0.7722206115722656, 1.2308120727539062, 1.2293128967285156, -3.1007747650146484, 0.057544708251953125, 5.478679656982422, 1.1154060363769531, -12.619537353515625, 5.510429382324219, 11.11651611328125, -0.6220626831054688, 1.4215888977050781, 5.6082763671875, 0.7868194580078125, -8.055252075195312, 1.2709808349609375, -0.4212493896484375, 3.4405555725097656, 2.144287109375, 0.6491050720214844, 2.7943878173828125, 0.097381591796875, -0.00682830810546875, 4.472892761230469, 1.6967887878417969, -1.211151123046875, 1.3208694458007812, -2.3239288330078125, -1.7760086059570312, -4.295845031738281], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000099.npy"} +{"epoch": 0.14965986394557823, "step": 100, "batch_size": 64, "mean": 1.4694781303405762, "std": 6.184628486633301, "min": -16.671005249023438, "p10": -3.9044868469238274, "median": 0.9725379943847656, "p90": 7.187139892578127, "max": 25.899749755859375, "pos_frac": 0.671875, "sample": [1.1126708984375, -2.114990234375, -4.154167175292969, 2.9047622680664062, 7.3709869384765625, -1.0268630981445312, 0.5130329132080078, 3.5949649810791016, 6.157478332519531, 3.696075439453125, 1.6911163330078125, 1.5666732788085938, 4.208030700683594, 12.535881042480469, 1.3710479736328125, 4.310089111328125, -0.5811538696289062, 1.6408195495605469, 0.7186012268066406, 0.6840667724609375, 0.4906272888183594, 0.49501800537109375, -5.5247039794921875, 0.7679901123046875, -4.437408447265625, 4.783576965332031, -1.5024585723876953, 8.588302612304688, 1.2071456909179688, -14.344085693359375, -0.5830917358398438, -0.477752685546875, -2.8433609008789062, 1.0203857421875, 0.7813644409179688, -0.4779510498046875, 3.2182159423828125, 0.4580841064453125, -12.931732177734375, 5.858678817749023, 0.5592803955078125, 18.660369873046875, -4.3408355712890625, 0.9246902465820312, -1.5607643127441406, -0.2735023498535156, 2.866119384765625, 1.2078533172607422, -1.1142024993896484, -0.9321937561035156, 6.7581634521484375, 8.820755004882812, -1.2041778564453125, 2.9710121154785156, 1.9993896484375, 1.6942901611328125, -3.3218994140625, 11.829360961914062, 4.560997009277344, 1.6490249633789062, 25.899749755859375, 0.49072265625, -16.671005249023438, 1.8274383544921875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000100.npy"} +{"epoch": 0.15117157974300832, "step": 101, "batch_size": 64, "mean": 2.0949583053588867, "std": 4.160855293273926, "min": -11.14349365234375, "p10": -2.014481544494628, "median": 1.5910959243774414, "p90": 7.0200141906738285, "max": 12.855270385742188, "pos_frac": 0.75, "sample": [-0.9290771484375, -0.35228729248046875, 3.5296630859375, 0.3907318115234375, 6.51220703125, 6.9280548095703125, 4.284839630126953, 0.7016105651855469, -0.088348388671875, -0.4316902160644531, 0.60748291015625, 4.0859375, -11.14349365234375, 7.943550109863281, 4.532005310058594, 0.21289825439453125, 4.4496612548828125, 2.3582801818847656, -0.9473323822021484, -3.048145294189453, 3.8652420043945312, 0.46285247802734375, 5.6254425048828125, -1.3812026977539062, 3.9794349670410156, -1.3745803833007812, 4.248634338378906, 3.6597251892089844, 0.7788982391357422, 6.847028732299805, 0.8765754699707031, 10.713226318359375, 5.533269882202148, 0.6816959381103516, -0.4538726806640625, -2.3455047607421875, 1.5489959716796875, -6.78167724609375, -2.285886764526367, 4.5303802490234375, -4.0222625732421875, 4.1594696044921875, 1.3826751708984375, 1.6060447692871094, 7.059425354003906, 2.234130859375, 0.45334625244140625, -8.785079956054688, 0.060787200927734375, 1.5761470794677734, 7.2598876953125, 0.5452804565429688, 7.345502853393555, 3.2345542907714844, 3.7902297973632812, 0.2077484130859375, 12.855270385742188, 2.6599044799804688, -0.7853927612304688, 2.4359169006347656, 5.831695556640625, 3.0384368896484375, 10.250251770019531, 1.3581409454345703], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000101.npy"} +{"epoch": 0.15268329554043839, "step": 102, "batch_size": 64, "mean": 0.8588533401489258, "std": 5.521229267120361, "min": -10.495765686035156, "p10": -4.359429931640625, "median": 0.27520179748535156, "p90": 6.886394119262695, "max": 20.9478759765625, "pos_frac": 0.546875, "sample": [7.1306610107421875, -4.171478271484375, -2.149181365966797, 1.2458953857421875, -6.884696960449219, -1.3811569213867188, -4.2147216796875, 2.7742843627929688, -8.226799011230469, 0.18473434448242188, 2.4821014404296875, 4.009757995605469, -0.06876373291015625, 1.7578659057617188, 6.866668701171875, -3.4848403930664062, -2.3091564178466797, 16.955856323242188, -3.3734359741210938, 10.1083984375, -2.8050670623779297, 1.203481674194336, -2.953094482421875, -0.468780517578125, 2.9730758666992188, 2.8734130859375, 0.8113365173339844, 6.894847869873047, -9.460906982421875, 1.1301403045654297, 6.811637878417969, 1.1740036010742188, -4.42144775390625, 0.5428657531738281, -3.7709884643554688, -1.1327056884765625, 4.21295166015625, 7.442985534667969, 11.984268188476562, -2.9107494354248047, -0.5443058013916016, 1.17547607421875, -10.495765686035156, -0.5930633544921875, -1.4770889282226562, 0.24739456176757812, 0.303009033203125, 5.396575927734375, 0.029554367065429688, -1.5180778503417969, 1.8704795837402344, 5.3220367431640625, 1.971588134765625, -4.552873611450195, -1.5529975891113281, -3.651947021484375, -1.5156936645507812, 20.9478759765625, -3.180431365966797, -7.3017120361328125, 4.090335845947266, 5.545173645019531, 6.025775909423828, 1.0420360565185547], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000102.npy"} +{"epoch": 0.15419501133786848, "step": 103, "batch_size": 64, "mean": 1.5551273822784424, "std": 3.7801764011383057, "min": -6.755027770996094, "p10": -2.749940490722656, "median": 1.1008377075195312, "p90": 6.86798267364502, "max": 10.648368835449219, "pos_frac": 0.640625, "sample": [-3.234943389892578, -0.4770660400390625, 7.48443603515625, -6.755027770996094, 0.07526588439941406, 3.9805259704589844, -1.0367050170898438, -1.289052963256836, 1.1464385986328125, 7.013298034667969, -2.3020858764648438, 2.0686569213867188, -2.4104080200195312, 1.05523681640625, -1.7916717529296875, 5.162006378173828, 2.684429168701172, -0.886444091796875, -5.0516357421875, 5.928459167480469, 1.4458160400390625, 4.340938568115234, 0.08052825927734375, 2.744335174560547, 2.186901092529297, -0.4769935607910156, -0.5427513122558594, 9.2615966796875, -2.8954544067382812, 3.040302276611328, 3.86651611328125, 6.956214904785156, 8.5645751953125, -1.4372787475585938, 0.6866531372070312, 4.3541107177734375, -6.131195068359375, 4.0970458984375, 0.6615982055664062, 0.6530094146728516, 5.566703796386719, 0.9827156066894531, 0.8495845794677734, 2.79254150390625, 3.082134246826172, 0.32977294921875, 6.634674072265625, -2.2143020629882812, 6.662107467651367, -0.22631454467773438, 9.33184814453125, 2.8757095336914062, -4.626979827880859, 1.1978378295898438, -3.7415313720703125, -0.08164215087890625, -1.7701873779296875, -0.616241455078125, -1.0717315673828125, 1.1803092956542969, 3.2577438354492188, 3.3456878662109375, 10.648368835449219, 2.3191604614257812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000103.npy"} +{"epoch": 0.15570672713529857, "step": 104, "batch_size": 64, "mean": 2.33424711227417, "std": 6.462503433227539, "min": -11.941818237304688, "p10": -3.9486373901367178, "median": 1.0258855819702148, "p90": 9.788765335083015, "max": 28.16558837890625, "pos_frac": 0.6875, "sample": [10.49041748046875, 5.4066162109375, 3.9896163940429688, -1.987630844116211, -4.282539367675781, 2.585540771484375, -1.8589534759521484, 0.7619171142578125, 4.6357269287109375, -0.496490478515625, 0.80902099609375, -11.941818237304688, 28.16558837890625, 7.8682403564453125, -6.286674499511719, -2.1183929443359375, 13.6173095703125, 2.0743942260742188, -0.4787406921386719, 7.6134490966796875, -4.899688720703125, -9.856414794921875, 6.708740234375, 7.3028106689453125, 0.348541259765625, -0.6358165740966797, 1.0744972229003906, -7.403694152832031, 5.021638870239258, -0.27921104431152344, 0.49073028564453125, 0.5828952789306641, -0.8511505126953125, 2.4617843627929688, 8.15157699584961, 3.249776840209961, 0.8716812133789062, -1.0737571716308594, 3.7905502319335938, 2.8466720581054688, 1.0531234741210938, -2.773256301879883, 18.209320068359375, 0.5732135772705078, 4.05584716796875, 11.567771911621094, 3.254718780517578, 0.9986476898193359, -9.194862365722656, 0.03131103515625, 1.8443622589111328, 2.9963912963867188, 6.031253814697266, 4.2318878173828125, 1.4410667419433594, -3.1695327758789062, 0.10369873046875, -1.299530029296875, 0.6751556396484375, 0.85418701171875, -2.80364990234375, 6.252632141113281, 12.62078857421875, 15.368507385253906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000104.npy"} +{"epoch": 0.15721844293272866, "step": 105, "batch_size": 64, "mean": 1.8228154182434082, "std": 4.994847774505615, "min": -8.382949829101562, "p10": -4.063740539550781, "median": 1.5084056854248047, "p90": 7.842504119873048, "max": 18.645111083984375, "pos_frac": 0.65625, "sample": [1.6639175415039062, 5.558074951171875, 2.665557861328125, 3.6839447021484375, 1.5898571014404297, 4.95085334777832, -8.382949829101562, 10.43572998046875, -3.55767822265625, 2.5363216400146484, 0.24761581420898438, 3.9841461181640625, -1.5445747375488281, 7.9691925048828125, 0.28125762939453125, 8.063560485839844, -1.1586551666259766, -5.787162780761719, -0.9700965881347656, 4.172149658203125, 3.082569122314453, -2.16796875, 1.55194091796875, -4.2806243896484375, 0.6399993896484375, 4.32476806640625, 1.2542877197265625, -5.694183349609375, 2.8770980834960938, -6.1548614501953125, -2.1813125610351562, 0.9362392425537109, -1.6772003173828125, 1.8228988647460938, -8.253883361816406, 18.645111083984375, 1.4648704528808594, -0.1935577392578125, 1.7053909301757812, 0.019937515258789062, -0.2885475158691406, -1.2585334777832031, 0.0152130126953125, 1.8059844970703125, -5.2056427001953125, 5.100429534912109, 5.1474151611328125, -1.4740943908691406, 6.756317138671875, -2.639923095703125, -2.5643157958984375, 2.3682899475097656, 0.9610309600830078, 10.496879577636719, 14.73284912109375, 0.3200225830078125, 7.225841522216797, 5.651252746582031, -0.2701911926269531, 2.7217884063720703, -0.25634765625, 10.2669677734375, 5.378021240234375, 7.546897888183594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000105.npy"} +{"epoch": 0.15873015873015872, "step": 106, "batch_size": 64, "mean": 1.571278691291809, "std": 5.3349738121032715, "min": -16.962661743164062, "p10": -4.795919036865233, "median": 1.5883302688598633, "p90": 5.909991455078125, "max": 15.68756103515625, "pos_frac": 0.6875, "sample": [-5.2678070068359375, 5.145416259765625, 3.8158016204833984, 5.612560272216797, -6.182929992675781, -0.8056831359863281, 8.815841674804688, 3.0304641723632812, 0.9958229064941406, 1.0547256469726562, 4.223762512207031, 5.813228607177734, 10.599952697753906, 3.5438995361328125, 0.4253520965576172, -3.6948471069335938, 2.0015029907226562, 5.795387268066406, 3.672882080078125, 0.5820159912109375, -0.7549552917480469, 0.42697906494140625, -7.90509033203125, 2.2421798706054688, -0.8655977249145508, -0.3866615295410156, -0.2198505401611328, -3.68865966796875, 1.6641311645507812, 15.4608154296875, -0.7195854187011719, -0.5047359466552734, -2.288360595703125, -2.7419815063476562, 5.316917419433594, 5.61566162109375, 0.7836208343505859, -1.4566478729248047, 5.8567352294921875, 15.68756103515625, 4.2621612548828125, 2.678600311279297, 4.477560043334961, 0.542449951171875, -6.265380859375, 0.8438568115234375, 1.6647701263427734, 1.8552322387695312, -16.962661743164062, 1.5125293731689453, -10.004180908203125, 1.5021820068359375, 4.916770935058594, 4.577299118041992, 5.9328155517578125, 8.484779357910156, 0.8950386047363281, 2.5251941680908203, -0.8213958740234375, 10.572616577148438, -7.912200927734375, 1.6919441223144531, 0.288726806640625, 2.6033077239990234], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000106.npy"} +{"epoch": 0.1602418745275888, "step": 107, "batch_size": 64, "mean": 0.8920239210128784, "std": 6.264650344848633, "min": -18.109878540039062, "p10": -5.148905181884765, "median": 1.5416450500488281, "p90": 7.651882171630861, "max": 18.379562377929688, "pos_frac": 0.65625, "sample": [1.320028305053711, -5.003593444824219, 2.1394195556640625, 0.16146469116210938, 7.11907958984375, 4.045036315917969, -16.552154541015625, 6.886199951171875, -0.463043212890625, 1.691558837890625, -18.109878540039062, 0.05092620849609375, 1.73492431640625, 1.7635955810546875, 3.7877674102783203, -3.984111785888672, -3.5570449829101562, 4.789459228515625, 3.8311290740966797, 1.1197052001953125, -1.5758895874023438, 10.370819091796875, 8.799118041992188, 0.796600341796875, 4.819637298583984, -9.638885498046875, 3.8008193969726562, -2.8255844116210938, -1.8158950805664062, 1.3917312622070312, 3.122394561767578, -7.011787414550781, 2.6806488037109375, 5.897686004638672, 0.9377784729003906, 5.7545013427734375, 6.194183349609375, 1.1062698364257812, 3.4771881103515625, 9.573410034179688, 12.271774291992188, 7.880226135253906, -4.676231384277344, -1.815521240234375, 2.935148239135742, 1.26141357421875, -0.2987403869628906, 3.114044189453125, 2.607532501220703, -11.29302978515625, 8.412590026855469, 3.0733108520507812, -2.1038856506347656, -3.929281234741211, -0.027164459228515625, 1.1866073608398438, 2.0843048095703125, 18.379562377929688, 2.669422149658203, -3.0536727905273438, -5.211181640625, -14.954513549804688, 2.2944183349609375, -2.3428115844726562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000107.npy"} +{"epoch": 0.1617535903250189, "step": 108, "batch_size": 64, "mean": 1.8913304805755615, "std": 5.461851119995117, "min": -12.025543212890625, "p10": -4.865935516357421, "median": 1.792205810546875, "p90": 8.352892303466799, "max": 18.572052001953125, "pos_frac": 0.625, "sample": [2.736663818359375, 4.812522888183594, 10.82025146484375, -0.9724044799804688, -0.48954200744628906, 5.477699279785156, 4.485137939453125, 4.105152130126953, 5.5162353515625, -5.113433837890625, 2.2866134643554688, 6.2897186279296875, 3.870452880859375, -1.3205928802490234, 6.201141357421875, 1.857269287109375, -3.3032073974609375, -0.422821044921875, 0.5502395629882812, 0.8049449920654297, 7.6175537109375, 0.1788482666015625, -0.6681919097900391, 5.334716796875, 0.7646102905273438, -6.54229736328125, 3.3881149291992188, -12.025543212890625, 12.348648071289062, 0.6534042358398438, -9.403472900390625, -1.7977886199951172, 6.92889404296875, -1.1643638610839844, 8.668037414550781, 5.079137802124023, 0.05836677551269531, -0.18626976013183594, -5.921211242675781, 4.93475341796875, -4.071723937988281, 8.848342895507812, 2.5886669158935547, -1.6259517669677734, -0.5547752380371094, 2.342060089111328, -1.619424819946289, 2.837240219116211, 2.0460052490234375, -5.016258239746094, -7.547168731689453, 3.4119033813476562, -4.5151824951171875, 2.370819091796875, 11.404815673828125, 0.15545654296875, 3.6211013793945312, 18.572052001953125, 1.727142333984375, -0.2710113525390625, -0.15266036987304688, 5.568019866943359, -1.0534210205078125, 15.541122436523438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000108.npy"} +{"epoch": 0.16326530612244897, "step": 109, "batch_size": 64, "mean": 2.9811506271362305, "std": 5.444560527801514, "min": -5.265907287597656, "p10": -1.5221111297607421, "median": 1.5270051956176758, "p90": 8.432666778564453, "max": 25.631607055664062, "pos_frac": 0.703125, "sample": [-0.185394287109375, 13.338066101074219, 15.07568359375, 0.6013832092285156, 4.145145416259766, 3.8575782775878906, 6.853008270263672, -0.1302490234375, 2.167356491088867, 4.745151519775391, -0.3233661651611328, 1.2760543823242188, 1.980865478515625, 5.454704284667969, 2.19244384765625, -3.852294921875, 2.619455337524414, 0.4205474853515625, -0.91845703125, 1.165069580078125, 1.4827709197998047, 4.7657928466796875, -4.1195831298828125, -0.2714500427246094, -0.675628662109375, 25.631607055664062, 0.3182487487792969, -0.31191062927246094, 4.002170562744141, 19.43902587890625, 3.940580368041992, 1.4146194458007812, 1.2027969360351562, 0.11313629150390625, 0.21567726135253906, 1.8062686920166016, -1.287576675415039, 5.2349395751953125, -0.9223403930664062, 4.8638458251953125, -1.5377082824707031, 4.019983291625977, 1.3668060302734375, 5.889862060546875, -0.7329311370849609, -1.4857177734375, 0.2548675537109375, 1.5712394714355469, -5.265907287597656, -3.8080062866210938, 1.3348159790039062, 3.6323165893554688, 5.156715393066406, 8.440986633300781, 8.413253784179688, 14.155769348144531, 11.273448944091797, 1.9323577880859375, 5.765892028808594, 3.18310546875, -3.3816680908203125, -0.9865646362304688, -2.22955322265625, 6.5045318603515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000109.npy"} +{"epoch": 0.16477702191987906, "step": 110, "batch_size": 64, "mean": 0.2856212854385376, "std": 5.43139123916626, "min": -19.837081909179688, "p10": -5.482870483398437, "median": 1.0098991394042969, "p90": 6.611803436279299, "max": 13.52337646484375, "pos_frac": 0.578125, "sample": [2.0162487030029297, -0.14231491088867188, -2.9302978515625, 1.3337783813476562, -0.5873031616210938, 6.829353332519531, 3.1343536376953125, -1.2511329650878906, -10.327667236328125, 1.6428146362304688, 5.6611328125, 3.090747833251953, 0.9825286865234375, 6.834098815917969, 0.3515815734863281, -3.0544204711914062, 0.5716552734375, 10.118728637695312, -0.98858642578125, -4.186756134033203, 2.546937942504883, -2.374755859375, 2.053621292114258, 6.10418701171875, 0.390960693359375, 2.8645248413085938, 1.0949382781982422, 1.2770652770996094, 0.7206077575683594, -5.9644622802734375, -3.181934356689453, 1.7091026306152344, 2.3638992309570312, -1.4420509338378906, -5.617919921875, 1.0372695922851562, -5.167755126953125, 4.41815185546875, -1.4087486267089844, 1.7091350555419922, 9.074920654296875, 4.159797668457031, -1.1764984130859375, -2.410736083984375, -0.8834686279296875, 2.7070083618164062, 5.001243591308594, -7.4141845703125, -8.62347412109375, -16.356109619140625, -1.3697357177734375, 1.2853775024414062, -0.6027374267578125, -0.2955169677734375, -0.52337646484375, 13.52337646484375, 8.568485260009766, 3.649202346801758, 1.8232231140136719, 7.59295654296875, -4.207447052001953, 1.3193206787109375, 1.0438995361328125, -19.837081909179688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000110.npy"} +{"epoch": 0.16628873771730915, "step": 111, "batch_size": 64, "mean": 1.982884168624878, "std": 5.283370494842529, "min": -7.403327941894531, "p10": -3.455814743041992, "median": 1.1540231704711914, "p90": 9.58136672973633, "max": 19.589141845703125, "pos_frac": 0.578125, "sample": [-0.8435401916503906, -2.7647266387939453, -0.26514434814453125, 13.052215576171875, 2.186229705810547, 7.8618621826171875, -0.9272727966308594, 3.8350181579589844, 2.0871849060058594, 0.497283935546875, 5.435920715332031, -0.997161865234375, -4.2630462646484375, 2.1780853271484375, -7.1908416748046875, -0.031391143798828125, -0.31853294372558594, 1.1170616149902344, -2.1977920532226562, 2.531373977661133, 9.745193481445312, 5.974212646484375, 11.195327758789062, 9.911457061767578, 12.45428466796875, 4.3493499755859375, 3.826171875, 5.713165283203125, 1.9358444213867188, -7.403327941894531, -0.32041168212890625, -2.6982460021972656, -4.227935791015625, -6.4974212646484375, -0.5170440673828125, -2.683135986328125, 0.10034942626953125, 5.10601806640625, -2.0154781341552734, 5.588573455810547, 9.199104309082031, 8.726417541503906, 9.761817932128906, -1.7128887176513672, -2.0219478607177734, -0.45713233947753906, 2.910186767578125, 9.162857055664062, -2.6881561279296875, 1.1909847259521484, 5.11236572265625, 3.2479095458984375, 3.125894546508789, -2.6761951446533203, -5.8624267578125, 0.4246101379394531, -3.5491104125976562, 3.5312652587890625, -3.2381248474121094, 1.7404670715332031, 19.589141845703125, -1.9222335815429688, 2.3897132873535156, 0.40032958984375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000111.npy"} +{"epoch": 0.16780045351473924, "step": 112, "batch_size": 64, "mean": 2.4087562561035156, "std": 4.812221050262451, "min": -10.323745727539062, "p10": -2.654032707214355, "median": 2.531036376953125, "p90": 8.325587463378907, "max": 13.36334228515625, "pos_frac": 0.734375, "sample": [11.972137451171875, 7.2927703857421875, 9.518203735351562, 3.706714630126953, 0.026582717895507812, 2.5989532470703125, 12.1512451171875, 3.4003448486328125, 5.627677917480469, 2.7848281860351562, 0.5248870849609375, 6.1875, -5.3763580322265625, 2.402719497680664, 1.287832260131836, -7.8591461181640625, -1.7028961181640625, 4.163963317871094, -4.482292175292969, -0.5495834350585938, 3.121490478515625, -2.7630462646484375, 3.125091552734375, 6.138145446777344, 2.4631195068359375, 3.14324951171875, 5.758033752441406, 1.8881454467773438, 13.36334228515625, 3.302267074584961, 7.60302734375, 1.3980026245117188, -2.2447032928466797, 0.7888469696044922, 5.869255065917969, -0.9637908935546875, 2.6019039154052734, -5.516304016113281, 8.217376708984375, 2.855224609375, -1.5042877197265625, 2.3701171875, 4.986461639404297, 2.638479232788086, 2.7718429565429688, 10.518569946289062, 6.0041351318359375, 5.770290374755859, -0.9637222290039062, 0.9880943298339844, -9.1605224609375, 1.9493560791015625, -0.664215087890625, 1.6286849975585938, 8.371963500976562, 1.2897567749023438, 1.6136093139648438, -2.399667739868164, -2.2777633666992188, 4.49310302734375, -0.4563140869140625, -10.323745727539062, 2.0844955444335938, 10.606910705566406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000112.npy"} +{"epoch": 0.1693121693121693, "step": 113, "batch_size": 64, "mean": 1.3757245540618896, "std": 4.64796781539917, "min": -15.223068237304688, "p10": -3.5580572128295893, "median": 1.0273056030273438, "p90": 6.311777114868164, "max": 13.5732421875, "pos_frac": 0.625, "sample": [-2.2716064453125, -6.081306457519531, -2.6900711059570312, 1.0652313232421875, -0.7220268249511719, 6.158535003662109, 2.532012939453125, -8.310577392578125, 0.5997161865234375, 3.914632797241211, 1.4084930419921875, -1.3993721008300781, -3.2562332153320312, 2.6231231689453125, -3.687410354614258, -0.45965576171875, 1.5706253051757812, 9.028671264648438, -0.48078155517578125, -3.7257957458496094, -2.673614501953125, 3.138702392578125, 6.342739105224609, -5.1200714111328125, -0.7197208404541016, 3.63494873046875, 4.735008239746094, 2.7691211700439453, 7.359306335449219, -0.7391681671142578, 3.8992156982421875, 13.5732421875, 0.908203125, -0.25798797607421875, 3.6193084716796875, 7.251279830932617, -15.223068237304688, 2.854696273803711, 6.239532470703125, -1.5231246948242188, 1.5814838409423828, 5.490575790405273, -4.2806396484375, 6.110588073730469, -2.934783935546875, 9.351776123046875, 0.9893798828125, 0.23941993713378906, -0.3545856475830078, 4.601051330566406, 3.0103759765625, -2.8726348876953125, 1.723825454711914, 11.054351806640625, 5.339111328125, -0.0043315887451171875, 3.1841278076171875, 0.5650997161865234, 5.240058898925781, 0.38156890869140625, 0.7367210388183594, 0.31331634521484375, -3.187786102294922, 5.883552551269531], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000113.npy"} +{"epoch": 0.1708238851095994, "step": 114, "batch_size": 64, "mean": 2.356678009033203, "std": 4.733741760253906, "min": -5.8934326171875, "p10": -3.4449796676635733, "median": 1.5496196746826172, "p90": 8.200089263916018, "max": 16.325164794921875, "pos_frac": 0.6875, "sample": [-5.8934326171875, -4.3236541748046875, 1.2827301025390625, 6.433742523193359, 4.424924850463867, 1.5983657836914062, 3.6014060974121094, 7.479949951171875, 4.541389465332031, -2.2570228576660156, -3.763643264770508, 1.1963729858398438, 3.3746261596679688, -2.7014312744140625, -1.1246376037597656, 1.8327178955078125, 3.172679901123047, -0.2077178955078125, 0.46680641174316406, -1.3106803894042969, 2.819629669189453, -2.214569091796875, 16.325164794921875, -2.624134063720703, 0.6773891448974609, 7.040870666503906, 4.421173095703125, 5.414934158325195, 1.157989501953125, 6.5020294189453125, -1.8316173553466797, 1.5008735656738281, 8.508720397949219, 3.2296295166015625, 2.8454742431640625, 0.8676910400390625, 6.729461669921875, 1.7319488525390625, 5.259563446044922, -4.6036224365234375, 16.02203369140625, 7.402082443237305, 5.960968017578125, 0.1885833740234375, 4.93994140625, 1.0118236541748047, 10.8707275390625, -2.2986679077148438, -1.6478919982910156, -3.8335304260253906, 0.5660781860351562, -1.26177978515625, 3.760042190551758, 9.574676513671875, 8.899330139160156, 10.77935791015625, 1.7785453796386719, -0.6675739288330078, -5.06915283203125, -4.266534805297852, 5.682075500488281, -1.657867431640625, 1.3601570129394531, 1.151865005493164], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000114.npy"} +{"epoch": 0.17233560090702948, "step": 115, "batch_size": 64, "mean": 1.943716049194336, "std": 4.36088228225708, "min": -7.922126770019531, "p10": -2.936222076416015, "median": 1.6682519912719727, "p90": 7.339668273925783, "max": 15.117507934570312, "pos_frac": 0.6875, "sample": [-1.5242843627929688, -2.4039344787597656, 4.4298553466796875, -6.0723724365234375, 15.117507934570312, 1.9719600677490234, 3.3685760498046875, 4.503330230712891, 0.6549072265625, 12.903762817382812, 1.9430809020996094, -1.54388427734375, 9.652732849121094, -4.873680114746094, -2.6710891723632812, -3.704132080078125, 0.0718841552734375, 6.9183502197265625, 2.0681915283203125, 2.9273910522460938, 4.63311767578125, 3.7265396118164062, 2.0824356079101562, 0.14133071899414062, -3.3587989807128906, 1.943655014038086, 4.229736328125, 1.5375213623046875, -7.922126770019531, 7.667018890380859, -3.0498504638671875, -0.20490455627441406, 0.5350379943847656, 7.520233154296875, 1.5512313842773438, 4.892173767089844, -0.5037994384765625, 3.576425552368164, -2.494873046875, 2.6076812744140625, 2.646282196044922, -6.127292633056641, 5.802215576171875, 3.832763671875, 10.806930541992188, 2.5395774841308594, 1.3745956420898438, 1.7852725982666016, -0.9055519104003906, 6.12310791015625, 0.7083148956298828, -0.023649215698242188, 6.559364318847656, -0.2994956970214844, 0.5143756866455078, -0.9387092590332031, -2.3159561157226562, -0.8010730743408203, 1.3965377807617188, 1.1876754760742188, 4.329254150390625, 0.4374275207519531, 2.7533493041992188, 10.164566040039062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000115.npy"} +{"epoch": 0.17384731670445955, "step": 116, "batch_size": 64, "mean": 2.8369667530059814, "std": 4.093185901641846, "min": -5.7953948974609375, "p10": -2.077742004394531, "median": 3.138803482055664, "p90": 7.086999511718751, "max": 12.473175048828125, "pos_frac": 0.75, "sample": [6.163036346435547, -2.23681640625, 0.6629295349121094, 8.891807556152344, 5.5355224609375, 4.8623199462890625, 3.9175262451171875, 1.7107295989990234, 5.393178939819336, 7.264122009277344, 5.7799072265625, -2.80999755859375, -5.268943786621094, 10.672866821289062, 0.30710601806640625, -1.0838947296142578, 0.8089256286621094, 0.05603981018066406, 3.798419952392578, 5.872920989990234, -5.112548828125, 1.8838043212890625, 5.520359039306641, 3.256511688232422, -0.2767143249511719, 6.2141876220703125, 5.167655944824219, 6.431358337402344, 5.7529754638671875, 1.628448486328125, 1.3819541931152344, -1.234762191772461, -2.182332992553711, 0.9188499450683594, 10.504501342773438, 0.27646636962890625, 4.2994537353515625, 5.228607177734375, -0.9385757446289062, -1.5323562622070312, 5.8983306884765625, 4.53179931640625, 3.424945831298828, 1.3649368286132812, 12.473175048828125, 4.510231018066406, 10.568084716796875, -4.0235137939453125, 0.9068222045898438, 3.0210952758789062, -0.09343338012695312, 6.221031188964844, 0.603515625, -5.7953948974609375, -0.7524909973144531, 5.990447998046875, -1.4940223693847656, 4.522209167480469, 1.5247020721435547, 9.490036010742188, 6.673713684082031, 0.015035629272460938, 6.332759857177734, -1.8336963653564453], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000116.npy"} +{"epoch": 0.17535903250188964, "step": 117, "batch_size": 64, "mean": 1.9544355869293213, "std": 4.643931865692139, "min": -12.800537109375, "p10": -3.199420166015625, "median": 1.8898420333862305, "p90": 7.392373657226565, "max": 15.841384887695312, "pos_frac": 0.71875, "sample": [0.2425079345703125, 4.944578170776367, 3.9112396240234375, 0.662689208984375, 9.784774780273438, 3.103658676147461, 5.457056045532227, 2.1187305450439453, -2.358612060546875, 4.057592391967773, 0.36817169189453125, -1.8610286712646484, 6.88775634765625, -4.263282775878906, 1.4753799438476562, 3.223236083984375, -3.1805572509765625, 2.8429412841796875, 2.493377685546875, 5.618194580078125, 2.2497406005859375, 3.908550262451172, 4.977386474609375, 2.6424636840820312, -1.419729232788086, -4.932182312011719, 1.5743408203125, -0.5370101928710938, 3.5746726989746094, 10.753067016601562, -1.6185760498046875, 9.507705688476562, 7.595359802246094, 0.04541587829589844, 8.747894287109375, 1.6417999267578125, 4.506540298461914, 8.937294006347656, 0.777801513671875, 6.326484680175781, 2.2782821655273438, -0.5271530151367188, 2.0205345153808594, 3.35284423828125, -1.6500625610351562, -9.861793518066406, 1.7591495513916016, 0.9355239868164062, 2.86126708984375, 4.203277587890625, 1.5160293579101562, -0.1689910888671875, 6.918739318847656, -3.2075042724609375, 15.841384887695312, -6.201530456542969, -3.542461395263672, 1.6520881652832031, -12.800537109375, -0.6812515258789062, 4.855064392089844, 0.6195297241210938, 0.6204471588134766, -0.4964256286621094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000117.npy"} +{"epoch": 0.17687074829931973, "step": 118, "batch_size": 64, "mean": 2.579646110534668, "std": 3.915975570678711, "min": -7.273593902587891, "p10": -2.033713722229004, "median": 2.5141754150390625, "p90": 8.179969787597656, "max": 10.697113037109375, "pos_frac": 0.71875, "sample": [2.3025054931640625, 2.1493301391601562, 4.6886749267578125, -3.8154449462890625, -7.273593902587891, -2.0458908081054688, 5.398368835449219, 2.5608367919921875, 4.760869979858398, -1.3723716735839844, 2.93426513671875, 2.9055938720703125, 1.274862289428711, 7.542457580566406, 0.8878135681152344, -0.6471099853515625, -1.9505462646484375, 5.51507568359375, 0.088531494140625, 0.8270854949951172, -1.5180740356445312, 7.992462158203125, 3.7462825775146484, 5.113983154296875, 2.9270248413085938, -2.512195587158203, 0.19159698486328125, -1.8415756225585938, 4.711893081665039, -0.07166862487792969, 4.174858093261719, 3.0961055755615234, 8.614700317382812, -2.005300521850586, 1.015106201171875, 3.80657958984375, 2.3227386474609375, 10.697113037109375, 8.960372924804688, -3.4822998046875, -1.966756820678711, 7.709686279296875, 0.2410736083984375, 5.5033111572265625, -1.00970458984375, 8.260330200195312, -1.5211029052734375, 8.841781616210938, 3.9364089965820312, 8.804595947265625, 5.15411376953125, 0.5888748168945312, 3.2776641845703125, 10.168506622314453, 6.317806243896484, 1.9919166564941406, -2.261932373046875, 4.3667449951171875, 5.892988204956055, 7.659677505493164, 2.4675140380859375, -2.0633468627929688, 1.1871414184570312, -1.1209640502929688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000118.npy"} +{"epoch": 0.17838246409674982, "step": 119, "batch_size": 64, "mean": 1.887100100517273, "std": 5.470413684844971, "min": -12.98846435546875, "p10": -3.8121557235717773, "median": 1.6371421813964844, "p90": 8.871588134765625, "max": 22.046356201171875, "pos_frac": 0.640625, "sample": [-1.7263240814208984, 4.7105560302734375, -3.6502628326416016, 0.3497581481933594, -3.8815383911132812, -0.2782402038574219, 4.564029693603516, 3.0828857421875, -1.142141342163086, 0.6866645812988281, -4.25225830078125, -0.8289070129394531, 2.3403472900390625, 9.587623596191406, 7.353466033935547, -12.98846435546875, -0.08930206298828125, -3.6439476013183594, 1.077066421508789, 4.4546966552734375, -1.4641056060791016, 5.966646194458008, -2.3455352783203125, 2.665821075439453, 8.824943542480469, 4.4421844482421875, -4.376888275146484, 2.613910675048828, 9.126052856445312, 11.457275390625, 6.8158721923828125, -2.365966796875, 3.673032760620117, 4.315631866455078, 1.4374847412109375, 22.046356201171875, 2.2196788787841797, -0.8372421264648438, 1.0433101654052734, 8.891578674316406, 2.5911026000976562, 7.255889892578125, -2.2024574279785156, 0.3506622314453125, -6.463493347167969, -4.967561721801758, 11.751571655273438, 5.205516815185547, 1.9500503540039062, 4.17816162109375, 0.7489776611328125, -11.478378295898438, -3.40435791015625, -1.3440227508544922, 1.351806640625, 1.8303337097167969, 4.68733024597168, 10.431121826171875, 5.015838623046875, 1.6633529663085938, 2.2417125701904297, 1.610931396484375, -1.68475341796875, -0.42067718505859375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000119.npy"} +{"epoch": 0.17989417989417988, "step": 120, "batch_size": 64, "mean": 2.8084969520568848, "std": 3.9094603061676025, "min": -4.577856063842773, "p10": -1.6987800598144531, "median": 2.0988197326660156, "p90": 6.9882854461669925, "max": 14.332855224609375, "pos_frac": 0.796875, "sample": [2.0145721435546875, 0.48842430114746094, -2.6300430297851562, 6.874095916748047, 4.9279327392578125, 0.712371826171875, 6.0998077392578125, 1.1063804626464844, 0.8398590087890625, -4.274940490722656, 7.806304931640625, 1.9075698852539062, 3.220304489135742, 3.6695289611816406, 3.799224853515625, 12.87310791015625, 3.9720916748046875, -0.22874832153320312, 2.1830673217773438, 5.009635925292969, 5.944709777832031, -1.6513824462890625, 5.014656066894531, 2.8134193420410156, 1.544708251953125, 1.6229057312011719, 7.037223815917969, 0.5257186889648438, 5.6749725341796875, 5.1927490234375, 14.332855224609375, -1.7190933227539062, 9.718559265136719, -1.0140380859375, 8.643341064453125, 0.2607269287109375, 1.8367958068847656, 0.6727771759033203, 6.150516510009766, -2.3082656860351562, 0.0040378570556640625, 2.484691619873047, 1.4805374145507812, 12.760009765625, -1.2552528381347656, -1.8459930419921875, -4.577856063842773, 6.4333648681640625, 4.46533203125, 0.6776046752929688, 0.13923072814941406, 0.5200290679931641, 6.099822998046875, 0.9314956665039062, 3.397157669067383, -0.349517822265625, 2.3740234375, 4.2926177978515625, -1.4775447845458984, -3.2339553833007812, 5.1298370361328125, 2.0144271850585938, 5.753711700439453, 2.861602783203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000120.npy"} +{"epoch": 0.18140589569160998, "step": 121, "batch_size": 64, "mean": 3.0093839168548584, "std": 5.031066417694092, "min": -4.327217102050781, "p10": -1.553898239135742, "median": 1.7978343963623047, "p90": 9.130072021484379, "max": 21.8310546875, "pos_frac": 0.734375, "sample": [1.2792510986328125, 14.251800537109375, 0.41944122314453125, -1.9042472839355469, 5.938892364501953, 14.6915283203125, 8.06020736694336, -1.8919544219970703, 1.7633018493652344, 4.755332946777344, -0.7770843505859375, -1.6015548706054688, 12.708969116210938, 3.3076553344726562, -0.0098114013671875, 0.6028690338134766, 5.023820877075195, -0.12189483642578125, 5.289398193359375, -4.327217102050781, 9.548065185546875, -0.20607757568359375, 6.7255859375, 3.31414794921875, 4.6377105712890625, 2.5275192260742188, 1.8587417602539062, -2.6174869537353516, 2.8455047607421875, 1.8422203063964844, -1.0273818969726562, 21.8310546875, 2.1480331420898438, 2.8064727783203125, 0.6336898803710938, -0.0160064697265625, -0.1075439453125, 1.5129013061523438, 2.781982421875, 0.439422607421875, -0.04100990295410156, 0.25630760192871094, 3.17364501953125, 5.46466064453125, 0.532867431640625, 2.06121826171875, -3.760650634765625, 16.33484649658203, -0.350433349609375, 2.4509334564208984, 1.832366943359375, 1.4373130798339844, 2.4944114685058594, 4.2905426025390625, 0.7395591735839844, 15.729248046875, 1.4042186737060547, -1.4426994323730469, 0.8611354827880859, 0.5604476928710938, 0.20336532592773438, 3.6105117797851562, 8.154754638671875, -2.334249496459961], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000121.npy"} +{"epoch": 0.18291761148904007, "step": 122, "batch_size": 64, "mean": 2.706878662109375, "std": 5.7016520500183105, "min": -6.7715606689453125, "p10": -3.55466194152832, "median": 1.6712493896484375, "p90": 9.224069976806646, "max": 22.613845825195312, "pos_frac": 0.6875, "sample": [22.613845825195312, -3.389373779296875, 0.4825439453125, 6.965641021728516, -4.2012786865234375, -2.4381351470947266, 13.70404052734375, 9.776176452636719, -0.6279201507568359, 6.090192794799805, 4.574459075927734, 1.774444580078125, 0.43114471435546875, 2.607452392578125, 0.6684246063232422, 16.0257568359375, -2.828338623046875, 2.8434982299804688, -4.900249481201172, 6.449745178222656, 0.9463863372802734, 11.422365188598633, 4.74493408203125, 5.5786590576171875, 7.935821533203125, 6.3566741943359375, -2.4486255645751953, -3.625499725341797, 4.571624755859375, 4.974540710449219, -6.7715606689453125, 5.00634765625, -0.4687690734863281, -2.4883575439453125, -4.598564147949219, 4.1140594482421875, 2.0757408142089844, -0.8942184448242188, 3.073793411254883, -0.37378692626953125, -0.8975486755371094, 0.29717254638671875, -4.014957427978516, 12.043411254882812, -2.8970565795898438, 5.529199600219727, 1.90618896484375, 1.56805419921875, -0.2785186767578125, 1.5403289794921875, 1.8340988159179688, 1.5555057525634766, 0.2616119384765625, 1.03851318359375, -4.067359924316406, 2.9420108795166016, 0.5472564697265625, -0.5955238342285156, 0.00737762451171875, 6.218231201171875, 4.06024169921875, 5.067394256591797, 2.603790283203125, 21.217178344726562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000122.npy"} +{"epoch": 0.18442932728647016, "step": 123, "batch_size": 64, "mean": 2.6472043991088867, "std": 4.500986576080322, "min": -7.583160400390625, "p10": -1.9911159515380858, "median": 2.0584545135498047, "p90": 7.860216903686524, "max": 19.29534912109375, "pos_frac": 0.6875, "sample": [7.639728546142578, 6.7491912841796875, 2.0046615600585938, 19.29534912109375, -4.705015182495117, -1.4989204406738281, 2.6740074157714844, 0.96661376953125, 11.367591857910156, 5.287147521972656, 1.3683013916015625, 8.763397216796875, -0.014614105224609375, -1.7764739990234375, 6.0827789306640625, 6.674446105957031, 2.817800521850586, 3.7937145233154297, -0.6109428405761719, 8.083633422851562, 2.0306930541992188, 7.5858306884765625, 1.747467041015625, 7.506999969482422, 4.308158874511719, 11.159713745117188, 2.8782806396484375, -2.0158042907714844, 6.842315673828125, 2.46484375, 1.1529541015625, 11.363372802734375, -1.9060249328613281, 6.209699630737305, -0.6771965026855469, -5.3112945556640625, 2.1464004516601562, -2.1986827850341797, -0.39536476135253906, 1.6741046905517578, 1.6557998657226562, -1.9335098266601562, 2.0862159729003906, -0.38292694091796875, 1.7730579376220703, 6.42926025390625, -0.4032745361328125, -1.5644454956054688, 1.1509151458740234, 5.448883056640625, -1.5620574951171875, 2.7065505981445312, 1.5542068481445312, 2.8346099853515625, -7.583160400390625, 7.9547119140625, -0.7917881011962891, 2.113971710205078, -2.3478240966796875, 2.5247573852539062, 1.3567962646484375, 2.5502052307128906, 4.515350341796875, -2.194091796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000123.npy"} +{"epoch": 0.18594104308390022, "step": 124, "batch_size": 64, "mean": 3.655543327331543, "std": 4.830419540405273, "min": -4.813220977783203, "p10": -2.4520959854125977, "median": 3.4974632263183594, "p90": 10.08660125732422, "max": 16.235855102539062, "pos_frac": 0.765625, "sample": [-1.2772064208984375, 16.235855102539062, 5.046669006347656, -4.251567840576172, 4.38865852355957, 3.941925048828125, 16.011123657226562, 5.610691070556641, 12.934783935546875, 11.255783081054688, 7.560005187988281, 7.481109619140625, 1.4367084503173828, 12.989242553710938, 1.1098823547363281, 2.349170684814453, 2.1250228881835938, 6.116350173950195, 1.2361946105957031, -2.1912269592285156, -3.419647216796875, 3.5464324951171875, 3.6125717163085938, 1.6228561401367188, 2.3836898803710938, 4.476932525634766, 1.5197391510009766, -0.4840240478515625, -4.4716644287109375, -3.032440185546875, 4.522495269775391, 4.794952392578125, -2.4759368896484375, 9.628860473632812, 4.777713775634766, 8.742156982421875, 12.161895751953125, -3.6838226318359375, 7.327568054199219, 3.2342681884765625, 0.9437179565429688, 8.308525085449219, -0.8767852783203125, 4.572898864746094, 2.9714088439941406, 3.9671783447265625, 2.0134124755859375, 7.0423126220703125, -2.3964672088623047, 4.207643508911133, 10.28277587890625, 1.3883094787597656, 0.09893608093261719, 3.4273948669433594, 3.3383331298828125, 3.799530029296875, 3.4484939575195312, -1.5465621948242188, -4.813220977783203, 5.2022247314453125, -0.4563331604003906, 5.194248199462891, -0.51165771484375, 9.454681396484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000124.npy"} +{"epoch": 0.1874527588813303, "step": 125, "batch_size": 64, "mean": 3.1614742279052734, "std": 5.155557632446289, "min": -7.190940856933594, "p10": -3.093415069580078, "median": 2.928802490234375, "p90": 9.17966594696045, "max": 21.60491943359375, "pos_frac": 0.75, "sample": [-0.5500335693359375, 7.539085388183594, 6.445751190185547, 2.85107421875, 0.5734634399414062, -1.1698646545410156, 11.5372314453125, 0.12900924682617188, 6.725341796875, 3.5422611236572266, 21.60491943359375, -4.212852478027344, 0.6890029907226562, 3.740814208984375, 2.207956314086914, 9.273239135742188, 9.416976928710938, 3.7216949462890625, 3.2574462890625, -1.5864028930664062, 8.961328506469727, 0.6869010925292969, 3.7402267456054688, 3.9749069213867188, -1.0334243774414062, 2.087472915649414, 7.80419921875, -3.7620487213134766, -0.7159652709960938, 0.23838043212890625, 8.745407104492188, 4.539192199707031, 1.50921630859375, 12.3265380859375, 6.430295944213867, -3.370494842529297, 5.472373962402344, 1.5583267211914062, 11.5927734375, 16.551055908203125, 6.4981689453125, 3.00653076171875, 6.2764739990234375, 5.046810150146484, 3.2481117248535156, -7.190940856933594, -0.22174072265625, 8.097915649414062, 0.7712478637695312, 1.0446910858154297, 3.3062744140625, 3.2406349182128906, 4.579036712646484, 2.3120193481445312, -2.4439620971679688, 4.067913055419922, 0.865753173828125, -3.0973129272460938, 1.223114013671875, -0.6049728393554688, 2.3376102447509766, -3.2506332397460938, -6.766838073730469, -3.084320068359375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000125.npy"} +{"epoch": 0.1889644746787604, "step": 126, "batch_size": 64, "mean": 1.7327555418014526, "std": 4.637869358062744, "min": -10.211334228515625, "p10": -3.027105712890625, "median": 2.0277891159057617, "p90": 6.480863189697266, "max": 15.269760131835938, "pos_frac": 0.640625, "sample": [3.3634510040283203, 0.3996410369873047, 6.2794342041015625, 2.771657943725586, 0.03695487976074219, 6.454196929931641, 6.454261779785156, 0.12509918212890625, 3.4224090576171875, -2.306640625, 6.10406494140625, 6.4922637939453125, -9.380409240722656, 1.0276641845703125, 6.143836975097656, 2.1076717376708984, -2.5420150756835938, -2.0078048706054688, -0.2741737365722656, -3.665576934814453, 2.647186279296875, 6.5690765380859375, 1.313638687133789, 3.13999080657959, -1.3086719512939453, -0.29225921630859375, 4.952095031738281, -5.37322998046875, -2.9933853149414062, -1.8813610076904297, 0.17081451416015625, -3.0415573120117188, -2.494882583618164, 3.385641098022461, -4.323141098022461, -1.2839431762695312, -2.3875865936279297, 15.269760131835938, 4.581611633300781, -10.211334228515625, 4.299888610839844, 3.5812911987304688, 3.692808151245117, 5.789005279541016, 5.071022033691406, 5.471900939941406, 7.368431091308594, 13.34002685546875, -0.4633216857910156, 1.947906494140625, 0.5918693542480469, 7.7910003662109375, 3.2427101135253906, 3.679523468017578, 1.6799392700195312, -1.2982254028320312, -2.7164154052734375, 5.455835342407227, -1.87017822265625, -1.1229782104492188, 2.603118896484375, 8.915641784667969, -6.253383636474609, 2.65447998046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000126.npy"} +{"epoch": 0.19047619047619047, "step": 127, "batch_size": 64, "mean": 3.310591697692871, "std": 4.475258827209473, "min": -7.964599609375, "p10": -1.773133087158203, "median": 2.853181838989258, "p90": 8.877926254272461, "max": 14.613250732421875, "pos_frac": 0.78125, "sample": [-1.3580551147460938, 14.371170043945312, 7.97735595703125, 3.6270675659179688, -1.5923385620117188, 8.90960693359375, 3.624603271484375, 8.17696762084961, 1.3265533447265625, 11.212577819824219, 7.437675476074219, 3.313720703125, 4.604087829589844, 8.543689727783203, 1.2180862426757812, 1.5043869018554688, 6.0976104736328125, 3.979717254638672, 0.7537918090820312, 1.3105049133300781, 6.9311370849609375, -7.964599609375, 4.2142791748046875, 7.038936614990234, 3.7580337524414062, -5.290321350097656, 3.5893936157226562, 1.6889533996582031, 2.5904388427734375, 0.893280029296875, 0.21018600463867188, 3.713916778564453, -0.3847389221191406, 9.306198120117188, -0.22437667846679688, 8.271318435668945, 1.6199684143066406, 8.804004669189453, 9.896564483642578, 14.613250732421875, -2.4141311645507812, 6.55426025390625, 2.641773223876953, -2.489349365234375, 2.4746856689453125, 2.8003387451171875, -1.850616455078125, -1.5802879333496094, 6.901420593261719, -4.1851043701171875, 0.4832916259765625, 7.952056884765625, 2.906024932861328, 1.3882369995117188, 1.2848243713378906, -1.3359870910644531, -1.8599319458007812, 1.8777694702148438, 3.7223281860351562, 3.4365673065185547, 4.262912750244141, 0.8246841430664062, 10.398468017578125, -0.6309700012207031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000127.npy"} +{"epoch": 0.19198790627362056, "step": 128, "batch_size": 64, "mean": 3.642793655395508, "std": 6.5718913078308105, "min": -13.148681640625, "p10": -3.8996469497680653, "median": 2.9713668823242188, "p90": 12.078968811035157, "max": 20.10137939453125, "pos_frac": 0.75, "sample": [3.30364990234375, 11.574111938476562, 2.99993896484375, 3.8567276000976562, 3.1962852478027344, 1.6142807006835938, 4.7558135986328125, 11.921966552734375, 1.4101333618164062, 16.5933837890625, 1.9811630249023438, -13.148681640625, 12.146255493164062, -1.3790321350097656, 3.6820106506347656, -7.221580505371094, 0.7723789215087891, -0.5255203247070312, -7.061119079589844, 12.963233947753906, 17.051361083984375, -5.208736419677734, -2.3707504272460938, 20.10137939453125, 19.872894287109375, 7.62152099609375, 0.9351043701171875, 11.217941284179688, -1.970346450805664, 6.864582061767578, 1.02362060546875, 4.915824890136719, 2.9427947998046875, 8.341079711914062, 7.8813018798828125, 6.810523986816406, -0.2200469970703125, 9.954872131347656, -6.494924545288086, 2.0990219116210938, -2.828937530517578, 2.665792465209961, 2.4767189025878906, 0.24691009521484375, -4.358522415161133, 2.4919357299804688, 2.0325489044189453, 3.581775665283203, 3.1338653564453125, -2.2170467376708984, 4.826072692871094, 3.6142578125, 8.92535400390625, -0.687286376953125, 5.319755554199219, 0.9890499114990234, 1.5553436279296875, 6.872650146484375, 16.084823608398438, -1.7002315521240234, -7.720489501953125, 1.592742919921875, 5.356758117675781, 6.080535888671875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000128.npy"} +{"epoch": 0.19349962207105065, "step": 129, "batch_size": 64, "mean": 2.1019034385681152, "std": 5.983180522918701, "min": -15.329315185546875, "p10": -4.6316287994384755, "median": 2.296438217163086, "p90": 8.633951377868653, "max": 19.406005859375, "pos_frac": 0.625, "sample": [-0.38253021240234375, -0.8385353088378906, 5.398584365844727, -5.308738708496094, -0.8045730590820312, 6.969993591308594, 0.4275665283203125, -2.1250476837158203, 2.3347930908203125, 10.003395080566406, 7.596061706542969, 2.438617706298828, 6.3174591064453125, -2.4288787841796875, -2.167236328125, -1.7820205688476562, 7.822319030761719, 0.6768646240234375, 9.801750183105469, 7.879112243652344, 2.8350372314453125, -12.741668701171875, 1.8226394653320312, 4.757080078125, -2.721576690673828, 19.406005859375, 4.721281051635742, -1.6147613525390625, 4.079263687133789, 4.0384979248046875, 6.201702117919922, -7.147003173828125, -5.6656036376953125, 8.474451065063477, 0.5212249755859375, 7.855857849121094, -7.734539031982422, -1.8107986450195312, -3.1777591705322266, 9.74907112121582, 4.022064208984375, -1.7012271881103516, -2.341217041015625, 1.3545665740966797, 5.207302093505859, 3.776508331298828, -1.7386703491210938, 16.230064392089844, 7.430320739746094, 7.926597595214844, 3.0566062927246094, 8.702308654785156, 9.143814086914062, -1.3834152221679688, -0.9977989196777344, -3.450450897216797, 3.462566375732422, -15.329315185546875, 5.21649169921875, 1.223653793334961, 2.2580833435058594, -5.137847900390625, 0.1342334747314453, 3.7792205810546875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000129.npy"} +{"epoch": 0.19501133786848074, "step": 130, "batch_size": 64, "mean": 3.3813681602478027, "std": 4.938716888427734, "min": -5.919456481933594, "p10": -4.009207534790039, "median": 3.283296585083008, "p90": 9.299900817871094, "max": 16.848953247070312, "pos_frac": 0.796875, "sample": [1.3386573791503906, 1.9742164611816406, 10.463302612304688, 8.887908935546875, 5.6429595947265625, 0.99554443359375, -2.847412109375, 8.002298355102539, 3.5576705932617188, 1.0507545471191406, -4.1998443603515625, 7.349418640136719, 8.466049194335938, 1.9577579498291016, -4.774192810058594, 7.039329528808594, 2.5479564666748047, -4.522819519042969, 1.6431198120117188, 11.903877258300781, 3.1306915283203125, 3.8392105102539062, 6.162895202636719, 7.880180358886719, -2.502147674560547, -3.5643882751464844, -4.3199920654296875, 0.6731796264648438, -2.701526641845703, 0.4017333984375, 9.195556640625, 9.344619750976562, 7.7098236083984375, 5.000158309936523, 1.54412841796875, 14.526302337646484, 8.40460205078125, 3.8496456146240234, 16.848953247070312, 2.567882537841797, -1.8072280883789062, 3.435901641845703, 0.594879150390625, -5.27203369140625, 2.2839832305908203, 4.014116287231445, 6.005439758300781, 1.2106857299804688, 4.762550354003906, -1.5525245666503906, -4.943342208862305, 1.8796234130859375, 4.163787841796875, 5.367265701293945, -5.919456481933594, 5.144615173339844, 5.2123565673828125, 2.3492164611816406, 3.1196136474609375, 10.986419677734375, 10.161140441894531, 4.146692276000977, 1.7037162780761719, 4.892082214355469], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000130.npy"} +{"epoch": 0.1965230536659108, "step": 131, "batch_size": 64, "mean": 4.340440273284912, "std": 6.544402122497559, "min": -8.536399841308594, "p10": -3.9932922363281245, "median": 3.1904220581054688, "p90": 13.868031311035157, "max": 18.446258544921875, "pos_frac": 0.75, "sample": [3.5115013122558594, 7.741365432739258, -0.4599895477294922, -1.6928138732910156, -1.8615570068359375, 18.446258544921875, 3.7630996704101562, 4.591180801391602, -1.963815689086914, 13.523490905761719, 3.3006362915039062, 1.7218036651611328, -4.2108306884765625, -4.514373779296875, 2.032207489013672, 6.050310134887695, -3.009674072265625, 3.2896499633789062, 9.565635681152344, -6.9144134521484375, -4.74163818359375, -3.4857025146484375, 17.30560302734375, 6.570213317871094, 1.751007080078125, 0.28955841064453125, 1.9149456024169922, -4.592491149902344, -1.5164604187011719, 0.74420166015625, 6.332328796386719, 13.981918334960938, 12.205856323242188, 6.415727615356445, 13.321548461914062, 17.511505126953125, 2.1546363830566406, 14.678741455078125, 4.827295303344727, 13.602294921875, 2.276611328125, 15.165206909179688, -1.8928775787353516, 7.373626708984375, 2.3143081665039062, 0.57476806640625, 0.6237297058105469, 5.771026611328125, -5.4091796875, 9.83428955078125, 0.4174613952636719, -0.0730743408203125, 8.532585144042969, 0.005100250244140625, -8.536399841308594, 11.908355712890625, 2.4144973754882812, 2.277376174926758, 12.5174560546875, 3.9159164428710938, 3.0911941528320312, 9.152164459228516, 14.160242080688477, 9.193012237548828], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000131.npy"} +{"epoch": 0.1980347694633409, "step": 132, "batch_size": 64, "mean": 3.581754446029663, "std": 5.409476280212402, "min": -13.627410888671875, "p10": -2.4071277618408202, "median": 4.213432312011719, "p90": 9.537245178222657, "max": 17.63719940185547, "pos_frac": 0.75, "sample": [9.573902130126953, 2.846639633178711, 6.272651672363281, 6.2513275146484375, -2.378040313720703, -1.8873844146728516, 7.810478210449219, 0.2325878143310547, -2.4195938110351562, 5.0704193115234375, 5.80194091796875, 8.95986557006836, 4.605052947998047, 4.21087646484375, -0.7182769775390625, 1.8738784790039062, -1.5078773498535156, 15.611038208007812, 5.5677490234375, -0.2962837219238281, -2.3096656799316406, -13.627410888671875, 8.40133285522461, -1.6202621459960938, -3.182056427001953, -7.292938232421875, 5.770454406738281, 9.895221710205078, 10.154539108276367, -1.7159614562988281, 5.871124267578125, 1.0693321228027344, -11.10627555847168, 4.872833251953125, 2.4850234985351562, 4.0098114013671875, 17.63719940185547, 6.699735641479492, 9.52734375, 5.182395935058594, -0.04607391357421875, 9.906234741210938, 3.7573699951171875, 9.163810729980469, 8.046897888183594, 4.2159881591796875, 4.133628845214844, 2.5904769897460938, 2.3942794799804688, 4.453699111938477, 5.500907897949219, 2.8756790161132812, 4.06292724609375, 5.739589691162109, 8.965761184692383, 5.6016082763671875, 9.541488647460938, -2.756490707397461, 1.8604278564453125, 2.86676025390625, -4.777618408203125, 5.09844970703125, 4.1695098876953125, 5.66424560546875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000132.npy"} +{"epoch": 0.19954648526077098, "step": 133, "batch_size": 64, "mean": 2.8249802589416504, "std": 5.932344436645508, "min": -15.741455078125, "p10": -3.5340324401855465, "median": 2.2508487701416016, "p90": 10.795059776306154, "max": 16.73937225341797, "pos_frac": 0.6875, "sample": [5.155601501464844, -5.657051086425781, 3.7994461059570312, 10.960861206054688, 0.1694355010986328, -1.3995513916015625, 4.032100677490234, 11.880134582519531, 0.7199554443359375, 1.9277381896972656, 2.5648536682128906, 14.773757934570312, 8.347829818725586, 0.6795158386230469, -6.189624786376953, 2.4953231811523438, 2.8587112426757812, -15.741455078125, 7.863452911376953, 1.6754913330078125, -0.4350318908691406, 6.7791290283203125, -1.2695732116699219, 7.444362640380859, 4.642740249633789, -0.579437255859375, 7.5711822509765625, -0.477386474609375, 3.8985061645507812, -0.9133033752441406, 2.470470428466797, 1.1142711639404297, -9.367080688476562, 10.40818977355957, -3.73126220703125, 2.0312271118164062, -1.0610160827636719, -3.0738296508789062, 8.974164962768555, 9.63250732421875, -1.7347412109375, 1.9841079711914062, 5.272560119628906, -6.987058639526367, 3.6928939819335938, 14.974746704101562, 6.538566589355469, 8.363876342773438, 1.2429962158203125, 16.73937225341797, 1.1151351928710938, -0.46900177001953125, -2.20068359375, 12.781967163085938, 6.845794677734375, 0.23825836181640625, 4.724334716796875, 11.333368301391602, 4.7244415283203125, -1.2800865173339844, 2.741302490234375, -2.105712890625, -4.463001251220703, 1.74993896484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000133.npy"} +{"epoch": 0.20105820105820105, "step": 134, "batch_size": 64, "mean": 4.924589157104492, "std": 6.39080810546875, "min": -12.178329467773438, "p10": -1.4896015167236325, "median": 4.050475120544434, "p90": 13.661423873901368, "max": 21.97967529296875, "pos_frac": 0.8125, "sample": [-1.2849960327148438, 0.8311920166015625, 3.7790489196777344, 4.09417724609375, 4.587436676025391, 3.8829193115234375, 3.46453857421875, 5.897369384765625, 13.74472427368164, 13.195526123046875, 4.636741638183594, 9.79913330078125, 5.4752044677734375, 3.3328208923339844, 4.006772994995117, -0.2699737548828125, 10.12173843383789, 7.744678497314453, -3.729412078857422, 7.0156707763671875, 7.937763214111328, 5.482677459716797, 9.287078857421875, -0.20698165893554688, 4.776496887207031, 8.727409362792969, 0.40887451171875, 1.7744903564453125, -1.5772895812988281, 7.133241653442383, -3.516254425048828, -0.44425392150878906, 13.467056274414062, 0.464263916015625, 0.5850391387939453, -7.09498405456543, 4.540134429931641, 2.803743362426758, 1.7755584716796875, 4.718347549438477, 21.780364990234375, 9.902383804321289, -12.178329467773438, 2.4635162353515625, 6.343486785888672, 1.761871337890625, 14.37847900390625, -4.31109619140625, 17.099945068359375, 2.969684600830078, 2.205821990966797, 6.760066986083984, 5.7637939453125, 7.9956817626953125, 18.903823852539062, 1.5019607543945312, -3.5512466430664062, 2.8068923950195312, 3.724559783935547, 10.203197479248047, 14.949783325195312, 21.97967529296875, 1.494649887084961, -1.1429634094238281], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000134.npy"} +{"epoch": 0.20256991685563114, "step": 135, "batch_size": 64, "mean": 3.140267848968506, "std": 5.896223545074463, "min": -12.91290283203125, "p10": -2.823689842224121, "median": 2.685211181640625, "p90": 10.049261474609377, "max": 19.92181396484375, "pos_frac": 0.734375, "sample": [5.027996063232422, -2.054180145263672, 7.276939392089844, 2.2974376678466797, 2.328197479248047, -2.5369129180908203, -0.5112991333007812, -4.492713928222656, -0.5259246826171875, 11.777542114257812, 7.001312255859375, -2.94659423828125, 6.131492614746094, -0.9595508575439453, 1.7126235961914062, -6.400859832763672, 11.645706176757812, 4.209831237792969, -0.7917270660400391, 2.6724624633789062, 2.470743179321289, 2.5808868408203125, -12.215763092041016, 2.0456771850585938, 3.9912261962890625, 8.30636978149414, 2.460693359375, 4.465171813964844, 1.2443161010742188, 4.331443786621094, 4.051700592041016, 0.4536590576171875, 10.245285034179688, 2.3112239837646484, 5.3300933837890625, 1.4624824523925781, 2.6979598999023438, 3.5163497924804688, 7.360481262207031, -5.904327392578125, 0.08779525756835938, 19.92181396484375, 0.5107479095458984, 4.37939453125, 3.304841995239258, 2.7116012573242188, -0.1793670654296875, -5.827096939086914, 8.128093719482422, 8.63800048828125, 5.900257110595703, -12.91290283203125, 0.6865768432617188, 7.4573822021484375, 13.460426330566406, 15.20916748046875, -2.425546646118164, 6.22490119934082, -2.249643325805664, 7.825801849365234, 3.763214111328125, 9.591873168945312, 15.341724395751953, -0.6393585205078125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000135.npy"} +{"epoch": 0.20408163265306123, "step": 136, "batch_size": 64, "mean": 4.088949680328369, "std": 8.109720230102539, "min": -13.682098388671875, "p10": -4.8425964355468745, "median": 3.408832550048828, "p90": 15.948214340209962, "max": 23.810760498046875, "pos_frac": 0.6875, "sample": [16.038223266601562, 11.247360229492188, -10.34266471862793, -1.4080657958984375, -5.0927276611328125, 9.785438537597656, -3.6399383544921875, 0.7274932861328125, -6.885406494140625, 7.662195205688477, 3.2347946166992188, -13.682098388671875, -0.8711090087890625, 5.480871200561523, -2.267333984375, 8.171676635742188, 16.461332321166992, 3.692596435546875, 1.759054183959961, -4.2589569091796875, 10.078018188476562, 4.974437713623047, 10.693939208984375, 19.49279022216797, -1.9044342041015625, -0.043323516845703125, 15.639244079589844, 3.796977996826172, 1.8226165771484375, 23.810760498046875, 10.144393920898438, -0.8532066345214844, 16.28887939453125, 13.578933715820312, 3.5828704833984375, 2.888885498046875, -1.2293319702148438, 4.750026702880859, 6.736213684082031, 0.8431930541992188, -12.379678726196289, 4.6173858642578125, 1.7921600341796875, 11.107894897460938, 5.277202606201172, 7.877826690673828, -3.2943038940429688, 6.015739440917969, -3.8271942138671875, 18.121734619140625, 2.5538330078125, -7.955162048339844, -0.8256683349609375, 9.628158569335938, 2.4615211486816406, 16.2608642578125, -2.48138427734375, 0.33295440673828125, 12.735406875610352, 15.73819351196289, 7.41400146484375, 0.2598876953125, 1.6705589294433594, -12.313777923583984], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000136.npy"} +{"epoch": 0.20559334845049132, "step": 137, "batch_size": 64, "mean": 4.152113914489746, "std": 6.502209663391113, "min": -10.745208740234375, "p10": -2.2950956344604494, "median": 2.3371315002441406, "p90": 11.868867111206058, "max": 24.122406005859375, "pos_frac": 0.71875, "sample": [-1.8032684326171875, -10.745208740234375, 6.580005645751953, 10.990928649902344, 6.5971527099609375, 11.135856628417969, 12.524364471435547, 7.0765380859375, 0.15092849731445312, 24.122406005859375, 9.79208755493164, 2.2848129272460938, 12.092769622802734, 2.579132080078125, 11.346427917480469, -0.36902618408203125, 2.3894500732421875, 12.229965209960938, -1.4604949951171875, 1.8644752502441406, -0.7171401977539062, 6.04437255859375, 9.265411376953125, -6.271137237548828, 1.724527359008789, 0.1241455078125, 7.238414764404297, 21.74486541748047, -1.3149547576904297, 1.38641357421875, -1.4503326416015625, -2.3052139282226562, -1.13275146484375, 5.1274566650390625, 14.720573425292969, 1.6066017150878906, 0.17325782775878906, -3.84124755859375, 6.109138488769531, -2.271486282348633, 2.1207618713378906, 2.6013946533203125, 5.773967742919922, 12.420867919921875, 6.080501556396484, -3.7001171112060547, 1.843465805053711, 9.466653823852539, 9.441619873046875, 10.973114013671875, 2.1081161499023438, -4.681915283203125, -0.28681182861328125, -7.4829254150390625, 10.200061798095703, 3.7391128540039062, 1.3223648071289062, -2.049774169921875, -0.19762420654296875, 7.502586364746094, 2.2607879638671875, 10.73788833618164, 1.01873779296875, 9.1822509765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000137.npy"} +{"epoch": 0.20710506424792138, "step": 138, "batch_size": 64, "mean": 3.639800548553467, "std": 7.285195827484131, "min": -16.404647827148438, "p10": -3.298606491088867, "median": 4.225013732910156, "p90": 11.288243484497073, "max": 22.896011352539062, "pos_frac": 0.734375, "sample": [0.5650177001953125, 8.249008178710938, 4.349403381347656, 8.726600646972656, 5.85052490234375, 3.516752243041992, 0.05036163330078125, 4.100624084472656, -8.475143432617188, 4.871295928955078, 3.8351879119873047, -16.404647827148438, 13.15887451171875, -0.14165496826171875, 22.896011352539062, -7.9368133544921875, -2.6219406127929688, 8.418214797973633, 10.15374755859375, 4.918132781982422, 6.989295959472656, 1.8563308715820312, 19.42626953125, 9.562650680541992, 2.6127548217773438, 7.633762359619141, 10.560718536376953, 6.9296417236328125, 1.3035202026367188, 1.4050254821777344, 7.828573226928711, -0.35714149475097656, 11.524036407470703, -1.7861862182617188, -3.679208755493164, -2.9028244018554688, 0.12790870666503906, -13.42120361328125, -0.7816390991210938, 7.114265441894531, 6.3109283447265625, 10.738059997558594, 0.7252845764160156, 5.192131042480469, -2.2274551391601562, -15.534828186035156, 16.510562896728516, 3.951345443725586, 5.341400146484375, 0.4267120361328125, 5.09649658203125, 7.043556213378906, 9.614959716796875, -2.4351272583007812, 0.3750762939453125, -1.1026859283447266, -3.4682273864746094, 5.934629440307617, -1.6243343353271484, 7.454414367675781, 16.930999755859375, 4.625209808349609, 11.672630310058594, 1.369384765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000138.npy"} +{"epoch": 0.20861678004535147, "step": 139, "batch_size": 64, "mean": 4.247355937957764, "std": 6.389797210693359, "min": -14.903533935546875, "p10": -2.870815658569336, "median": 3.9879283905029297, "p90": 11.91675853729248, "max": 20.921661376953125, "pos_frac": 0.734375, "sample": [3.315309524536133, 11.801782608032227, 4.728446960449219, 3.4094696044921875, -7.369148254394531, 8.69649887084961, 8.869949340820312, 12.078056335449219, 6.695140838623047, -1.443746566772461, -1.5344429016113281, 17.016897201538086, 9.40379524230957, -2.716075897216797, 4.4190673828125, 11.966033935546875, 18.946853637695312, 3.6635913848876953, 1.6922225952148438, 11.74465560913086, -3.0040740966796875, -14.903533935546875, -2.8967056274414062, 3.0874481201171875, 8.35186767578125, 3.6058807373046875, 7.5146026611328125, 5.736543655395508, 6.2509307861328125, -0.9591064453125, 5.9585418701171875, 8.029739379882812, 3.641265869140625, 0.50341796875, -0.3391838073730469, 8.076812744140625, 6.940574645996094, 1.8998527526855469, 7.5985107421875, 1.8475456237792969, 9.845539093017578, -1.6169624328613281, 12.075122833251953, -0.7945461273193359, -2.810405731201172, -5.998638153076172, 5.0343780517578125, 5.081756591796875, 20.921661376953125, 4.018955230712891, 9.2156982421875, 3.9569015502929688, 1.8488693237304688, -7.49200439453125, -1.9945526123046875, 6.925327301025391, 0.4923248291015625, 2.6613082885742188, -4.085216522216797, 8.082733154296875, 5.995452880859375, 14.746177673339844, 3.9212474822998047, -0.525634765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000139.npy"} +{"epoch": 0.21012849584278157, "step": 140, "batch_size": 64, "mean": 5.89973258972168, "std": 9.23098373413086, "min": -23.127456665039062, "p10": -5.996425247192382, "median": 5.934577941894531, "p90": 17.967898178100587, "max": 21.50994873046875, "pos_frac": 0.71875, "sample": [19.513671875, 11.570068359375, 0.003841400146484375, -1.2236175537109375, -0.28878021240234375, 11.276649475097656, -8.704917907714844, -8.449882507324219, 9.928962707519531, 13.439857482910156, -23.127456665039062, 9.468109130859375, 4.86151123046875, 5.210968017578125, 17.67931365966797, 7.262413024902344, -6.572643280029297, 1.9073333740234375, 0.6533966064453125, 15.166847229003906, 4.186635971069336, 20.156951904296875, 12.5396728515625, 8.756309509277344, 1.0525856018066406, 9.0997314453125, 3.428892135620117, 19.202383041381836, 2.6133193969726562, -6.722015380859375, -4.5429229736328125, -4.2555694580078125, 11.449792861938477, -4.65191650390625, -3.5720443725585938, 6.3102569580078125, 13.047525405883789, 18.087554931640625, 16.287750244140625, 21.50994873046875, 7.774986267089844, 17.453170776367188, 17.730178833007812, 17.90634536743164, 5.55889892578125, -7.483478546142578, 17.994277954101562, -0.17335891723632812, 20.681549072265625, -3.248922348022461, -8.265949249267578, 10.747392654418945, 3.959606170654297, 8.219383239746094, 9.815711975097656, 2.0861892700195312, 9.728816986083984, -3.1368179321289062, 6.517509460449219, 4.612174987792969, -0.2245330810546875, 15.22623062133789, -3.7745532989501953, 4.3175811767578125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000140.npy"} +{"epoch": 0.21164021164021163, "step": 141, "batch_size": 64, "mean": 5.329594135284424, "std": 8.927911758422852, "min": -13.99212646484375, "p10": -6.524429321289061, "median": 4.725830078125, "p90": 16.109927368164065, "max": 28.84552001953125, "pos_frac": 0.75, "sample": [-13.99212646484375, 0.5323829650878906, 16.331146240234375, 4.017383575439453, 8.768272399902344, -0.6863784790039062, 3.3402786254882812, 13.392829895019531, 3.236673355102539, -8.586246490478516, 5.9589691162109375, 0.81817626953125, 8.687456130981445, -7.3187408447265625, 10.376384735107422, 6.484409332275391, 6.847900390625, 1.2444419860839844, -1.3289299011230469, -13.739959716796875, 2.7692184448242188, 0.8005809783935547, 0.8884124755859375, 7.0702362060546875, 7.228645324707031, 3.634765625, 2.6199951171875, 8.220352172851562, -2.0048065185546875, -8.40545654296875, -1.4224624633789062, -7.762428283691406, 9.492938995361328, 10.21734619140625, 11.366905212402344, -2.402647018432617, 11.089855194091797, 4.770965576171875, 23.372173309326172, 19.814834594726562, 15.59375, 12.23653793334961, 12.54986572265625, 9.601104736328125, 22.063400268554688, 1.4364166259765625, -0.6886978149414062, 4.680694580078125, 18.07537841796875, 14.541816711425781, -9.904701232910156, 2.4207763671875, 5.961383819580078, 24.332916259765625, 9.534759521484375, 28.84552001953125, -4.107782363891602, 13.905912399291992, 1.4576492309570312, 8.228752136230469, 10.394439697265625, 3.1074275970458984, -4.6710357666015625, -4.246006011962891], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000141.npy"} +{"epoch": 0.21315192743764172, "step": 142, "batch_size": 64, "mean": 4.359848976135254, "std": 6.831005573272705, "min": -13.657463073730469, "p10": -2.7961450576782227, "median": 3.4303970336914062, "p90": 13.292652511596682, "max": 22.934921264648438, "pos_frac": 0.75, "sample": [5.31109619140625, -11.068992614746094, 2.359975814819336, 10.893417358398438, 12.544490814208984, 18.991943359375, 11.123519897460938, -1.8867530822753906, 2.116924285888672, 6.3756866455078125, 1.6475372314453125, -1.1079521179199219, 6.760471343994141, -13.657463073730469, -0.01634979248046875, 9.062339782714844, 6.301265716552734, -6.635324478149414, 1.9818859100341797, 3.5080108642578125, 2.82354736328125, 9.916748046875, 6.859947204589844, 3.9401588439941406, 3.4189300537109375, 14.297348022460938, -0.7246856689453125, -1.939117431640625, 11.559844970703125, -2.3646507263183594, 2.4694747924804688, 1.842681884765625, 15.249420166015625, 22.934921264648438, 1.7761154174804688, -2.8225326538085938, 2.6647186279296875, -6.773187637329102, 0.4178009033203125, 4.676990509033203, 16.185813903808594, 12.839523315429688, 3.441864013671875, 1.3579177856445312, -0.7217254638671875, 11.93994140625, -2.790111541748047, 3.6374969482421875, 0.293182373046875, 10.310874938964844, 3.2713241577148438, -2.7987308502197266, 1.334808349609375, 14.218826293945312, 4.692241668701172, 5.379081726074219, 13.48685073852539, 10.44993782043457, 6.465057373046875, -0.05629730224609375, 0.7343673706054688, -3.1666259765625, 9.569503784179688, 4.124992370605469], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000142.npy"} +{"epoch": 0.2146636432350718, "step": 143, "batch_size": 64, "mean": 3.733635902404785, "std": 9.325443267822266, "min": -27.381072998046875, "p10": -5.414996337890624, "median": 3.799072265625, "p90": 13.873058700561526, "max": 21.443359375, "pos_frac": 0.703125, "sample": [3.8203353881835938, 9.50469970703125, 13.387992858886719, 10.346145629882812, 4.584465026855469, -1.7886734008789062, 2.8602066040039062, -0.8681240081787109, 18.7717342376709, -10.033370971679688, 12.25651741027832, -2.2645263671875, 21.443359375, 3.7778091430664062, 7.660011291503906, 6.538579940795898, -14.355998992919922, 0.760589599609375, 19.806900024414062, 1.1789913177490234, -3.32171630859375, -0.4600105285644531, 20.488922119140625, 13.18597412109375, 9.861974716186523, 3.2548141479492188, 5.1123504638671875, -14.974822998046875, 2.194742202758789, -4.358409881591797, -0.5327606201171875, 4.191776275634766, -12.73504638671875, 7.4377593994140625, 16.619842529296875, -2.6617813110351562, -4.537528991699219, 0.6826324462890625, 1.0348358154296875, 7.442497253417969, 3.0097312927246094, -27.381072998046875, 12.557361602783203, 2.8941421508789062, -2.093576431274414, 10.696884155273438, 13.181175231933594, 10.376235961914062, 0.1060333251953125, -2.311004638671875, -5.791053771972656, 5.113058090209961, 14.080944061279297, 6.944770812988281, -18.585296630859375, 16.423006057739258, 10.835227966308594, 4.863128662109375, 11.587810516357422, 10.155757904052734, 2.506013870239258, -2.2476730346679688, 4.351551055908203, 2.3658447265625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000143.npy"} +{"epoch": 0.2161753590325019, "step": 144, "batch_size": 64, "mean": 4.888025283813477, "std": 9.202474594116211, "min": -20.399459838867188, "p10": -5.650445175170899, "median": 3.391209602355957, "p90": 17.26864070892334, "max": 26.92218017578125, "pos_frac": 0.65625, "sample": [17.3518009185791, 6.852165222167969, -6.794776916503906, 1.2395858764648438, -2.257892608642578, 3.666749954223633, 0.5464649200439453, 12.247169494628906, 1.1618003845214844, -0.20598411560058594, -5.650489807128906, 8.11575698852539, -0.4466590881347656, 3.892528533935547, 8.547500610351562, 3.0842361450195312, 17.074600219726562, -0.1258087158203125, -4.84466552734375, 10.409820556640625, 12.563812255859375, 4.9141693115234375, -0.910369873046875, -3.0890121459960938, -2.3705787658691406, 2.478271484375, 6.291664123535156, 14.874271392822266, -0.5508022308349609, -1.4273681640625, 10.120941162109375, 3.1156692504882812, -5.650341033935547, -3.193756103515625, 14.079071044921875, -1.1905670166015625, -1.177511215209961, 19.927465438842773, 26.212570190429688, 19.214523315429688, 10.95135498046875, 7.238975524902344, -8.700775146484375, 15.902633666992188, -8.25345230102539, 7.322509765625, 4.7899169921875, -6.275140762329102, 12.930221557617188, 2.581634521484375, 0.7859420776367188, -5.3624420166015625, 4.549263000488281, 20.625328063964844, -6.9097137451171875, 16.778879165649414, 21.45294952392578, 26.92218017578125, 0.323394775390625, -20.399459838867188, 5.620018005371094, 2.6664867401123047, 9.358793258666992, 9.838111877441406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000144.npy"} +{"epoch": 0.21768707482993196, "step": 145, "batch_size": 64, "mean": 5.158614635467529, "std": 9.74278736114502, "min": -24.193580627441406, "p10": -4.745299911499023, "median": 5.269868850708008, "p90": 17.91614208221436, "max": 27.910594940185547, "pos_frac": 0.734375, "sample": [6.730499267578125, 7.796985626220703, -3.8543167114257812, 5.922821044921875, 0.2215423583984375, -24.193580627441406, 11.294052124023438, -2.0756683349609375, 27.910594940185547, 2.2066802978515625, 8.02225112915039, 8.781402587890625, 3.369993209838867, 9.157310485839844, 3.4073257446289062, 9.092391967773438, -0.5615119934082031, 19.717323303222656, -6.91448974609375, 7.922554016113281, 3.0979537963867188, 2.093463897705078, -4.475208282470703, 6.033538818359375, 19.09975814819336, -1.9200057983398438, 2.93658447265625, 8.22528076171875, 6.9793853759765625, -0.7696189880371094, 20.854549407958984, 14.399444580078125, 5.1371612548828125, 23.63739776611328, -4.861053466796875, 18.35154914855957, 3.467142105102539, 10.429601669311523, 9.052757263183594, 13.704429626464844, -16.812103271484375, 7.667949676513672, 16.232681274414062, 5.669242858886719, 0.655914306640625, -1.233062744140625, 2.7494945526123047, 5.402576446533203, -3.3093643188476562, 9.287773132324219, 13.788070678710938, 10.628374099731445, 13.225208282470703, -1.9812202453613281, 1.3890457153320312, 27.088531494140625, 4.246307373046875, -5.765937805175781, -18.258468627929688, 4.055671691894531, 16.900192260742188, -7.531982421875, -3.6583251953125, 0.28650665283203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000145.npy"} +{"epoch": 0.21919879062736206, "step": 146, "batch_size": 64, "mean": 5.167600154876709, "std": 8.647029876708984, "min": -12.789894104003906, "p10": -6.85557861328125, "median": 4.738319396972656, "p90": 17.666928100585938, "max": 26.2296142578125, "pos_frac": 0.75, "sample": [14.311759948730469, 9.248115539550781, -6.8646697998046875, 5.720954895019531, 2.6392440795898438, -7.465705871582031, -2.8789215087890625, 8.438270568847656, 5.951526641845703, 5.1971588134765625, -9.893951416015625, -6.8343658447265625, 13.602981567382812, 7.200714111328125, 2.6045913696289062, -6.264701843261719, 10.488466262817383, -1.8375701904296875, 14.55807876586914, -12.789894104003906, 7.1657867431640625, 17.09058380126953, 1.68341064453125, -1.0566272735595703, -9.628374099731445, 0.71258544921875, 4.065645217895508, 10.988235473632812, -8.47243881225586, 2.2113723754882812, 7.496698379516602, -8.800125122070312, 21.361663818359375, 6.260009765625, 10.175537109375, -1.0256881713867188, 4.27947998046875, 0.8377151489257812, 5.55291748046875, 0.05257225036621094, 17.91393280029297, 6.953800201416016, 3.544454574584961, 12.597015380859375, 12.276443481445312, 21.220184326171875, 13.979513168334961, 7.174568176269531, 15.692375183105469, 3.792783737182617, 6.916196823120117, 1.203460693359375, 18.048006057739258, 2.4664764404296875, -5.250057220458984, -3.4478836059570312, 26.2296142578125, -3.6792144775390625, 3.473814010620117, 3.9821720123291016, 17.926124572753906, 8.927555084228516, 4.0291595458984375, 18.67285919189453], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000146.npy"} +{"epoch": 0.22071050642479215, "step": 147, "batch_size": 64, "mean": 4.200003147125244, "std": 9.054747581481934, "min": -23.88592529296875, "p10": -4.460276031494141, "median": 4.068685531616211, "p90": 15.863547325134284, "max": 23.973655700683594, "pos_frac": 0.625, "sample": [4.634868621826172, 8.058626174926758, 12.785430908203125, -4.3791046142578125, 2.0089263916015625, 8.235450744628906, -10.948951721191406, 4.1582489013671875, -1.7093658447265625, -4.005266189575195, 8.55792236328125, 7.393222808837891, 12.027557373046875, 8.952301025390625, -2.47857666015625, 8.599678039550781, 20.51677703857422, -23.88592529296875, 9.679426193237305, -1.8145771026611328, 6.71449089050293, 3.3531265258789062, -0.34438133239746094, 2.3809356689453125, -0.413909912109375, 16.552547454833984, -4.495063781738281, 9.355192184448242, 4.1026153564453125, 4.034755706787109, -1.3227787017822266, 5.490531921386719, 7.43621826171875, -9.267757415771484, -0.5916595458984375, 9.461082458496094, 14.255880355834961, 23.973655700683594, 21.107025146484375, 0.9739704132080078, 6.425628662109375, 2.7430038452148438, -2.093597412109375, 12.492164611816406, 13.187843322753906, -5.577667236328125, 23.664337158203125, -3.114421844482422, 13.254653930664062, -1.1604576110839844, -0.9840049743652344, 5.457618713378906, 10.41925048828125, -0.1565532684326172, -3.3473663330078125, 0.6794967651367188, 2.7059497833251953, -0.7654533386230469, 17.178054809570312, -14.8994140625, -12.344697952270508, 7.5411376953125, 18.630125045776367, -0.27857398986816406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000147.npy"} +{"epoch": 0.2222222222222222, "step": 148, "batch_size": 64, "mean": 5.475609302520752, "std": 8.673022270202637, "min": -17.237586975097656, "p10": -7.176670074462889, "median": 5.912450790405273, "p90": 16.103711700439455, "max": 22.982681274414062, "pos_frac": 0.734375, "sample": [21.892791748046875, -9.256465911865234, 5.287654876708984, -8.529668807983398, 15.905960083007812, 18.899032592773438, 9.70248794555664, -10.170783996582031, 16.939453125, 15.926025390625, -2.1738109588623047, 11.05295181274414, 3.424346923828125, 4.505809783935547, 9.798847198486328, -5.835304260253906, -2.7115554809570312, 14.758010864257812, 12.353950500488281, -3.2597389221191406, 10.107440948486328, -7.844078063964844, 13.559616088867188, 2.4749832153320312, 11.190340042114258, 19.878829956054688, 11.726585388183594, -0.9629135131835938, 21.047027587890625, 1.927001953125, 6.5372467041015625, -1.5250625610351562, 11.085664749145508, -7.7515411376953125, 6.9921875, 14.698043823242188, 1.6190528869628906, 13.524131774902344, -17.237586975097656, 0.9803791046142578, 7.621513366699219, 1.2131080627441406, 9.666175842285156, 22.982681274414062, -11.083654403686523, 8.205087661743164, 6.624031066894531, 4.821882247924805, 16.17986297607422, -0.21541595458984375, 10.268783569335938, 3.3231048583984375, 4.2379608154296875, 1.5831375122070312, 0.5492897033691406, 6.821617126464844, 8.03131103515625, 7.750518798828125, 7.976036071777344, -0.8766555786132812, 2.54815673828125, 4.619598388671875, -2.00860595703125, -0.9378585815429688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000148.npy"} +{"epoch": 0.2237339380196523, "step": 149, "batch_size": 64, "mean": 5.927312850952148, "std": 7.747051239013672, "min": -11.49359130859375, "p10": -2.9661993026733393, "median": 5.835484504699707, "p90": 16.276720809936524, "max": 24.37206268310547, "pos_frac": 0.78125, "sample": [11.168563842773438, 17.042007446289062, 12.411643981933594, -2.56927490234375, 1.802581787109375, 3.7878570556640625, -3.0921363830566406, 12.171747207641602, -1.8538589477539062, 14.389665603637695, -11.49359130859375, 4.088314056396484, 2.0439300537109375, 3.8666305541992188, 7.344398498535156, 0.21416854858398438, 3.794513702392578, 2.949493408203125, 1.7169227600097656, 10.724960327148438, 2.293109893798828, 10.915306091308594, 18.002092361450195, -3.5258140563964844, 24.37206268310547, 5.82066535949707, 4.555366516113281, -2.6723461151123047, 8.146963119506836, -10.828155517578125, -2.5395050048828125, 16.165313720703125, -9.521751403808594, 20.17007827758789, 4.925092697143555, 17.443010330200195, 10.925893783569336, -6.794090270996094, 11.64239501953125, -4.210878372192383, 2.537384033203125, 8.529510498046875, 1.3744068145751953, 15.942825317382812, 9.862316131591797, 14.144006729125977, 5.850303649902344, 7.173957824707031, 4.740007400512695, 6.114143371582031, 9.260513305664062, 6.0192718505859375, -1.379486083984375, -0.746185302734375, 0.6052188873291016, 9.972900390625, 6.3770599365234375, 21.664810180664062, 12.762866973876953, 5.895450592041016, 6.567577362060547, 16.324466705322266, -1.5220603942871094, 5.4834136962890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000149.npy"} +{"epoch": 0.2252456538170824, "step": 150, "batch_size": 64, "mean": 7.828769683837891, "std": 9.580052375793457, "min": -11.87026596069336, "p10": -2.621022033691405, "median": 6.302532196044922, "p90": 22.16426391601563, "max": 30.203994750976562, "pos_frac": 0.796875, "sample": [7.973262786865234, 3.8407325744628906, 23.681396484375, 6.752525329589844, -10.380455017089844, -2.99505615234375, 6.014886856079102, 7.224021911621094, 0.9484100341796875, 8.777853012084961, 2.438060760498047, 12.830825805664062, -1.356475830078125, 5.724822998046875, 0.47211456298828125, 5.1181488037109375, 4.873138427734375, 29.93267822265625, -0.753204345703125, 5.8438262939453125, 9.181831359863281, 1.8037796020507812, 24.49908447265625, -9.038040161132812, 1.4617156982421875, 11.165666580200195, 4.529458999633789, 7.916034698486328, 5.734142303466797, 20.472442626953125, 9.707992553710938, 15.092559814453125, 19.771255493164062, 6.521690368652344, 24.337051391601562, -5.4143524169921875, 1.6072406768798828, 9.23532485961914, 16.256820678710938, 23.655609130859375, 10.241500854492188, 18.04822540283203, -1.3940811157226562, 10.720245361328125, 20.509368896484375, 1.8304290771484375, 14.647346496582031, 16.754432678222656, -11.87026596069336, 30.203994750976562, 4.7057952880859375, -0.3608551025390625, 7.023460388183594, -5.4105987548828125, 3.1718997955322266, 22.873504638671875, -7.6663818359375, -1.7482757568359375, 14.916210174560547, -1.2218856811523438, 5.350067138671875, 17.234642028808594, 6.0833740234375, 10.9403076171875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000150.npy"} +{"epoch": 0.22675736961451248, "step": 151, "batch_size": 64, "mean": 8.934582710266113, "std": 9.709501266479492, "min": -8.787712097167969, "p10": -2.537439918518066, "median": 8.849422454833984, "p90": 18.466282653808594, "max": 39.761016845703125, "pos_frac": 0.765625, "sample": [7.837898254394531, 14.82607650756836, 15.762786865234375, -3.6844520568847656, 2.907224655151367, 3.670076370239258, 39.761016845703125, 0.7808494567871094, 17.895599365234375, -0.49980926513671875, 10.424774169921875, 14.369857788085938, 8.623550415039062, -2.2249908447265625, 9.999614715576172, 12.58425521850586, 15.795312881469727, -1.7580204010009766, 7.24688720703125, -1.4038333892822266, -4.0778045654296875, -2.671346664428711, 13.150138854980469, -3.363849639892578, 31.853439331054688, -8.787712097167969, 12.690670013427734, 9.958576202392578, -1.8688335418701172, -1.2983245849609375, 6.149084091186523, -2.9472274780273438, 14.018905639648438, 14.360519409179688, 4.1886749267578125, -1.8446273803710938, 12.022666931152344, 8.838645935058594, 7.710479736328125, 31.640594482421875, 0.5446109771728516, 10.523258209228516, 16.952945709228516, 6.127595901489258, 24.27812957763672, 20.367385864257812, 18.710861206054688, 17.14605712890625, 17.16461944580078, 8.860198974609375, 8.792182922363281, 15.533538818359375, 3.0849266052246094, 19.866043090820312, -7.715663909912109, 13.80657958984375, 12.436391830444336, 6.697078704833984, -2.1084251403808594, 0.074951171875, 12.149932861328125, 17.552833557128906, 0.8424510955810547, 17.487449645996094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000151.npy"} +{"epoch": 0.22826908541194255, "step": 152, "batch_size": 64, "mean": 5.723062992095947, "std": 10.284503936767578, "min": -16.459548950195312, "p10": -6.628373718261718, "median": 4.313596725463867, "p90": 19.595293235778808, "max": 26.755348205566406, "pos_frac": 0.734375, "sample": [-0.9221420288085938, 2.4636154174804688, 16.057668685913086, 2.8753509521484375, -16.459548950195312, 4.209892272949219, 12.456504821777344, 8.231048583984375, 6.447116851806641, -8.13873291015625, 5.912982940673828, -8.500411987304688, 10.761356353759766, -2.7416458129882812, 19.421974182128906, 16.98767852783203, 2.4763240814208984, 8.23129653930664, 0.8989772796630859, -4.514293670654297, -15.67919921875, 21.65280532836914, 10.461006164550781, 9.045402526855469, -5.122890472412109, 1.3955421447753906, 14.981712341308594, 4.417301177978516, 1.8925037384033203, 10.639663696289062, 2.8597774505615234, 19.669572830200195, 1.7794036865234375, 2.4429702758789062, -2.3503341674804688, -4.101165771484375, 1.8067054748535156, -4.7475433349609375, 16.50054168701172, 1.4844818115234375, -6.7222747802734375, 20.058076858520508, 12.006904602050781, -6.409271240234375, 7.619655609130859, 26.755348205566406, 14.457221984863281, 0.5459709167480469, 2.135162353515625, 8.464065551757812, -14.552337646484375, 14.421310424804688, 0.5338420867919922, 25.38280487060547, 15.70710563659668, 7.118812561035156, 23.617507934570312, 18.440048217773438, -3.379119873046875, 22.57642364501953, -1.1199417114257812, -11.524154663085938, 7.913978576660156, 17.045635223388672], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000152.npy"} +{"epoch": 0.22978080120937264, "step": 153, "batch_size": 64, "mean": 6.667169570922852, "std": 8.718976020812988, "min": -13.070222854614258, "p10": -4.8811595916748045, "median": 6.040218353271484, "p90": 19.098385238647463, "max": 22.98614501953125, "pos_frac": 0.765625, "sample": [10.962438583374023, 3.9181442260742188, 6.817008972167969, 14.8291015625, 16.12545394897461, 21.235042572021484, 10.0177001953125, 2.9277610778808594, 3.8271331787109375, 6.358345031738281, 5.795339584350586, 17.41168975830078, 2.8837356567382812, 15.591804504394531, 5.7954864501953125, -5.510986328125, 6.284950256347656, 1.105072021484375, 2.6191864013671875, 20.29132080078125, 20.354583740234375, 13.978485107421875, -6.003334045410156, 8.47320556640625, 22.208003997802734, -10.512338638305664, 13.895736694335938, 2.125560760498047, 0.3290290832519531, 17.032291412353516, -4.98272705078125, 4.870275497436523, -13.070222854614258, -0.6589393615722656, 11.413803100585938, 4.484020233154297, -2.5858078002929688, 19.327980041503906, 7.69110107421875, 5.2111358642578125, -2.7008514404296875, -1.4008216857910156, 22.272254943847656, 9.819255828857422, 10.63071060180664, -0.7953357696533203, 10.586387634277344, 8.237861633300781, 9.520004272460938, -2.6594390869140625, -0.3963623046875, 14.237789154052734, 5.5487060546875, 0.1078948974609375, 6.361572265625, -7.502716064453125, -6.4030303955078125, 16.94977378845215, 2.02685546875, 22.98614501953125, 18.562664031982422, 1.3566055297851562, -4.644168853759766, 11.129531860351562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000153.npy"} +{"epoch": 0.23129251700680273, "step": 154, "batch_size": 64, "mean": 4.9311418533325195, "std": 9.883354187011719, "min": -19.86865234375, "p10": -9.825269889831542, "median": 5.717607498168945, "p90": 16.556081199646, "max": 25.7401180267334, "pos_frac": 0.703125, "sample": [-11.650665283203125, 1.0302352905273438, -11.688735961914062, -19.86865234375, 21.48175811767578, 14.080137252807617, -10.451017379760742, 5.783039093017578, 4.5053253173828125, -12.327247619628906, 5.493919372558594, -0.36756134033203125, 13.315336227416992, 5.624786376953125, -7.451202392578125, -6.5950164794921875, -2.1901512145996094, 6.206214904785156, 0.3239707946777344, -0.9234695434570312, 13.453414916992188, 25.7401180267334, 23.52115249633789, 5.94036865234375, -11.49072265625, 8.981328964233398, 11.488311767578125, -2.5229721069335938, 13.80560302734375, -17.637557983398438, 8.111024856567383, 3.5224742889404297, 15.292427062988281, 15.613044738769531, 11.21990966796875, 0.15445709228515625, 10.437261581420898, 15.888668060302734, 8.774812698364258, 6.338817596435547, -1.5779228210449219, -0.5049896240234375, 11.40776252746582, -1.688405990600586, 2.724700927734375, 20.369016647338867, 9.006494522094727, 5.6521759033203125, 13.808692932128906, -8.365192413330078, 2.815093994140625, -3.8913497924804688, 2.267436981201172, 4.155952453613281, 9.197509765625, 6.6029815673828125, 18.009742736816406, -0.36350250244140625, 16.84211540222168, 19.594802856445312, 7.470314025878906, 8.967327117919922, 2.191743850708008, 9.93763542175293], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000154.npy"} +{"epoch": 0.2328042328042328, "step": 155, "batch_size": 64, "mean": 6.793376922607422, "std": 11.936128616333008, "min": -23.968914031982422, "p10": -5.8785461425781245, "median": 6.443656921386719, "p90": 23.59611053466797, "max": 31.19475555419922, "pos_frac": 0.703125, "sample": [6.405967712402344, -1.0987091064453125, 30.076019287109375, 6.481346130371094, 4.098052978515625, 8.252750396728516, 0.7073135375976562, 20.948450088500977, -2.6180171966552734, 14.002246856689453, 10.809196472167969, 15.07502555847168, 1.119720458984375, -6.002906799316406, -0.19622421264648438, -3.5673141479492188, 10.356689453125, 27.2340087890625, 9.948951721191406, 25.576129913330078, 24.045799255371094, -1.5228252410888672, 12.160331726074219, -13.173681259155273, 13.313369750976562, 25.925033569335938, -0.219573974609375, 17.577835083007812, -3.8721466064453125, 14.056709289550781, -16.760177612304688, 9.866737365722656, 21.85664176940918, 9.317344665527344, 31.19475555419922, 10.9998779296875, -0.682281494140625, 1.5111160278320312, -17.677841186523438, 18.5743408203125, -3.3440093994140625, 0.4892921447753906, 12.618377685546875, 1.0941238403320312, 26.902145385742188, 8.215877532958984, 4.917808532714844, 19.878768920898438, -11.8018798828125, 6.323341369628906, 7.559234619140625, 3.46954345703125, 2.6983566284179688, 2.1490478515625, 3.643566131591797, -0.9596481323242188, 7.6365966796875, -11.46505355834961, -23.968914031982422, -0.12521743774414062, 9.27691650390625, 22.546836853027344, 18.509319305419922, -5.588371276855469], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000155.npy"} +{"epoch": 0.23431594860166288, "step": 156, "batch_size": 64, "mean": 8.170764923095703, "std": 9.902298927307129, "min": -13.158992767333984, "p10": -3.4578039169311516, "median": 6.726469039916992, "p90": 21.76080894470215, "max": 29.610881805419922, "pos_frac": 0.78125, "sample": [5.4465789794921875, -3.665475845336914, -4.1167449951171875, -13.158992767333984, 11.16748046875, 27.323165893554688, 29.610881805419922, 11.452930450439453, 12.709075927734375, 21.63168716430664, 2.8868331909179688, 20.51764678955078, -6.314300537109375, 16.0924072265625, 17.857421875, 21.37713623046875, 21.627960205078125, 18.80642318725586, -0.6937465667724609, 12.923198699951172, 3.0291271209716797, 2.544862747192383, 6.938182830810547, 16.29931640625, -2.7279434204101562, 4.6925506591796875, 0.2232685089111328, 16.86138153076172, 4.751361846923828, 13.304420471191406, 8.437118530273438, 5.847412109375, -2.973236083984375, 11.454742431640625, 10.566177368164062, 27.475082397460938, -9.414520263671875, 7.324012756347656, -4.967987060546875, 24.83460235595703, 11.697616577148438, 21.816146850585938, 3.9196090698242188, 2.7992706298828125, 0.9414882659912109, 4.308254241943359, -0.7885208129882812, 0.1549530029296875, 9.146987915039062, -1.994537353515625, 7.882404327392578, 3.09649658203125, 11.051849365234375, -0.28774261474609375, 6.5147552490234375, 4.545166015625, -2.3958282470703125, 16.721092224121094, 22.73577880859375, 2.612680435180664, 7.102630615234375, 25.321533203125, 5.002971649169922, -6.957588195800781], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000156.npy"} +{"epoch": 0.23582766439909297, "step": 157, "batch_size": 64, "mean": 6.442737579345703, "std": 10.240446090698242, "min": -18.764244079589844, "p10": -4.999976348876952, "median": 6.175037384033203, "p90": 20.005600166320804, "max": 32.66676330566406, "pos_frac": 0.75, "sample": [25.27027130126953, 24.847227096557617, -4.634002685546875, 13.060821533203125, 16.31102752685547, -18.764244079589844, 5.1301116943359375, -4.1475830078125, 13.387947082519531, -5.156822204589844, 0.6237220764160156, 6.647575378417969, 17.239227294921875, 5.064973831176758, -16.919692993164062, 0.18338775634765625, 0.08400726318359375, 6.111930847167969, 14.100015640258789, 20.240251541137695, 7.188148498535156, 19.458080291748047, 32.66676330566406, 10.009244918823242, 9.540609359741211, 13.680244445800781, -6.253345489501953, -1.0575199127197266, 7.926326751708984, -2.331544876098633, 16.268407821655273, -0.40789031982421875, 10.519813537597656, 6.7032318115234375, 12.742576599121094, 21.51563262939453, -8.121429443359375, 22.40760040283203, 24.369155883789062, 2.5939254760742188, -2.6729049682617188, 3.6003036499023438, -0.7318325042724609, 15.5274658203125, 7.3947601318359375, 3.5223464965820312, 2.0181350708007812, 10.454627990722656, 9.106016159057617, 2.621767044067383, 1.9378433227539062, -2.7390708923339844, 10.613338470458984, 1.6339874267578125, 5.471229553222656, 13.620874404907227, 3.5786666870117188, 13.42910385131836, -7.84173583984375, 13.376224517822266, 0.3383636474609375, -1.9863815307617188, -14.274246215820312, 6.2381439208984375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000157.npy"} +{"epoch": 0.23733938019652306, "step": 158, "batch_size": 64, "mean": 6.766702175140381, "std": 10.772744178771973, "min": -17.61620330810547, "p10": -5.139881896972656, "median": 4.4038543701171875, "p90": 23.079129028320313, "max": 30.4222412109375, "pos_frac": 0.703125, "sample": [-1.214385986328125, 13.077049255371094, 1.8576278686523438, 8.56036376953125, -17.61620330810547, 15.123870849609375, 24.1390380859375, 11.198471069335938, -1.189697265625, 0.5314102172851562, 20.617752075195312, 10.152458190917969, 8.94146728515625, 16.626930236816406, -16.6361083984375, 13.746103286743164, 30.4222412109375, 4.132349014282227, 4.026933670043945, 6.148780822753906, -2.486553192138672, 4.3164520263671875, 12.984880447387695, 1.5405349731445312, 23.032997131347656, 13.329269409179688, -0.893341064453125, 23.098899841308594, 16.871002197265625, 12.654228210449219, -5.15924072265625, 10.117050170898438, 23.750877380371094, -0.8135147094726562, 22.228836059570312, 24.137338638305664, 14.627723693847656, -5.0947113037109375, 3.0229530334472656, -8.402420043945312, 18.961395263671875, 8.523399353027344, 1.640594482421875, 23.3970947265625, 12.60345458984375, 14.509590148925781, -3.8629322052001953, 3.9038009643554688, 25.992523193359375, -4.659553527832031, 4.4912567138671875, -3.7742080688476562, -7.369440078735352, 1.0667037963867188, 1.506866455078125, -0.0190887451171875, -4.473943710327148, 5.523799896240234, 11.4979248046875, 3.8431167602539062, -9.675067901611328, 2.6057586669921875, -0.2894859313964844, -8.38433837890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000158.npy"} +{"epoch": 0.23885109599395313, "step": 159, "batch_size": 64, "mean": 7.807815074920654, "std": 11.50208854675293, "min": -31.663833618164062, "p10": -4.5240884780883786, "median": 6.561983108520508, "p90": 23.851393699646, "max": 32.80104064941406, "pos_frac": 0.765625, "sample": [17.59420394897461, 13.550289154052734, 1.8111343383789062, 20.143272399902344, 9.592597961425781, -12.283195495605469, -6.575592041015625, 24.083642959594727, 2.4916763305664062, 32.80104064941406, 25.68475341796875, 5.182487487792969, 19.113977432250977, 6.87109375, -2.9157981872558594, 2.4329071044921875, 8.307022094726562, 30.39220428466797, 21.449295043945312, -0.26886940002441406, 2.122753143310547, -7.37481689453125, 5.993892669677734, 1.2533416748046875, 5.897735595703125, 3.5884342193603516, 2.5054378509521484, -8.551887512207031, 19.6358642578125, 23.309478759765625, -4.667762756347656, 15.469085693359375, 13.725666046142578, -0.3895263671875, 5.330535888671875, 10.383794784545898, 21.136795043945312, 9.67218017578125, 4.277587890625, -0.844818115234375, 6.252872467041016, -10.758132934570312, 25.684646606445312, 0.4436779022216797, 11.283760070800781, 24.861539840698242, -4.188848495483398, 14.501386642456055, -0.0482177734375, 7.349021911621094, 0.4431438446044922, 25.422935485839844, 8.702518463134766, -2.7656173706054688, -0.4163227081298828, -31.663833618164062, 17.89644432067871, 13.130622863769531, 0.2527313232421875, 7.748586654663086, 16.134986877441406, 6.245368957519531, 11.502639770507812, 9.752342224121094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000159.npy"} +{"epoch": 0.24036281179138322, "step": 160, "batch_size": 64, "mean": 6.543596267700195, "std": 11.584945678710938, "min": -16.208106994628906, "p10": -6.1406608581542965, "median": 3.895771026611328, "p90": 21.63063354492188, "max": 35.67005920410156, "pos_frac": 0.734375, "sample": [1.9078960418701172, -3.692859649658203, 14.3837890625, 29.38610076904297, 1.3036956787109375, 22.144638061523438, 3.98779296875, -4.90782356262207, 10.652416229248047, 11.87176513671875, 35.67005920410156, -5.451374053955078, 20.203886032104492, 18.39246368408203, 7.585620880126953, 17.37781524658203, 1.05755615234375, -16.208106994628906, 12.488086700439453, 9.896463394165039, -3.8764877319335938, -8.652713775634766, 3.0001144409179688, 0.7412338256835938, 11.109914779663086, 2.0759925842285156, 10.719528198242188, 1.773111343383789, 5.10784912109375, 1.6808433532714844, 13.862249374389648, 8.616281509399414, 34.652557373046875, 28.462581634521484, 2.806547164916992, -6.147489547729492, 13.341331481933594, 2.1377792358398438, -0.4054431915283203, 23.3345947265625, 2.4948997497558594, 13.46591567993164, 1.7875442504882812, -11.929206848144531, -5.042469024658203, 8.892784118652344, -12.515380859375, -6.124727249145508, 13.163040161132812, 11.530467987060547, -6.355308532714844, -4.103607177734375, -3.022491455078125, 12.69924545288086, 11.456504821777344, 3.2161941528320312, 1.6264915466308594, 25.578475952148438, -15.861839294433594, 3.8037490844726562, 20.431289672851562, 19.400802612304688, 7.225830078125, -5.4183197021484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000160.npy"} +{"epoch": 0.2418745275888133, "step": 161, "batch_size": 64, "mean": 7.221508502960205, "std": 11.262417793273926, "min": -28.25762176513672, "p10": -5.428259372711181, "median": 7.735631942749023, "p90": 21.245627593994147, "max": 35.79713439941406, "pos_frac": 0.765625, "sample": [8.705429077148438, -15.241436004638672, 3.4793930053710938, 9.347030639648438, 2.6523284912109375, -0.9352340698242188, 16.746307373046875, 28.14234161376953, -6.594005584716797, -4.4235334396362305, -9.741058349609375, 7.669929504394531, 11.239326477050781, 12.192245483398438, 24.940338134765625, 12.025175094604492, 7.896564483642578, -28.25762176513672, 15.64688491821289, -8.7962646484375, -3.83966064453125, 2.0735015869140625, 6.413932800292969, 2.3328018188476562, 17.388702392578125, -3.1335105895996094, 5.210765838623047, 13.37095832824707, 13.504920959472656, 1.9186859130859375, 19.96249008178711, 15.243934631347656, 10.042703628540039, 16.513580322265625, 17.829238891601562, -3.720367431640625, -9.551538467407227, 35.79713439941406, 24.936683654785156, 21.795543670654297, 3.9868087768554688, 14.216598510742188, -0.5914573669433594, 6.148765563964844, 10.161773681640625, 2.649494171142578, 7.801334381103516, 8.5, 5.8570709228515625, 17.920761108398438, -4.238883972167969, 8.024833679199219, 26.08739471435547, 7.1011199951171875, 0.7882003784179688, 0.531280517578125, -5.858856201171875, 2.9941673278808594, 10.645561218261719, 10.731674194335938, 30.65453338623047, -1.6390838623046875, 0.7534236907958984, 8.16537094116211], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000161.npy"} +{"epoch": 0.24338624338624337, "step": 162, "batch_size": 64, "mean": 9.471763610839844, "std": 11.352885246276855, "min": -20.252288818359375, "p10": -6.012054443359373, "median": 9.512802124023438, "p90": 23.42048225402832, "max": 41.63032531738281, "pos_frac": 0.8125, "sample": [13.657058715820312, 6.586708068847656, -20.252288818359375, 4.23895263671875, 4.501091003417969, 19.813373565673828, 13.150566101074219, 6.558280944824219, 18.860931396484375, 25.74064826965332, 14.823127746582031, 17.22232437133789, 5.10441780090332, 41.63032531738281, 21.050880432128906, 7.58137321472168, 9.744293212890625, 26.635475158691406, 16.7171630859375, 25.522891998291016, 24.512523651123047, 20.59897232055664, 4.940574645996094, -4.5740509033203125, 10.355621337890625, -1.2104110717773438, 9.28131103515625, 3.1129226684570312, -13.07135009765625, 14.94464111328125, 5.484590530395508, 5.024810791015625, 1.4119873046875, 17.330711364746094, 11.39739990234375, 10.565933227539062, 15.739189147949219, 16.495588302612305, -0.5538349151611328, -9.69699478149414, -9.277496337890625, -0.08502960205078125, 23.57982635498047, 19.43391990661621, 17.700700759887695, 7.379974365234375, -10.951148986816406, 13.468780517578125, -6.6283416748046875, 1.1193084716796875, 7.128376007080078, -0.21321868896484375, 10.51251220703125, 18.41115379333496, 23.04867935180664, 14.330436706542969, 2.788881301879883, -11.59332275390625, 4.5929412841796875, 4.970853805541992, 3.854673385620117, 21.522991180419922, 25.078092575073242, 5.041618347167969], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000162.npy"} +{"epoch": 0.24489795918367346, "step": 163, "batch_size": 64, "mean": 9.466161727905273, "std": 11.845919609069824, "min": -17.436067581176758, "p10": -8.07518196105957, "median": 8.202521324157715, "p90": 23.609619140625, "max": 31.98269271850586, "pos_frac": 0.765625, "sample": [-1.689009666442871, 9.922470092773438, -7.72357177734375, 16.893516540527344, 7.272743225097656, 2.9221153259277344, -17.436067581176758, 5.30438232421875, 26.738067626953125, -9.102615356445312, 7.897239685058594, 18.68018341064453, 27.98802947998047, 7.261451721191406, 6.017738342285156, 16.917823791503906, 19.97945785522461, -2.0003585815429688, 28.95867919921875, 13.193862915039062, 2.5155715942382812, 22.412986755371094, 21.145967483520508, -8.225872039794922, -7.4395751953125, 25.28509521484375, 12.056652069091797, 22.933883666992188, 7.095590591430664, 6.621971130371094, 14.038808822631836, 4.921142578125, 17.248741149902344, -2.8920135498046875, 16.775650024414062, 18.505340576171875, -8.542076110839844, 18.980209350585938, -8.96285629272461, 3.2423229217529297, 13.809158325195312, 31.98269271850586, 14.510040283203125, 23.171871185302734, 9.507171630859375, -2.4736804962158203, -0.4328804016113281, 8.264392852783203, 4.637744903564453, -0.7289314270019531, -14.36126708984375, 23.347604751586914, 17.177963256835938, 1.1770896911621094, 2.210124969482422, -9.82232666015625, 23.482513427734375, 23.664093017578125, 26.605552673339844, 21.71122932434082, 15.149782180786133, 2.9957447052001953, 6.394374847412109, 8.140649795532227], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000163.npy"} +{"epoch": 0.24640967498110355, "step": 164, "batch_size": 64, "mean": 9.158220291137695, "std": 12.572494506835938, "min": -25.2496337890625, "p10": -5.6632501602172844, "median": 8.589317321777344, "p90": 26.36508483886719, "max": 34.51060485839844, "pos_frac": 0.796875, "sample": [-0.6008529663085938, 0.676910400390625, -2.3072052001953125, 6.235340118408203, 5.27239990234375, 10.775459289550781, 31.624267578125, 19.01708221435547, -0.42604827880859375, 4.911064147949219, 10.675094604492188, -4.311271667480469, 17.72182846069336, -12.631141662597656, 9.891681671142578, 13.310623168945312, 18.043930053710938, 9.383781433105469, 33.97412109375, -5.9575653076171875, 5.6253662109375, -11.354248046875, 8.328865051269531, 8.68780517578125, 0.4008769989013672, 8.817779541015625, 25.706741333007812, 2.0113143920898438, 15.582656860351562, 3.6353073120117188, 25.273344039916992, 27.934402465820312, -4.97651481628418, 12.177371978759766, 3.5753173828125, -12.181503295898438, 27.356178283691406, 34.51060485839844, 28.505619049072266, -12.086616516113281, 8.375978469848633, 3.6570205688476562, 4.0221405029296875, 17.9205379486084, 13.967784881591797, 13.115571975708008, 22.493995666503906, 2.339183807373047, 21.22283935546875, 4.155330657958984, 5.5702667236328125, 0.3946266174316406, 25.265750885009766, -10.889738082885742, -0.1544513702392578, -25.2496337890625, 8.490829467773438, 22.90394401550293, 24.6060791015625, 1.7768745422363281, 26.647232055664062, 11.920761108398438, 11.669231414794922, 9.09381103515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000164.npy"} +{"epoch": 0.24792139077853365, "step": 165, "batch_size": 64, "mean": 8.27475357055664, "std": 12.540464401245117, "min": -22.06258773803711, "p10": -6.343541145324707, "median": 8.389144897460938, "p90": 23.227915954589847, "max": 31.614158630371094, "pos_frac": 0.75, "sample": [31.614158630371094, 8.547069549560547, 11.008096694946289, 19.35504913330078, 9.233478546142578, 1.381927490234375, 5.725673675537109, -2.3566436767578125, 11.450252532958984, 4.087091445922852, 3.12603759765625, 9.985523223876953, 27.348655700683594, 0.34609413146972656, -1.6041717529296875, 7.498054504394531, 9.078353881835938, 11.605445861816406, -19.96844482421875, -5.088920593261719, -17.30707550048828, -1.9274749755859375, 20.320785522460938, -3.325967788696289, 18.721771240234375, 22.226173400878906, 8.231220245361328, 14.539716720581055, 27.680639266967773, 28.286209106445312, 6.554107666015625, 0.8122653961181641, 27.896347045898438, 25.74195098876953, 16.42669677734375, -22.06258773803711, 1.8857421875, 16.179004669189453, 19.416919708251953, 19.427352905273438, -6.466733932495117, -2.53759765625, -2.2402496337890625, 4.58869743347168, 19.278610229492188, -6.97100830078125, 3.457775115966797, 1.8062896728515625, 16.4033203125, -2.344696044921875, -6.05609130859375, 19.85944366455078, -21.335952758789062, 22.170166015625, 4.91151237487793, -7.961162567138672, 8.626777648925781, 7.191614151000977, 18.449853897094727, 8.061431884765625, 22.168495178222656, 23.65723419189453, 16.43994903564453, 16.32996368408203], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000165.npy"} +{"epoch": 0.2494331065759637, "step": 166, "batch_size": 64, "mean": 6.372375965118408, "std": 10.831868171691895, "min": -11.46927261352539, "p10": -6.717937469482421, "median": 5.708564758300781, "p90": 22.015608215332033, "max": 31.84935760498047, "pos_frac": 0.65625, "sample": [14.966720581054688, -0.8010463714599609, -3.291351318359375, 14.365814208984375, 20.87274169921875, 1.98748779296875, -5.43096923828125, 22.376815795898438, 6.1523895263671875, 5.456512451171875, -4.059883117675781, 6.25645637512207, 26.271015167236328, -4.672431945800781, 19.21319580078125, 6.5659637451171875, -0.7297821044921875, 14.233510971069336, -5.876869201660156, 3.299774169921875, -3.430204391479492, 18.119892120361328, -7.309486389160156, 5.47003173828125, 24.386741638183594, 7.819574356079102, -7.6594390869140625, 17.13055419921875, 10.703460693359375, 8.042366027832031, -9.424041748046875, -11.46927261352539, 3.728292465209961, 22.949951171875, 17.817420959472656, -1.0715408325195312, 21.17279052734375, 3.244232177734375, 10.740486145019531, 12.466085433959961, 5.9470977783203125, 27.876998901367188, -6.0313262939453125, -7.012199401855469, 10.104705810546875, -4.95196533203125, -2.837646484375, 0.2432708740234375, 8.976673126220703, 31.84935760498047, 10.34722900390625, -8.840988159179688, 0.9232635498046875, 12.206253051757812, -8.748558044433594, -2.5072059631347656, 12.824966430664062, -4.288520812988281, 27.497116088867188, -2.612203598022461, 9.147659301757812, 14.172409057617188, 1.5936031341552734, 1.3681221008300781], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000166.npy"} +{"epoch": 0.2509448223733938, "step": 167, "batch_size": 64, "mean": 9.792556762695312, "std": 11.146574020385742, "min": -13.958206176757812, "p10": -2.0099220275878906, "median": 7.364554405212402, "p90": 25.333987426757815, "max": 32.29239273071289, "pos_frac": 0.828125, "sample": [5.018180847167969, 5.027286529541016, 4.281515121459961, 9.168102264404297, -9.29998779296875, 21.30628204345703, 11.402656555175781, 5.339027404785156, 7.325162887573242, 16.56244659423828, 19.227033615112305, 4.733619689941406, 8.575920104980469, -1.8129348754882812, -1.2799015045166016, 0.3214378356933594, 24.598793029785156, 22.417144775390625, 17.639328002929688, -0.096221923828125, -13.958206176757812, -0.3654975891113281, 4.665445327758789, 2.0005264282226562, 10.444267272949219, 0.9396514892578125, 4.071525573730469, 0.1562061309814453, 4.520015716552734, 13.735198974609375, 5.478759765625, 18.089244842529297, 3.545656204223633, 12.716739654541016, 13.54861068725586, 11.620208740234375, 30.62591552734375, 31.33135986328125, 20.134170532226562, 18.700294494628906, 2.538564682006836, 22.715126037597656, 1.1741714477539062, 7.4039459228515625, 18.52223777770996, -9.687103271484375, -9.725143432617188, 31.188308715820312, -2.0943450927734375, 18.02788543701172, 20.09653091430664, 1.0365791320800781, 3.3857059478759766, 32.29239273071289, 15.474006652832031, 25.834575653076172, -2.9943313598632812, 30.180511474609375, 19.93840789794922, 25.649070739746094, 12.600502014160156, 1.5167407989501953, 3.034027099609375, -3.839700698852539], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000167.npy"} +{"epoch": 0.25245653817082386, "step": 168, "batch_size": 64, "mean": 7.715989112854004, "std": 11.370248794555664, "min": -12.906585693359375, "p10": -4.7906036376953125, "median": 4.798636436462402, "p90": 24.15982933044434, "max": 30.001670837402344, "pos_frac": 0.671875, "sample": [7.360099792480469, -6.125694274902344, 26.813030242919922, -3.5525588989257812, 5.531431198120117, 23.809383392333984, 14.210128784179688, -2.8777542114257812, -12.906585693359375, -10.550262451171875, 7.122428894042969, -2.2625503540039062, 4.352958679199219, 27.938194274902344, 11.114730834960938, 4.750776290893555, 15.742973327636719, 4.84649658203125, 0.31882476806640625, 14.860191345214844, 13.093315124511719, -2.029926300048828, 2.2603759765625, 5.62774658203125, -0.5431919097900391, 10.754871368408203, 26.256637573242188, 2.701526641845703, -5.272911071777344, 16.199081420898438, 1.4459686279296875, -0.826385498046875, 8.906265258789062, 24.310020446777344, 23.459823608398438, -3.8051910400390625, 20.81646728515625, -0.5606231689453125, -0.54156494140625, 0.7883224487304688, 2.872518539428711, 30.001670837402344, -4.432197570800781, 22.95655059814453, 17.780838012695312, -0.9859809875488281, 15.157119750976562, -6.603363037109375, 2.7920761108398438, -2.806854248046875, 12.311538696289062, 11.199832916259766, 22.033782958984375, 3.4585609436035156, -3.9381866455078125, 23.752641677856445, -4.944206237792969, -6.745201110839844, -1.0607070922851562, 0.8892803192138672, 22.95359992980957, 28.745635986328125, 28.515151977539062, 6.3823394775390625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000168.npy"} +{"epoch": 0.25396825396825395, "step": 169, "batch_size": 64, "mean": 8.734575271606445, "std": 14.257360458374023, "min": -28.488243103027344, "p10": -5.676565170288084, "median": 7.618699073791504, "p90": 26.183674621582036, "max": 50.698760986328125, "pos_frac": 0.734375, "sample": [6.635520935058594, 25.427711486816406, 22.84423065185547, -11.087539672851562, 7.533693313598633, 2.865184783935547, -6.308307647705078, -0.0129852294921875, 9.865180969238281, 12.72994613647461, 9.009681701660156, 0.5320587158203125, 19.176177978515625, 25.531173706054688, 6.9849395751953125, -3.538503646850586, 5.119800567626953, 14.75360107421875, 14.809486389160156, -0.6376495361328125, -4.2024993896484375, 22.937255859375, 26.46331787109375, 9.936241149902344, -2.742938995361328, 45.457481384277344, 2.093963623046875, 8.723869323730469, -2.033344268798828, 11.111263275146484, 6.00163459777832, 5.265289306640625, 20.65676498413086, -2.499757766723633, 22.229957580566406, 5.214452743530273, 18.637365341186523, -28.488243103027344, 9.897294998168945, 8.093650817871094, -0.1298503875732422, 6.732845306396484, 2.3418540954589844, 0.7730026245117188, 7.703704833984375, 11.560409545898438, 9.419456481933594, 5.465789794921875, 28.097564697265625, 14.10125732421875, -0.1346282958984375, 11.608953475952148, 9.559066772460938, -18.680419921875, -11.51324462890625, 50.698760986328125, 29.80450439453125, 30.00287628173828, -15.276819229125977, 34.77456283569336, 3.0440902709960938, 21.56220054626465, -16.287811279296875, -1.2017707824707031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000169.npy"} +{"epoch": 0.25547996976568405, "step": 170, "batch_size": 64, "mean": 8.808406829833984, "std": 14.343451499938965, "min": -31.45802879333496, "p10": -12.345910072326658, "median": 9.594230651855469, "p90": 25.318323516845705, "max": 40.11839294433594, "pos_frac": 0.765625, "sample": [11.021537780761719, 0.7069244384765625, 10.53248405456543, 9.352703094482422, 2.258586883544922, 33.23304748535156, 8.250391006469727, 9.300891876220703, 5.1904144287109375, 30.266389846801758, -17.369342803955078, 3.7409801483154297, 16.31072998046875, 34.46476745605469, 28.485126495361328, -10.103208541870117, 3.0612430572509766, 12.29608154296875, 20.682525634765625, -2.8485260009765625, 4.293048858642578, 24.847824096679688, 17.355321884155273, 2.1306705474853516, -14.071952819824219, 11.847267150878906, -18.709182739257812, -3.1522903442382812, -31.45802879333496, 17.094940185546875, 22.954631805419922, 17.625656127929688, 21.19965362548828, 10.172792434692383, -13.30706787109375, 11.530303955078125, -7.654510498046875, 14.585334777832031, 22.08063507080078, -4.417510986328125, 11.567039489746094, -0.22576522827148438, -0.4548454284667969, 18.697418212890625, 8.576133728027344, 40.11839294433594, 10.910247802734375, 24.77446746826172, 7.813343048095703, 1.69970703125, 4.4100189208984375, -3.9619197845458984, 2.1120223999023438, 31.635616302490234, -13.645767211914062, 5.770252227783203, 19.858123779296875, 25.51996612548828, 1.1447334289550781, 9.835758209228516, 22.893150329589844, 23.56244659423828, 14.086967468261719, -16.740768432617188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000170.npy"} +{"epoch": 0.25699168556311414, "step": 171, "batch_size": 64, "mean": 9.60409927368164, "std": 15.218255996704102, "min": -35.224510192871094, "p10": -4.621766662597656, "median": 7.1346235275268555, "p90": 29.51597137451172, "max": 34.61268997192383, "pos_frac": 0.734375, "sample": [10.027061462402344, 7.429996490478516, 27.97418212890625, 6.474571228027344, 21.966873168945312, 31.49947738647461, 20.14383316040039, 26.87499237060547, 0.9746742248535156, 3.9780197143554688, -1.7380180358886719, 1.0789947509765625, 29.765708923339844, 14.200691223144531, 34.61268997192383, -4.594871520996094, 21.556304931640625, 5.717079162597656, 21.1441650390625, -1.1823883056640625, -0.7211666107177734, 7.015569686889648, 18.32917022705078, 0.458953857421875, 24.82077980041504, 1.0418281555175781, 11.91998291015625, 0.7307891845703125, 34.157188415527344, -26.029939651489258, 16.78227996826172, 16.616676330566406, 34.563072204589844, -8.597797393798828, 14.459896087646484, 27.152782440185547, -4.633293151855469, -12.00689697265625, 34.519893646240234, 27.737701416015625, -35.224510192871094, 4.052000045776367, 19.363933563232422, 3.6201934814453125, 4.6118011474609375, 28.933250427246094, 20.168182373046875, -0.7565383911132812, -3.05780029296875, 14.286102294921875, 7.2536773681640625, 31.548309326171875, 25.730958938598633, 1.547576904296875, -1.5381698608398438, -5.14764404296875, 10.9683837890625, -0.24725341796875, -2.629444122314453, -25.332290649414062, 18.376083374023438, 0.601715087890625, 2.3776397705078125, -1.0653305053710938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000171.npy"} +{"epoch": 0.2585034013605442, "step": 172, "batch_size": 64, "mean": 8.99052906036377, "std": 13.820164680480957, "min": -27.396331787109375, "p10": -6.334555816650391, "median": 7.858592987060547, "p90": 28.88657341003418, "max": 42.719512939453125, "pos_frac": 0.796875, "sample": [-11.283828735351562, 7.741188049316406, 1.9447860717773438, 7.9759979248046875, 2.0467376708984375, 1.391519546508789, -0.12882041931152344, 14.324405670166016, 19.252601623535156, 31.698522567749023, 42.719512939453125, 9.01318359375, 9.014854431152344, -0.7307968139648438, 17.721221923828125, 37.964927673339844, 12.473846435546875, -11.927749633789062, 0.8950843811035156, 8.698982238769531, 9.079505920410156, 2.824798583984375, -18.10911750793457, 1.017242431640625, 9.64974594116211, 7.332916259765625, 4.34539794921875, 17.034912109375, 18.105087280273438, -2.210723876953125, 14.492683410644531, 19.24651336669922, 9.383575439453125, 19.638031005859375, 1.2087593078613281, 1.405233383178711, 28.917892456054688, 17.45581817626953, 28.813495635986328, 2.4685821533203125, -0.9765911102294922, 9.901908874511719, 5.750759124755859, 22.1064510345459, 22.151241302490234, -19.073944091796875, 0.9466705322265625, -6.328804016113281, 2.2007064819335938, 11.110563278198242, -7.7943267822265625, 26.32904052734375, 31.15770721435547, -27.396331787109375, 1.9657440185546875, 19.4844970703125, 1.1851425170898438, 7.146278381347656, 1.8957557678222656, 29.67474937438965, -6.3370208740234375, -0.8579769134521484, 32.09790802001953, 26.147216796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000172.npy"} +{"epoch": 0.2600151171579743, "step": 173, "batch_size": 64, "mean": 9.58780288696289, "std": 17.049297332763672, "min": -27.98795509338379, "p10": -9.60881118774414, "median": 11.030343055725098, "p90": 33.10646896362306, "max": 44.93310546875, "pos_frac": 0.6875, "sample": [-14.285112380981445, 0.7993545532226562, -1.8832778930664062, 13.084369659423828, 19.83429718017578, 27.06438446044922, 10.97770881652832, -3.4637069702148438, -2.960458755493164, 19.566925048828125, 3.1193466186523438, 14.323509216308594, 30.50605010986328, -11.216670989990234, -6.462865829467773, 30.731468200683594, 38.45497131347656, 3.6983184814453125, 14.412660598754883, 1.4514808654785156, 14.37255859375, 35.501548767089844, -4.4939422607421875, 29.137542724609375, -27.98795509338379, -25.355972290039062, 14.09332275390625, 22.5106201171875, 4.435787200927734, 0.7089920043945312, -8.136329650878906, 34.76643371582031, -9.365678787231445, 34.107147216796875, 12.353401184082031, 3.0063819885253906, 25.861194610595703, -6.252899169921875, 18.983924865722656, 20.389358520507812, 11.876007080078125, 1.3917617797851562, 4.518808364868164, 30.77155303955078, 14.637165069580078, -25.460140228271484, -2.6108665466308594, -7.489105224609375, 44.93310546875, 23.741310119628906, 35.58441162109375, -18.3286190032959, 11.082977294921875, 23.223968505859375, 26.009075164794922, -2.8779830932617188, -1.213348388671875, -9.713010787963867, 12.331933975219727, 39.437744140625, 2.6182861328125, 21.39507293701172, -0.24762725830078125, 1.6187744140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000173.npy"} +{"epoch": 0.2615268329554044, "step": 174, "batch_size": 64, "mean": 10.215535163879395, "std": 14.521068572998047, "min": -27.12865447998047, "p10": -4.236135864257812, "median": 9.016300201416016, "p90": 30.020636367797856, "max": 39.526512145996094, "pos_frac": 0.765625, "sample": [8.242103576660156, 13.723762512207031, 20.94769287109375, 5.927999496459961, 11.918380737304688, -3.5675811767578125, 3.8272476196289062, 21.689483642578125, 4.240577697753906, 9.983844757080078, 31.292190551757812, 28.770858764648438, 4.009147644042969, -3.0338821411132812, 17.89324951171875, -2.8071746826171875, 26.32364273071289, 21.504369735717773, 19.612525939941406, -27.12865447998047, 31.95953369140625, 9.150581359863281, -2.6178550720214844, 18.073204040527344, 38.63714599609375, -1.1706295013427734, 10.654022216796875, -3.5096206665039062, 36.459747314453125, 7.624114990234375, 1.8787918090820312, 39.526512145996094, 35.745872497558594, -4.5226593017578125, 16.73751449584961, 13.419403076171875, 7.185691833496094, 8.88201904296875, 2.5173301696777344, 28.90191650390625, -11.071159362792969, 28.776641845703125, 9.195781707763672, 1.1840839385986328, -0.22838592529296875, 25.049407958984375, 19.02617645263672, -11.733871459960938, 30.50008773803711, 9.901031494140625, -24.068016052246094, 20.031448364257812, 3.2631874084472656, 0.7956199645996094, 18.51903533935547, -2.9222259521484375, 12.829681396484375, -9.222663879394531, 20.583431243896484, -13.719039916992188, 6.038366317749023, 4.126808166503906, 7.5259857177734375, 0.5103912353515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000174.npy"} +{"epoch": 0.26303854875283444, "step": 175, "batch_size": 64, "mean": 11.47942066192627, "std": 15.892118453979492, "min": -18.3057861328125, "p10": -7.709835052490234, "median": 7.5885162353515625, "p90": 32.8669059753418, "max": 46.277374267578125, "pos_frac": 0.734375, "sample": [-15.471227645874023, 19.9211368560791, -3.1941986083984375, 3.8038196563720703, -7.693092346191406, 22.73523712158203, 0.055377960205078125, 19.382904052734375, 8.157424926757812, -2.6748313903808594, 4.593170166015625, 33.61328125, 15.269939422607422, 20.99993896484375, -8.208927154541016, 31.710111618041992, 12.441543579101562, 28.070297241210938, 30.236419677734375, 3.60748291015625, 5.28070068359375, 5.464677810668945, 5.544380187988281, 30.966110229492188, 23.995010375976562, 11.413917541503906, 0.2601509094238281, -2.1484451293945312, 33.34495544433594, -18.3057861328125, 30.057533264160156, -1.6030960083007812, 10.965629577636719, 2.9798049926757812, 5.2831878662109375, -0.9006156921386719, 15.630516052246094, 37.28315353393555, -2.484853744506836, -17.068588256835938, 9.561767578125, -7.717010498046875, 1.6409683227539062, 7.0196075439453125, -5.9835357666015625, -2.421234130859375, 29.81816864013672, -8.818046569824219, 28.234603881835938, 31.75145721435547, 10.451435089111328, 30.575342178344727, 5.656181335449219, -9.356765747070312, 4.44818115234375, 28.84130096435547, -7.203508377075195, 37.61590576171875, 23.169158935546875, 46.277374267578125, 1.3257827758789062, 34.90678405761719, 15.424560546875, 36.15029525756836], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000175.npy"} +{"epoch": 0.26455026455026454, "step": 176, "batch_size": 64, "mean": 7.407505989074707, "std": 16.222379684448242, "min": -31.898880004882812, "p10": -10.099908447265623, "median": 6.42510986328125, "p90": 29.477928543090826, "max": 47.87983703613281, "pos_frac": 0.640625, "sample": [37.548919677734375, -25.089256286621094, 16.269187927246094, 18.64221954345703, 1.1718826293945312, 4.7918853759765625, -4.075675964355469, 17.57562255859375, 6.148996353149414, 2.58953857421875, -22.66436767578125, -10.611656188964844, -7.810634613037109, 9.44449234008789, -20.304649353027344, 30.020790100097656, -0.4237213134765625, 21.86477279663086, -3.16204833984375, -1.7485733032226562, -2.6239547729492188, -1.9097251892089844, 6.903364181518555, 38.887454986572266, 19.779632568359375, 14.410423278808594, -8.905830383300781, 21.715347290039062, 2.4456787109375, 22.821434020996094, 10.08343505859375, -0.7590065002441406, -2.5938568115234375, 24.643051147460938, 16.1960506439209, 35.18880081176758, 1.6634063720703125, 16.927413940429688, -0.09863662719726562, -10.903228759765625, 2.0358200073242188, 9.078765869140625, 14.086103439331055, 30.010906219482422, 9.041824340820312, 10.898685455322266, -5.4488525390625, -4.7899627685546875, 18.937667846679688, 28.23431396484375, -1.6565704345703125, 23.303512573242188, 1.6760635375976562, 17.554031372070312, 2.1125717163085938, 6.701223373413086, 47.87983703613281, -1.35040283203125, -3.4459609985351562, 36.84748840332031, 6.749992370605469, -31.898880004882812, 7.40069580078125, -23.927490234375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000176.npy"} +{"epoch": 0.2660619803476946, "step": 177, "batch_size": 64, "mean": 14.351624488830566, "std": 14.803488731384277, "min": -25.522369384765625, "p10": -1.2119991302490234, "median": 12.410210609436035, "p90": 34.722542190551756, "max": 43.50297546386719, "pos_frac": 0.859375, "sample": [5.096282958984375, 3.0454044342041016, 22.110891342163086, 43.50297546386719, 21.916404724121094, -1.2398414611816406, 10.212371826171875, 11.587921142578125, 40.55857849121094, 15.31201171875, 41.91083526611328, 32.997623443603516, 23.361127853393555, -0.7335929870605469, 13.283496856689453, -10.582679748535156, 35.893951416015625, 5.133819580078125, -4.2499237060546875, 12.964937210083008, 13.962799072265625, 13.018913269042969, 4.541286468505859, 32.22321319580078, 16.31609535217285, 1.9381561279296875, 7.479864120483398, 28.580535888671875, -4.714147567749023, 3.565540313720703, 13.641326904296875, 8.986373901367188, 33.32994079589844, 12.540374755859375, 5.840669631958008, 31.395206451416016, 32.135536193847656, 2.7250289916992188, 9.222381591796875, 24.13516616821289, 2.7665557861328125, 10.275400161743164, 23.71554183959961, 9.735733032226562, 22.3709716796875, -10.865135192871094, 1.944976806640625, -3.863067626953125, 34.368160247802734, 0.5918846130371094, 34.874420166015625, 0.6205120086669922, -25.522369384765625, 40.491207122802734, 9.843154907226562, 16.16602325439453, 16.71231460571289, 39.77581787109375, 24.0953369140625, 12.280046463012695, 6.938819885253906, 31.38181495666504, -1.14703369140625, 8.006034851074219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000177.npy"} +{"epoch": 0.2675736961451247, "step": 178, "batch_size": 64, "mean": 8.388181686401367, "std": 13.835724830627441, "min": -20.70525360107422, "p10": -8.400336456298827, "median": 7.405332565307617, "p90": 27.61176223754883, "max": 38.345699310302734, "pos_frac": 0.75, "sample": [8.841737747192383, 22.917755126953125, 7.993274688720703, -1.5144424438476562, 20.344928741455078, 0.7106685638427734, -1.3152542114257812, 15.240501403808594, 22.942276000976562, 10.029338836669922, -8.848342895507812, 5.544532775878906, 10.283477783203125, -17.947683334350586, 8.831588745117188, 4.782405853271484, 33.58395767211914, -0.6894092559814453, -7.354988098144531, -2.0243377685546875, 31.520484924316406, 4.999448776245117, 8.567672729492188, -19.480133056640625, 3.477985382080078, 5.14801025390625, 4.501655578613281, 8.597564697265625, 4.179603576660156, 5.715616226196289, 19.24603271484375, 0.0060367584228515625, 6.817390441894531, 38.345699310302734, 8.486282348632812, 10.60609245300293, 9.791000366210938, 4.939857482910156, 33.86253356933594, 5.494976043701172, -13.393753051757812, 24.354347229003906, 27.73102569580078, 5.567237854003906, -20.70525360107422, 31.949310302734375, -1.91607666015625, -13.676216125488281, 30.664871215820312, 4.122402191162109, 26.930862426757812, 27.333480834960938, 10.851278305053711, 21.93360137939453, 8.109582901000977, 2.140777587890625, 18.498611450195312, -5.623069763183594, -20.311843872070312, -1.918701171875, 14.882732391357422, 17.685928344726562, 17.752212524414062, -3.295520782470703], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000178.npy"} +{"epoch": 0.2690854119425548, "step": 179, "batch_size": 64, "mean": 10.528969764709473, "std": 16.548751831054688, "min": -33.02692413330078, "p10": -10.929036903381347, "median": 9.83825397491455, "p90": 30.459345054626468, "max": 51.864349365234375, "pos_frac": 0.765625, "sample": [16.98517608642578, -4.2659149169921875, -2.751220703125, 12.265274047851562, 0.9268722534179688, 13.95379638671875, 12.906339645385742, 17.652618408203125, 37.073455810546875, 17.490375518798828, 29.845468521118164, 29.2108154296875, 27.353408813476562, -19.880813598632812, 8.767242431640625, -13.391529083251953, -33.02692413330078, -10.146459579467773, 3.4414443969726562, 9.8431396484375, -3.1277084350585938, 24.57172393798828, 9.11590576171875, 24.577301025390625, 32.71955108642578, -22.22716522216797, -2.6830978393554688, 26.337905883789062, 6.675878524780273, 9.833368301391602, 12.791057586669922, 22.26677703857422, 4.321502685546875, -6.0469512939453125, 1.4191665649414062, -11.379348754882812, 8.539932250976562, 49.029693603515625, 30.722434997558594, 0.8404159545898438, 18.6937313079834, 20.118438720703125, 19.915956497192383, 12.333026885986328, -11.264427185058594, 20.005722045898438, 37.09541320800781, 7.134437561035156, 34.21063995361328, 51.864349365234375, 19.868877410888672, 18.24204444885254, 23.6121826171875, 4.311676025390625, 0.293487548828125, 16.693588256835938, 8.143592834472656, 0.7957916259765625, 7.344884872436523, -1.778961181640625, -17.4738826751709, 0.476287841796875, 15.228981018066406, -4.5626678466796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000179.npy"} +{"epoch": 0.2705971277399849, "step": 180, "batch_size": 64, "mean": 8.647587776184082, "std": 15.90718936920166, "min": -30.522979736328125, "p10": -10.546871948242185, "median": 6.952813148498535, "p90": 32.66838684082032, "max": 41.494346618652344, "pos_frac": 0.75, "sample": [16.732437133789062, 0.7759132385253906, 6.746622085571289, 5.499717712402344, 3.1851654052734375, 12.530754089355469, -11.622108459472656, 10.420597076416016, 1.0125408172607422, -2.490039825439453, 32.931495666503906, 9.632293701171875, -6.9556732177734375, -0.4054832458496094, 7.159004211425781, 1.2518329620361328, -12.40142822265625, 31.127731323242188, 0.6745872497558594, -27.110733032226562, 36.22331237792969, 11.818418502807617, 5.959249496459961, 25.72589111328125, 11.277389526367188, 21.974727630615234, 0.3417625427246094, 1.1767654418945312, 7.213691711425781, 13.080509185791016, 10.735130310058594, 28.71976089477539, -14.367897033691406, 3.1665496826171875, 9.051219940185547, 14.403396606445312, 7.4856109619140625, 38.034141540527344, -0.2865734100341797, -2.4215736389160156, 5.580801010131836, 24.256757736206055, 34.361572265625, -0.08879661560058594, -3.890960693359375, 1.893106460571289, 38.642250061035156, -3.3841476440429688, 41.494346618652344, 4.128957748413086, 29.591598510742188, -18.327239990234375, 6.11962890625, -8.037986755371094, 10.293251037597656, 9.469097137451172, 38.493690490722656, -30.522979736328125, 18.695667266845703, -17.818397521972656, 17.766281127929688, 11.079105377197266, 32.054466247558594, 3.5888500213623047], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000180.npy"} +{"epoch": 0.272108843537415, "step": 181, "batch_size": 64, "mean": 12.549201965332031, "std": 14.12546157836914, "min": -15.894725799560547, "p10": -2.0698545455932607, "median": 10.173263549804688, "p90": 32.609564590454106, "max": 45.204498291015625, "pos_frac": 0.84375, "sample": [16.143646240234375, 15.314620971679688, -0.30326080322265625, 0.0007457733154296875, 5.266628265380859, 1.5847015380859375, 10.849380493164062, -10.371734619140625, 3.712696075439453, 1.3521842956542969, 24.42218780517578, 6.500144958496094, 15.06808090209961, -9.140396118164062, 16.714706420898438, 7.3711700439453125, 23.710063934326172, 6.262306213378906, 28.46484375, -8.02166748046875, 21.327484130859375, 34.50120544433594, 22.638927459716797, 17.325538635253906, 40.01466369628906, 20.966659545898438, 7.0601654052734375, 45.204498291015625, 2.4926605224609375, -15.894725799560547, 24.67359161376953, 3.413684844970703, 40.633087158203125, -7.164003372192383, 21.622802734375, 1.1117782592773438, -1.2269420623779297, 38.6590576171875, 2.7295188903808594, 7.962074279785156, 27.40018081665039, 4.992897033691406, 24.818527221679688, 32.994773864746094, 28.259899139404297, 2.875761032104492, 3.1008167266845703, 10.627969741821289, 11.740036010742188, 0.5458812713623047, 3.785236358642578, 31.710742950439453, 42.06462097167969, 3.0309524536132812, 9.84918212890625, 24.59535026550293, 3.8989105224609375, 10.497344970703125, 10.658731460571289, -2.431102752685547, 15.154403686523438, -0.3840522766113281, 24.037864685058594, -3.6288299560546875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000181.npy"} +{"epoch": 0.273620559334845, "step": 182, "batch_size": 64, "mean": 13.048293113708496, "std": 17.718387603759766, "min": -35.30078887939453, "p10": -7.317450714111328, "median": 10.412932395935059, "p90": 36.22970886230469, "max": 44.21156311035156, "pos_frac": 0.78125, "sample": [33.24790954589844, -13.794347763061523, -10.742145538330078, 16.205039978027344, 22.379501342773438, 20.02495574951172, 19.264728546142578, -11.067642211914062, -7.152015686035156, 33.76686096191406, 17.59689712524414, 5.150169372558594, 44.21156311035156, 2.9590911865234375, 33.354339599609375, 21.134552001953125, 10.394210815429688, 9.296257019042969, 33.98283767700195, 12.269111633300781, 21.31342124938965, 0.9451770782470703, 2.0880279541015625, -7.3883514404296875, 24.97796630859375, 0.4759979248046875, 30.530515670776367, 7.771886825561523, 35.567626953125, 34.77989196777344, 41.60169982910156, 12.041671752929688, 8.606399536132812, 7.151203155517578, 38.08275604248047, 1.1484527587890625, 0.5216827392578125, 4.177177429199219, 36.513458251953125, -0.4886932373046875, 11.169136047363281, -21.852270126342773, 40.347373962402344, -3.0630111694335938, 32.91335678100586, 27.30327606201172, 5.184568405151367, -5.8684844970703125, 28.636962890625, 3.5489273071289062, 25.481590270996094, 36.79859161376953, -6.861991882324219, 28.83913230895996, 38.06977081298828, 6.024787902832031, -4.259979248046875, 10.43165397644043, 31.299072265625, 3.0914230346679688, 6.315208435058594, -15.072212219238281, -0.9851837158203125, -35.30078887939453], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000182.npy"} +{"epoch": 0.2751322751322751, "step": 183, "batch_size": 64, "mean": 5.453709602355957, "std": 14.863180160522461, "min": -37.797019958496094, "p10": -11.45608139038086, "median": 3.554828643798828, "p90": 26.223431396484383, "max": 35.78443145751953, "pos_frac": 0.671875, "sample": [4.971992492675781, 31.44646453857422, -1.6159286499023438, 0.5001907348632812, 5.557910919189453, -4.327690124511719, -18.381744384765625, 31.179969787597656, -11.466987609863281, -3.5596771240234375, -37.797019958496094, -1.773895263671875, 21.510854721069336, -5.83740234375, 14.116832733154297, 16.893733978271484, -1.1362934112548828, 15.895111083984375, 21.247215270996094, 14.528860092163086, 18.0546875, -4.3426666259765625, 19.13507080078125, -6.285646438598633, 2.7235183715820312, -4.8717803955078125, 9.623062133789062, 0.46448516845703125, -21.36407470703125, -11.430633544921875, 35.78443145751953, 9.623001098632812, 3.6174087524414062, 2.394519805908203, -8.965324401855469, 10.253898620605469, 11.20596694946289, 32.902381896972656, -31.85352325439453, 29.42477035522461, -5.938976287841797, 0.4132232666015625, 31.448707580566406, -3.0127525329589844, 2.2778892517089844, 7.873126983642578, 14.371049880981445, 3.49224853515625, -11.557723999023438, -0.9199199676513672, 9.379219055175781, 8.276947021484375, 1.6327896118164062, 1.6324005126953125, 23.92864990234375, 0.3729362487792969, 16.12579345703125, -13.8753662109375, 3.705402374267578, 1.8041152954101562, 8.988052368164062, 27.2069091796875, 20.47714614868164, 12.889495849609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000183.npy"} +{"epoch": 0.2766439909297052, "step": 184, "batch_size": 64, "mean": 9.592950820922852, "std": 13.45799446105957, "min": -12.73995590209961, "p10": -2.914466094970703, "median": 5.166582107543945, "p90": 30.47347755432129, "max": 40.05155944824219, "pos_frac": 0.6875, "sample": [1.172943115234375, 28.45323944091797, 31.718273162841797, 0.17704010009765625, 16.803871154785156, 1.1927337646484375, -1.0564155578613281, -1.3458633422851562, -1.8343505859375, 1.7201309204101562, -0.09967613220214844, 32.816688537597656, -0.5950164794921875, 8.585269927978516, 26.31204605102539, -6.072784423828125, 21.93120574951172, 12.986167907714844, 9.651687622070312, 35.55387878417969, -11.056816101074219, 40.05155944824219, 20.7310791015625, 36.471221923828125, -12.411209106445312, 30.29425048828125, 8.845804214477539, 13.67578125, 30.550289154052734, 2.1257858276367188, 20.89904022216797, -0.0816650390625, 5.158256530761719, -12.73995590209961, -0.19294357299804688, 9.236106872558594, 36.998226165771484, 11.639707565307617, 0.30770111083984375, 25.74750518798828, 13.020811080932617, -1.0304641723632812, 18.70494842529297, 0.10219764709472656, 16.171539306640625, 5.174907684326172, 17.092864990234375, 9.354522705078125, -0.11868858337402344, 29.740081787109375, -10.734243392944336, -2.4567413330078125, 8.959152221679688, 4.982917785644531, 17.304306030273438, 13.466583251953125, -3.6526050567626953, 3.6053466796875, -1.0306835174560547, 4.131988525390625, -3.1106338500976562, 2.575428009033203, -1.2009849548339844, -1.4244537353515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000184.npy"} +{"epoch": 0.2781557067271353, "step": 185, "batch_size": 64, "mean": 10.887737274169922, "std": 18.888517379760742, "min": -32.54076385498047, "p10": -12.943129158020017, "median": 12.040298461914062, "p90": 34.23690605163574, "max": 46.38831329345703, "pos_frac": 0.6875, "sample": [5.126249313354492, 41.164390563964844, -1.8502044677734375, 21.207319259643555, 41.600921630859375, -23.413997650146484, 13.451229095458984, 9.705081939697266, -7.3896026611328125, 5.1321868896484375, 37.604156494140625, 37.937034606933594, 0.528900146484375, -13.679298400878906, 43.24955749511719, 5.075048446655273, 46.38831329345703, 9.753623962402344, 31.736995697021484, 34.576480865478516, -6.116909027099609, 32.754852294921875, 23.50381851196289, 8.236518859863281, 1.6750240325927734, 26.61978530883789, 16.79227638244629, 14.571846008300781, 8.554603576660156, 26.908355712890625, -9.733524322509766, -1.8659210205078125, 17.00309944152832, 22.581558227539062, -30.061466217041016, 23.30980682373047, 26.895645141601562, 20.661592483520508, 18.679027557373047, -3.5738162994384766, -32.54076385498047, 11.979598999023438, -5.2272491455078125, 16.999008178710938, 29.18365478515625, -21.616928100585938, 31.661283493041992, -3.3799686431884766, 33.44456481933594, -5.140439987182617, 12.100997924804688, -14.440374374389648, 18.025611877441406, -8.227367401123047, 1.2916717529296875, 14.380516052246094, -18.311969757080078, -11.225400924682617, 16.406097412109375, -2.18048095703125, -7.877948760986328, 5.301921844482422, 29.432819366455078, 31.47577476501465], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000185.npy"} +{"epoch": 0.2796674225245654, "step": 186, "batch_size": 64, "mean": 12.024774551391602, "std": 18.4840087890625, "min": -37.326942443847656, "p10": -6.9321191787719725, "median": 9.701677322387695, "p90": 35.46608581542969, "max": 52.528839111328125, "pos_frac": 0.71875, "sample": [19.475051879882812, 43.61553955078125, -21.615371704101562, 14.434211730957031, 22.91313934326172, -10.490753173828125, 8.099685668945312, -16.670795440673828, -6.0579681396484375, 27.758811950683594, 14.991928100585938, -3.9978981018066406, 17.874603271484375, 21.874191284179688, 50.806915283203125, 27.332019805908203, 5.517986297607422, 5.996131896972656, 7.864093780517578, -27.598648071289062, 6.749483108520508, 27.28499412536621, 28.028966903686523, 41.873435974121094, -37.326942443847656, -4.693824768066406, -5.888669967651367, -5.53080940246582, -3.660247802734375, 2.1376876831054688, 6.8733673095703125, 24.261247634887695, 8.983062744140625, -3.7664642333984375, -6.41267204284668, -2.896251678466797, 15.742813110351562, 33.30083465576172, 28.160972595214844, 2.0824203491210938, -4.016254425048828, -9.558197021484375, 5.413356781005859, 6.300689697265625, 18.924591064453125, 7.506660461425781, 36.39405059814453, 21.430084228515625, -7.1547393798828125, 15.123710632324219, 47.26936340332031, 8.814741134643555, 14.309379577636719, 52.528839111328125, 20.097976684570312, 16.449562072753906, 43.91114807128906, 30.938806533813477, 26.628829956054688, 19.218236923217773, 9.390274047851562, 24.409713745117188, -2.1845932006835938, 10.013080596923828], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000186.npy"} +{"epoch": 0.2811791383219955, "step": 187, "batch_size": 64, "mean": 10.597940444946289, "std": 18.562044143676758, "min": -30.390464782714844, "p10": -12.270597076416015, "median": 8.308187484741211, "p90": 35.40408630371094, "max": 50.15373229980469, "pos_frac": 0.71875, "sample": [13.569541931152344, -10.244964599609375, 31.96149444580078, 42.67717742919922, 50.15373229980469, 17.907684326171875, 17.581687927246094, 8.438671112060547, 6.5084686279296875, 35.3704833984375, -30.390464782714844, 13.006393432617188, -0.3786811828613281, 13.245803833007812, 14.61083984375, 1.2048511505126953, 1.4417362213134766, 26.24615478515625, 25.079376220703125, 6.580961227416992, -14.800079345703125, -28.925199508666992, 35.87397003173828, -0.8288002014160156, 3.7068405151367188, -5.2181396484375, 1.7643623352050781, 5.39776611328125, 8.177703857421875, 34.06824493408203, 28.928695678710938, 35.418487548828125, -12.895912170410156, -2.2162094116210938, 15.2816162109375, 11.476669311523438, 5.968837738037109, 1.4943695068359375, -11.007942199707031, 19.54462432861328, -3.528951644897461, -12.447410583496094, 30.034381866455078, 0.2000255584716797, 6.3526153564453125, 17.00592803955078, 39.816200256347656, -9.922237396240234, 12.04693603515625, 23.63787841796875, 33.922210693359375, -17.13678741455078, 23.94872283935547, 46.23785400390625, 3.2656822204589844, -2.275543212890625, 43.53497314453125, 35.24745178222656, 1.9866943359375, 8.867790222167969, -4.9478912353515625, -17.974184036254883, -11.8580322265625, 16.472999572753906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000187.npy"} +{"epoch": 0.28269085411942557, "step": 188, "batch_size": 64, "mean": 11.996978759765625, "std": 17.510475158691406, "min": -33.661224365234375, "p10": -5.284844398498534, "median": 7.537052154541016, "p90": 36.56811256408692, "max": 49.39274597167969, "pos_frac": 0.8125, "sample": [5.637939453125, -3.895334243774414, 41.307064056396484, -10.137178421020508, -0.36855316162109375, 34.07051086425781, 28.887344360351562, 5.608652114868164, 31.429595947265625, 14.703277587890625, 3.618255615234375, 49.39274597167969, 35.59791946411133, 0.220123291015625, 0.22647666931152344, 1.9456329345703125, 21.586013793945312, 39.896644592285156, 1.0512981414794922, -4.51966667175293, 14.207324981689453, 3.9550933837890625, 1.1655349731445312, 2.7729721069335938, 11.024421691894531, -2.0163650512695312, -8.232990264892578, 29.389816284179688, 11.611408233642578, 29.748165130615234, 14.998395919799805, 6.209053039550781, 6.716522216796875, 48.338951110839844, 30.902633666992188, 1.0519981384277344, 35.15135192871094, 7.4383087158203125, 7.635795593261719, 9.90350341796875, 41.39803695678711, 1.09326171875, 5.121715545654297, 18.43585205078125, 0.47264862060546875, -1.2041778564453125, 2.7972278594970703, 34.845909118652344, 3.575164794921875, 0.9523067474365234, 36.51214599609375, -22.500198364257812, -5.6127777099609375, 8.542404174804688, 12.303939819335938, 7.704441070556641, 8.343862533569336, -15.011003494262695, 28.68499755859375, 36.592098236083984, 37.291656494140625, 9.661659240722656, -6.763940811157227, -33.661224365234375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000188.npy"} +{"epoch": 0.2842025699168556, "step": 189, "batch_size": 64, "mean": 10.962713241577148, "std": 17.227493286132812, "min": -30.78830337524414, "p10": -12.777196121215818, "median": 10.402862548828125, "p90": 36.71910285949707, "max": 49.29650115966797, "pos_frac": 0.796875, "sample": [-1.1151123046875, 13.851051330566406, 10.467254638671875, 20.407913208007812, 13.99493408203125, 39.334930419921875, 38.886474609375, 15.47071647644043, 2.277902603149414, 11.092910766601562, -20.806884765625, 37.02103805541992, -16.863555908203125, 3.0199432373046875, -1.3231735229492188, -2.271757125854492, 40.835227966308594, 26.148662567138672, -13.947032928466797, 15.658584594726562, 8.046749114990234, 20.212539672851562, 6.505588531494141, 10.732208251953125, -0.02686309814453125, 2.9246387481689453, 20.809814453125, 16.849287033081055, 4.7248077392578125, 1.3896560668945312, 35.77442932128906, -10.047576904296875, 4.531990051269531, 37.859291076660156, 36.01458740234375, 10.803016662597656, 0.31433868408203125, 4.7812957763671875, 6.5728302001953125, 16.994972229003906, 35.68722915649414, 12.212493896484375, 21.8897762298584, 11.602340698242188, 16.222076416015625, 6.004329681396484, -5.883846282958984, -21.83855628967285, 10.338470458984375, 4.892127990722656, 1.3737030029296875, 21.386568069458008, -21.226486206054688, 49.29650115966797, 29.080307006835938, 6.430309295654297, -15.799057006835938, -30.78830337524414, 11.4404296875, 6.9324951171875, 7.890649795532227, 2.3738021850585938, 42.739341735839844, 31.449312210083008], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000189.npy"} +{"epoch": 0.2857142857142857, "step": 190, "batch_size": 64, "mean": 14.685094833374023, "std": 17.54672622680664, "min": -21.308486938476562, "p10": -6.7051952362060545, "median": 12.075210571289062, "p90": 39.948209381103524, "max": 52.8197021484375, "pos_frac": 0.796875, "sample": [7.679067611694336, 28.77496337890625, 50.26390075683594, -7.1127166748046875, 19.012447357177734, 29.039657592773438, 0.77264404296875, 3.4366912841796875, -11.521217346191406, 43.080780029296875, 12.280685424804688, 27.740158081054688, 10.493860244750977, 1.0776901245117188, 11.869735717773438, 2.1030502319335938, -6.304943084716797, 40.62744140625, 9.483358383178711, 9.038541793823242, 30.908267974853516, 43.21061325073242, -0.19024658203125, 4.03985595703125, -4.73356819152832, 14.469890594482422, -21.308486938476562, 7.755428314208984, 5.827655792236328, 20.293140411376953, 15.436317443847656, -4.322395324707031, 9.569473266601562, 17.87176513671875, 26.719375610351562, 2.3757896423339844, 36.84321594238281, -8.307268142700195, -3.148895263671875, 19.703563690185547, -10.573921203613281, 24.719833374023438, 31.34033203125, 52.8197021484375, 7.937604904174805, 2.047821044921875, -2.153463363647461, 24.468841552734375, -13.687789916992188, -6.876731872558594, 14.938753128051758, 13.087379455566406, 3.9883995056152344, 34.77967834472656, 17.567123413085938, 43.697975158691406, 48.693634033203125, 3.9719924926757812, 29.631698608398438, 38.36333465576172, 0.6178131103515625, 37.356201171875, 27.269805908203125, 20.990812301635742], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000190.npy"} +{"epoch": 0.2872260015117158, "step": 191, "batch_size": 64, "mean": 11.592092514038086, "std": 18.686491012573242, "min": -36.37422180175781, "p10": -5.732493400573729, "median": 12.00841236114502, "p90": 36.89715347290039, "max": 47.91888427734375, "pos_frac": 0.75, "sample": [35.36023712158203, -3.073040008544922, 13.083831787109375, 23.943641662597656, 46.451175689697266, -1.8587722778320312, 10.71075439453125, 41.85834503173828, 11.847627639770508, 5.26666259765625, 1.6931915283203125, 47.91888427734375, 12.169197082519531, -2.598865509033203, 11.612449645996094, 2.8199462890625, -35.8446044921875, 7.125022888183594, 39.850067138671875, 16.235837936401367, 12.490516662597656, 25.65478515625, 15.017532348632812, 36.77751922607422, -22.013328552246094, 32.30670166015625, 18.63702392578125, 15.89065933227539, -4.2126922607421875, -0.03531646728515625, 14.333389282226562, -0.8812103271484375, -0.9513645172119141, 2.1762351989746094, 40.35652160644531, -30.252975463867188, -0.18903732299804688, -19.124237060546875, 9.769229888916016, 29.49256134033203, 18.31009292602539, 14.534900665283203, 12.472763061523438, 16.959762573242188, 26.956045150756836, 3.3189144134521484, 33.01203918457031, 40.84902572631836, -6.38383674621582, 3.2883529663085938, -3.7677135467529297, 8.84257698059082, 36.94842529296875, 12.312713623046875, -9.38925552368164, 19.650482177734375, 32.959716796875, -36.37422180175781, 20.71250343322754, 1.999725341796875, 1.212554931640625, 29.36859130859375, 1.1035308837890625, 3.1821212768554688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000191.npy"} +{"epoch": 0.2887377173091459, "step": 192, "batch_size": 64, "mean": 7.284989356994629, "std": 15.297758102416992, "min": -38.96495056152344, "p10": -7.440819740295409, "median": 4.816825866699219, "p90": 26.5660499572754, "max": 44.303367614746094, "pos_frac": 0.671875, "sample": [-38.96495056152344, -15.139789581298828, 3.9317588806152344, 17.204029083251953, 21.785404205322266, 3.634157180786133, -4.657859802246094, 12.922134399414062, 40.74042510986328, -14.085739135742188, -9.84896469116211, -5.6241302490234375, -1.1364364624023438, 1.2840213775634766, 3.0823440551757812, 10.11065673828125, 27.487560272216797, 5.2724456787109375, -2.968761444091797, 2.0220108032226562, 28.174474716186523, 24.0758056640625, -4.189186096191406, -2.829181671142578, 35.04625701904297, -0.3566474914550781, 9.740249633789062, 24.41585922241211, 4.0962066650390625, 4.3612060546875, 11.491622924804688, 24.191978454589844, 21.880247116088867, 22.5787410736084, -3.361865997314453, -6.517814636230469, 6.508460998535156, -1.519296646118164, -4.631198883056641, 8.333549499511719, 7.116731643676758, -3.986309051513672, -23.501495361328125, 44.303367614746094, 17.895721435546875, 7.191188812255859, -3.3549633026123047, 2.4854507446289062, 9.343986511230469, -18.422119140625, 10.558334350585938, 33.95746994018555, 2.8202133178710938, 17.632774353027344, 0.027379989624023438, 18.632347106933594, 14.198558807373047, -2.3479537963867188, 22.743446350097656, 32.02098846435547, 17.561351776123047, -7.836393356323242, 2.59765625, 6.06181526184082], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000192.npy"} +{"epoch": 0.29024943310657597, "step": 193, "batch_size": 64, "mean": 13.545097351074219, "std": 17.217260360717773, "min": -33.3223991394043, "p10": -3.205062675476074, "median": 8.407800674438477, "p90": 37.1013111114502, "max": 52.53692626953125, "pos_frac": 0.796875, "sample": [0.7404327392578125, 6.849542617797852, 29.48521614074707, 8.20941162109375, 5.657571792602539, -11.69281005859375, 3.21319580078125, 35.7230224609375, -6.44525146484375, -3.353422164916992, 33.79004669189453, 2.210826873779297, 18.67310333251953, 22.472030639648438, 32.52595520019531, -0.693359375, 19.521820068359375, -5.067218780517578, 24.376535415649414, 27.909866333007812, -2.0772705078125, 35.26068878173828, 52.53692626953125, -5.838405609130859, 24.33057403564453, 37.5205078125, 2.7002525329589844, 4.140357971191406, -1.738555908203125, 14.82194709777832, 34.75019073486328, 20.870750427246094, 5.1516876220703125, 13.142005920410156, 12.832099914550781, 8.528305053710938, -2.5692672729492188, 5.055656433105469, 15.934822082519531, 12.925796508789062, -12.831192016601562, 7.282260894775391, 33.6441535949707, 47.096160888671875, -2.8588905334472656, 4.3953704833984375, 16.353086471557617, -1.5492782592773438, 8.287296295166016, 42.209495544433594, 28.386436462402344, 0.9128971099853516, 43.06922912597656, 44.37262725830078, 37.519161224365234, 3.284149169921875, 16.386734008789062, -33.3223991394043, 10.052688598632812, 36.12632751464844, 1.0585975646972656, 2.926492691040039, 1.4494781494140625, 0.2497234344482422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000193.npy"} +{"epoch": 0.29176114890400606, "step": 194, "batch_size": 64, "mean": 11.22519302368164, "std": 20.43451690673828, "min": -37.97724914550781, "p10": -13.208235168457028, "median": 10.984803199768066, "p90": 38.943169403076176, "max": 49.671974182128906, "pos_frac": 0.734375, "sample": [45.38682556152344, 5.1521453857421875, 17.042892456054688, -15.911039352416992, 34.769439697265625, 6.144100189208984, -27.137659072875977, 2.988483428955078, 4.246391296386719, 11.707077026367188, 8.3812255859375, 19.053146362304688, 5.536689758300781, 34.58219909667969, -14.878509521484375, -7.0769805908203125, 22.003585815429688, -9.310928344726562, 15.68056869506836, -2.2403945922851562, 25.043380737304688, 4.657634735107422, 26.216476440429688, 32.06140899658203, -5.659612655639648, 16.652244567871094, -8.601959228515625, 24.9122314453125, -1.7025833129882812, 15.317939758300781, -2.488494873046875, 38.14612579345703, -17.319087982177734, -7.401462554931641, -32.541893005371094, -1.4712848663330078, 48.59837341308594, 21.099441528320312, 15.209484100341797, 42.80516815185547, -37.97724914550781, 12.59259033203125, 5.599309921264648, 2.2652969360351562, 19.71367645263672, 46.33338928222656, 11.585739135742188, -37.09149932861328, 49.671974182128906, 25.811279296875, 20.465927124023438, 1.4329376220703125, 24.995559692382812, 39.284759521484375, 37.384368896484375, 46.18207550048828, 11.93780517578125, 0.8286972045898438, 6.294471740722656, 25.069305419921875, 6.282022476196289, 2.183116912841797, -2.4699363708496094, 10.383867263793945], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000194.npy"} +{"epoch": 0.29327286470143615, "step": 195, "batch_size": 64, "mean": 13.85733699798584, "std": 19.184165954589844, "min": -29.31561279296875, "p10": -10.54970474243164, "median": 13.33290958404541, "p90": 40.08532485961914, "max": 50.31541442871094, "pos_frac": 0.71875, "sample": [6.1889801025390625, 12.459396362304688, 0.44628143310546875, 12.6849365234375, 47.3474235534668, 31.094863891601562, -2.0909156799316406, 14.732185363769531, 16.963592529296875, 36.7049560546875, 20.974288940429688, 30.615636825561523, -11.663345336914062, -17.39459228515625, -14.105224609375, -29.31561279296875, -1.3752708435058594, 13.183116912841797, 16.35599708557129, 36.32472229003906, -8.79473876953125, 7.796409606933594, 16.631057739257812, 23.10028076171875, 18.304550170898438, 18.763553619384766, 43.673667907714844, 44.113563537597656, 10.271675109863281, 23.458328247070312, 6.587099075317383, -2.599395751953125, 42.606868743896484, 5.9933319091796875, 40.38298797607422, 0.2907867431640625, -6.099817276000977, 37.892539978027344, 27.885528564453125, 30.827285766601562, 13.482702255249023, -9.915260314941406, -2.5230331420898438, -1.57110595703125, -0.5865421295166016, 3.9018688201904297, -2.4339599609375, 39.390777587890625, -24.964019775390625, 1.019235610961914, -15.642013549804688, -1.5665130615234375, 50.31541442871094, 33.66903305053711, 28.389358520507812, 25.11882209777832, 34.10905456542969, 30.389373779296875, -10.821609497070312, 44.359169006347656, 16.380096435546875, 2.1602783203125, 9.992355346679688, 22.99910545349121], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000195.npy"} +{"epoch": 0.2947845804988662, "step": 196, "batch_size": 64, "mean": 11.475703239440918, "std": 16.99241828918457, "min": -47.170345306396484, "p10": -5.90569896697998, "median": 10.944013595581055, "p90": 34.436848449707036, "max": 48.222686767578125, "pos_frac": 0.78125, "sample": [8.323028564453125, -47.170345306396484, -6.3626861572265625, 1.0330963134765625, 13.31878662109375, -10.494077682495117, 2.5132827758789062, 5.0469818115234375, 11.144729614257812, -4.4022064208984375, 7.101165771484375, 34.675201416015625, 36.51988220214844, 14.48883056640625, 11.75704574584961, 9.921195983886719, -28.068180084228516, 32.46099090576172, 0.4296302795410156, 23.78404998779297, -2.766765594482422, 5.87841796875, 39.76546096801758, 0.7129383087158203, -6.326808929443359, 6.049400329589844, 19.606689453125, 13.987831115722656, 11.451217651367188, 48.222686767578125, 12.540359497070312, 25.816448211669922, 2.9926300048828125, -4.92310905456543, -4.4104766845703125, 13.01458740234375, 5.449697494506836, 21.61070442199707, 12.707366943359375, 40.561798095703125, 17.04277801513672, 8.943084716796875, 31.61105728149414, 3.1078453063964844, 25.5618896484375, -7.2940673828125, -0.2186145782470703, 14.07891845703125, 19.709701538085938, 33.88069152832031, 36.595703125, 32.748741149902344, -2.2647857666015625, -4.5954132080078125, 10.743297576904297, 32.5902099609375, 14.972776412963867, 23.816482543945312, 3.7553749084472656, 4.5775604248046875, 4.212917327880859, -6.332630157470703, 13.699798583984375, 45.54022216796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000196.npy"} +{"epoch": 0.2962962962962963, "step": 197, "batch_size": 64, "mean": 13.864505767822266, "std": 22.848398208618164, "min": -42.04960250854492, "p10": -18.092807388305662, "median": 10.44360637664795, "p90": 42.70078582763672, "max": 52.886085510253906, "pos_frac": 0.765625, "sample": [-4.629665374755859, 47.572303771972656, 10.036336898803711, 2.5410232543945312, 17.968780517578125, 27.609939575195312, -16.31079864501953, -40.05223083496094, 1.7963714599609375, -0.223602294921875, 30.49981689453125, 42.82228088378906, -21.279212951660156, -22.518768310546875, 9.096427917480469, 47.114036560058594, 19.43518829345703, 3.5465011596679688, 52.886085510253906, 42.41729736328125, 9.584030151367188, 10.850875854492188, 28.887035369873047, 28.604141235351562, 12.817405700683594, 1.65728759765625, 7.6286468505859375, -18.856525421142578, 39.26226806640625, 18.644927978515625, 42.083656311035156, 47.68113708496094, -30.258544921875, 34.60704040527344, -3.334095001220703, -42.04960250854492, 4.925910949707031, 14.05950927734375, 27.895675659179688, 17.24005126953125, -0.4699516296386719, 38.62052917480469, 40.365325927734375, 2.388458251953125, -0.431304931640625, 45.86785888671875, 5.889984130859375, 0.6420745849609375, 9.033760070800781, 33.28449630737305, -12.879701614379883, -6.738471984863281, 30.646499633789062, 26.714696884155273, 5.773430824279785, -28.337921142578125, 50.042137145996094, 27.98534393310547, 2.9919891357421875, 34.7558708190918, 6.378196716308594, 28.8680419921875, 9.684854507446289, 33.99320983886719], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000197.npy"} +{"epoch": 0.29780801209372637, "step": 198, "batch_size": 64, "mean": 14.603824615478516, "std": 17.959632873535156, "min": -27.935073852539062, "p10": -8.193715476989746, "median": 14.234861373901367, "p90": 37.24900398254395, "max": 55.73914337158203, "pos_frac": 0.78125, "sample": [-2.4833984375, 32.138916015625, -0.34241294860839844, 23.421005249023438, 13.241193771362305, 14.241172790527344, -17.304094314575195, 2.7124557495117188, 13.486776351928711, 6.969024658203125, 36.79295349121094, 12.450698852539062, 1.8929634094238281, -21.27061653137207, 55.73914337158203, 43.702110290527344, 22.603866577148438, 26.06036376953125, 19.26153564453125, -7.821168899536133, 26.88068389892578, 26.721723556518555, 40.21826171875, -9.340085983276367, 40.69386291503906, -19.009048461914062, -17.247169494628906, -0.09821510314941406, 30.51409912109375, 29.965120315551758, 34.26737976074219, 20.346038818359375, 14.089614868164062, -27.935073852539062, 10.332305908203125, -2.4892845153808594, 1.7371788024902344, 2.569896697998047, -8.353378295898438, 16.169898986816406, 6.29278564453125, 36.529014587402344, 35.889892578125, 14.22854995727539, 22.534719467163086, 11.594894409179688, 0.15549850463867188, 42.791465759277344, 50.55291748046875, 11.275070190429688, 6.2658233642578125, -0.131744384765625, 27.578704833984375, 37.444454193115234, 7.217262268066406, 14.522171020507812, 16.8389892578125, 17.565946578979492, -1.0695247650146484, 14.935970306396484, 16.99687957763672, 10.640365600585938, 24.90697479248047, 23.561439514160156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000198.npy"} +{"epoch": 0.29931972789115646, "step": 199, "batch_size": 64, "mean": 11.437995910644531, "std": 21.454248428344727, "min": -41.95908737182617, "p10": -14.296330833435057, "median": 12.51236343383789, "p90": 36.0936954498291, "max": 54.70920181274414, "pos_frac": 0.703125, "sample": [20.453662872314453, 31.401893615722656, 4.9280853271484375, 13.806549072265625, -15.234186172485352, -28.406723022460938, 10.489212036132812, 39.947669982910156, 24.956642150878906, 11.877120971679688, 21.849853515625, -5.086597442626953, 54.70920181274414, 30.546966552734375, 49.97658920288086, 36.28582763671875, 24.151325225830078, 34.06573486328125, 24.800125122070312, 36.09267807006836, -6.3692169189453125, -22.195697784423828, 24.345073699951172, 35.55590057373047, -5.579275131225586, 0.1719207763671875, 22.736270904541016, -9.196296691894531, 8.473709106445312, 29.917152404785156, 29.184799194335938, 7.473672866821289, 19.020816802978516, -1.6801834106445312, -1.422886848449707, 12.627120971679688, 14.074615478515625, -11.042808532714844, -27.235267639160156, 20.30084991455078, -41.95908737182617, 24.36553955078125, 7.331092834472656, 32.08379364013672, -31.269264221191406, 10.733909606933594, 12.397605895996094, 5.505451202392578, -11.374725341796875, 6.6549835205078125, 1.063302993774414, -33.77763366699219, -8.327529907226562, 21.141361236572266, -12.108001708984375, -3.434478759765625, 36.09413146972656, -9.474533081054688, 32.45344543457031, 18.77042007446289, 44.04656982421875, 8.521751403808594, 46.305084228515625, 15.516586303710938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000199.npy"} +{"epoch": 0.30083144368858655, "step": 200, "batch_size": 64, "mean": 16.49210548400879, "std": 23.16771125793457, "min": -48.950042724609375, "p10": -7.9799310684204094, "median": 13.343205451965332, "p90": 50.13871612548828, "max": 55.24402618408203, "pos_frac": 0.734375, "sample": [7.618896484375, 27.68094253540039, 50.07177734375, 9.148979187011719, 15.246780395507812, 2.1719627380371094, 43.64906311035156, 8.584053039550781, 8.466712951660156, -3.1437301635742188, 5.3688201904296875, 36.694580078125, -13.31026840209961, 50.16740417480469, 3.1689224243164062, -2.7667160034179688, 11.809425354003906, -2.0757598876953125, 51.730125427246094, -3.12042236328125, -1.1659011840820312, -3.3395309448242188, 26.99187469482422, 40.10496139526367, 2.4907665252685547, 28.314041137695312, 38.45429229736328, -17.638954162597656, 34.05459976196289, -2.7768096923828125, 41.228118896484375, 26.485008239746094, 16.661056518554688, 54.76312255859375, 55.24402618408203, -5.959630966186523, -48.950042724609375, 31.39934539794922, 51.44212341308594, 43.70440673828125, 43.33135223388672, 26.29443359375, 53.34870910644531, 16.483016967773438, 11.571212768554688, -35.12303161621094, 4.067710876464844, 13.1312255859375, 8.246404647827148, 53.95085144042969, -8.25909423828125, 18.40302276611328, 13.555185317993164, -10.521774291992188, 13.595039367675781, 18.986907958984375, -7.328550338745117, -14.709407806396484, 23.280479431152344, 12.326831817626953, 1.8489227294921875, -6.710297584533691, 39.01598358154297, 48.041221618652344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000200.npy"} +{"epoch": 0.30234315948601664, "step": 201, "batch_size": 64, "mean": 12.90915584564209, "std": 21.551111221313477, "min": -36.07975769042969, "p10": -15.825879287719726, "median": 9.497771263122559, "p90": 43.38706970214844, "max": 62.757423400878906, "pos_frac": 0.78125, "sample": [8.455673217773438, 22.129104614257812, 12.467082977294922, 13.622352600097656, 6.712182998657227, 12.853096008300781, 32.93497848510742, 7.462926864624023, 23.535770416259766, 1.7843093872070312, 6.651863098144531, 26.296342849731445, 32.25688934326172, 23.565383911132812, 2.5396900177001953, -28.155426025390625, 62.757423400878906, 43.581275939941406, 0.7108001708984375, 52.3431396484375, -16.292877197265625, 2.8675765991210938, 7.709785461425781, -18.548297882080078, 3.3044795989990234, 46.03940963745117, 23.22201156616211, 16.99358367919922, -14.736217498779297, 42.933921813964844, 2.8498573303222656, 35.57518005371094, 2.472410202026367, -7.685157775878906, 32.2894401550293, 29.427303314208984, 0.13299560546875, -21.812088012695312, 7.6915283203125, 7.0024871826171875, 35.208091735839844, 8.280902862548828, -2.6798229217529297, 17.50855255126953, -6.447505950927734, 21.00232696533203, 11.515636444091797, -28.136260986328125, 10.53986930847168, 55.269683837890625, -4.113382339477539, 11.558837890625, 23.17617416381836, 32.5378303527832, 26.25249671936035, 51.262794494628906, 31.268409729003906, -12.879966735839844, 2.8429641723632812, -16.346572875976562, 48.62204360961914, -0.5898895263671875, 0.6703338623046875, -36.07975769042969], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000201.npy"} +{"epoch": 0.30385487528344673, "step": 202, "batch_size": 64, "mean": 15.218246459960938, "std": 21.214271545410156, "min": -47.57545471191406, "p10": -6.156355476379393, "median": 17.627206802368164, "p90": 38.812939453125004, "max": 73.01385498046875, "pos_frac": 0.796875, "sample": [-6.580318450927734, 13.075973510742188, 55.090885162353516, 73.01385498046875, 36.96564483642578, -4.918304443359375, 26.05657958984375, 26.36669921875, 30.948089599609375, 17.136451721191406, 4.741020202636719, 21.995891571044922, 7.501247406005859, 9.21169662475586, -3.2786102294921875, 29.888626098632812, 30.895912170410156, 2.107940673828125, 26.69098663330078, -8.299751281738281, 13.576980590820312, 21.868980407714844, 27.037216186523438, 2.4921035766601562, -5.167108535766602, 18.802978515625, 6.617738723754883, 55.48591995239258, 1.7375564575195312, 26.160226821899414, -2.8528518676757812, 12.475967407226562, 21.46587371826172, 23.361907958984375, 6.7155303955078125, -47.57545471191406, 22.093292236328125, 18.117961883544922, 29.609664916992188, -30.267974853515625, 22.629165649414062, 22.173080444335938, 24.527931213378906, 13.39483642578125, 39.604637145996094, 15.327568054199219, 33.53895568847656, 4.655550003051758, 44.939361572265625, -3.7052230834960938, 0.48795127868652344, -28.129253387451172, -0.09701347351074219, -8.817480087280273, 4.2114715576171875, 32.839019775390625, 46.72892761230469, 5.160070419311523, 6.827037811279297, 28.954673767089844, -34.54093933105469, 30.852317810058594, 22.0564022064209, 39.98169708251953], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000202.npy"} +{"epoch": 0.30536659108087677, "step": 203, "batch_size": 64, "mean": 13.85640811920166, "std": 21.406339645385742, "min": -34.81797790527344, "p10": -9.236296081542969, "median": 9.538958549499512, "p90": 42.17146148681641, "max": 64.82292175292969, "pos_frac": 0.796875, "sample": [12.518089294433594, 3.6412734985351562, -26.898544311523438, -3.279876708984375, 6.720306396484375, 27.651748657226562, 3.360565185546875, 36.37548828125, 13.128326416015625, -9.303779602050781, 41.11534118652344, 10.695808410644531, 18.348169326782227, 55.19688415527344, 9.740575790405273, 64.82292175292969, 37.874717712402344, 9.277496337890625, 35.59986114501953, 17.432830810546875, -34.81797790527344, 0.14301681518554688, 15.118690490722656, -4.863613128662109, -0.8144969940185547, -15.676925659179688, 8.753189086914062, 52.19123840332031, 4.991020202636719, 30.101585388183594, 11.459854125976562, 3.6751022338867188, 37.67784118652344, 7.939876556396484, 28.07806396484375, 1.1944808959960938, 44.507667541503906, 27.722267150878906, 39.59733581542969, 20.537817001342773, 3.6470718383789062, 0.168304443359375, 4.798744201660156, 21.546058654785156, 31.59796905517578, -6.475830078125, 43.52875518798828, 42.62408447265625, -9.078834533691406, 56.967308044433594, 26.503047943115234, 2.7293357849121094, 3.1160507202148438, 6.319252014160156, 5.3372802734375, -26.528594970703125, 0.635345458984375, 9.33734130859375, 32.579551696777344, 24.40443229675293, 17.146041870117188, -23.545425415039062, -21.592647552490234, -0.48876380920410156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000203.npy"} +{"epoch": 0.30687830687830686, "step": 204, "batch_size": 64, "mean": 15.188006401062012, "std": 21.34554672241211, "min": -39.56886291503906, "p10": -9.064740180969237, "median": 14.001398086547852, "p90": 47.88549880981446, "max": 56.66438293457031, "pos_frac": 0.75, "sample": [55.330299377441406, 43.06993103027344, -10.081792831420898, 8.03567886352539, 9.7156982421875, 56.66438293457031, 3.2163543701171875, 24.964080810546875, -15.754707336425781, 20.206329345703125, 52.64251708984375, -23.660423278808594, -5.359493255615234, 8.813411712646484, 15.679954528808594, 14.179000854492188, 27.64453125, 4.134590148925781, -19.22980499267578, 1.4162139892578125, 29.566957473754883, 13.446067810058594, 34.55003356933594, 44.318687438964844, -5.768716812133789, -3.1693878173828125, 19.562911987304688, 18.195865631103516, 4.093852996826172, 7.338706970214844, 48.254783630371094, -6.944084167480469, 4.045475006103516, 16.20484161376953, 29.320510864257812, -4.3670501708984375, 18.73596954345703, 52.47012710571289, -3.4683780670166016, 12.33935546875, 7.645442962646484, 13.823795318603516, 40.922935485839844, 40.947837829589844, -9.659378051757812, 18.297103881835938, 20.124359130859375, -1.3586864471435547, 32.62278747558594, -0.07453536987304688, 47.023834228515625, 50.689727783203125, 0.03499603271484375, 26.22467041015625, 22.336883544921875, 51.31448745727539, 28.004653930664062, 1.0223541259765625, 2.5573043823242188, 22.713790893554688, -39.56886291503906, -7.677251815795898, 14.599241256713867, -10.88836669921875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000204.npy"} +{"epoch": 0.30839002267573695, "step": 205, "batch_size": 64, "mean": 14.476325988769531, "std": 24.380374908447266, "min": -47.63616180419922, "p10": -10.45455207824707, "median": 13.253887176513672, "p90": 44.49487762451172, "max": 74.88726806640625, "pos_frac": 0.71875, "sample": [74.88726806640625, 8.510656356811523, -0.6627540588378906, 13.088138580322266, 17.612415313720703, 60.84822463989258, 8.920343399047852, 23.654380798339844, -45.04986572265625, 42.351165771484375, 5.372926712036133, 5.235828399658203, 70.34293365478516, 18.006057739257812, 17.1136417388916, 5.382041931152344, 11.386703491210938, -4.6336212158203125, -6.1082763671875, 18.49835968017578, 12.646196365356445, 24.347686767578125, 4.379697799682617, 13.865264892578125, 34.348114013671875, -3.2881813049316406, -12.719345092773438, -4.711036682128906, 10.687633514404297, 61.756614685058594, -5.814048767089844, -9.553312301635742, 26.01153564453125, 12.901199340820312, -0.2850189208984375, 23.11236572265625, 19.990144729614258, 29.864089965820312, 0.8050498962402344, 15.744544982910156, -11.46533203125, 42.394371032714844, 30.621112823486328, 26.2569580078125, 53.28330993652344, 45.07843017578125, 2.4458465576171875, 19.11089324951172, 37.94746398925781, -8.533843994140625, 13.419635772705078, 9.356742858886719, 31.192745208740234, 13.938636779785156, -37.57179260253906, 43.13325500488281, 28.880374908447266, -14.85098648071289, 50.22948455810547, -10.561809539794922, -10.20428466796875, -47.63616180419922, -2.2893524169921875, 23.463394165039062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000205.npy"} +{"epoch": 0.30990173847316704, "step": 206, "batch_size": 64, "mean": 10.745919227600098, "std": 24.734865188598633, "min": -43.631561279296875, "p10": -22.32185497283935, "median": 6.968430519104004, "p90": 46.96407928466797, "max": 56.6571044921875, "pos_frac": 0.671875, "sample": [-16.233957290649414, 1.8154144287109375, 3.646728515625, -31.334762573242188, -13.765714645385742, -3.044036865234375, 6.5245513916015625, 9.732315063476562, 36.853912353515625, 14.628005981445312, -8.817068099975586, 54.25501251220703, 22.721752166748047, -6.697126388549805, -10.378273010253906, 31.72161865234375, -2.5388946533203125, 56.6571044921875, -24.930953979492188, 7.113882064819336, 55.22284698486328, 27.250431060791016, 7.99993896484375, 7.3246917724609375, -9.152042388916016, 46.96491241455078, 8.701408386230469, -36.19688415527344, 29.667917251586914, 31.288360595703125, 38.41459655761719, 49.04429626464844, 2.5107955932617188, 6.778289794921875, 42.63929748535156, 5.5968017578125, -43.631561279296875, -25.41986846923828, -5.69868278503418, -1.6411285400390625, 23.578392028808594, -1.0197715759277344, 27.01397705078125, -11.372917175292969, -3.9419593811035156, -29.889324188232422, 49.90961837768555, 26.697662353515625, 5.224967956542969, 8.4935302734375, 31.15118408203125, 45.71308898925781, 25.749603271484375, -12.428321838378906, 24.37841033935547, 46.962135314941406, 6.822978973388672, 4.680091857910156, 14.741073608398438, 50.94914245605469, -36.496376037597656, 3.5910491943359375, 0.49819183349609375, 21.13849639892578], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000206.npy"} +{"epoch": 0.31141345427059713, "step": 207, "batch_size": 64, "mean": 15.113813400268555, "std": 22.498563766479492, "min": -32.39173889160156, "p10": -10.230665588378907, "median": 9.700296401977539, "p90": 48.950424957275395, "max": 64.47627258300781, "pos_frac": 0.75, "sample": [64.47627258300781, 6.463785171508789, -9.327129364013672, 5.510993957519531, 12.206733703613281, 20.118621826171875, -3.889923095703125, 7.911102294921875, 2.3456344604492188, 49.321868896484375, 11.469856262207031, 7.777656555175781, -0.7082710266113281, 50.06183624267578, -4.107400894165039, -9.965751647949219, 16.41522216796875, 28.25830078125, 15.8448486328125, 44.357601165771484, 42.81338119506836, 12.229354858398438, 15.702919006347656, 0.318359375, -13.143415451049805, -8.058090209960938, -4.092126846313477, 48.09874725341797, -17.26947021484375, 8.946800231933594, 47.352783203125, 9.692859649658203, 63.07794189453125, -10.344200134277344, 6.0562896728515625, -5.849330902099609, -21.899202346801758, 18.036483764648438, 9.14532470703125, 2.428091049194336, 32.97813415527344, 40.55815124511719, 5.260658264160156, 24.737079620361328, 1.4559326171875, 28.880401611328125, 33.00825119018555, -32.39173889160156, 44.101478576660156, 23.6058349609375, -23.809104919433594, 31.183561325073242, 9.707733154296875, 15.999214172363281, 6.188232421875, 56.912757873535156, 49.3154296875, 6.667579650878906, 22.228439331054688, 25.46738624572754, -10.620681762695312, -4.0942535400390625, 5.8976898193359375, 56.260494232177734], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000207.npy"} +{"epoch": 0.3129251700680272, "step": 208, "batch_size": 64, "mean": 8.14013957977295, "std": 22.422189712524414, "min": -44.396636962890625, "p10": -16.992495727539062, "median": 6.470747947692871, "p90": 38.81125793457032, "max": 55.40144348144531, "pos_frac": 0.609375, "sample": [5.32917594909668, 1.6802310943603516, 35.336795806884766, -9.768997192382812, 41.55729675292969, 42.134422302246094, 6.567432403564453, -7.9908294677734375, -17.802032470703125, -37.755523681640625, -5.5279083251953125, -13.82928466796875, 36.46142578125, 27.888946533203125, 33.57709884643555, 6.374063491821289, 8.813690185546875, 16.3248291015625, -5.929464340209961, -17.727554321289062, 30.632339477539062, -8.442237854003906, 4.4666748046875, -19.71971893310547, 27.41788101196289, 29.100431442260742, 34.732826232910156, -15.277359008789062, 11.567451477050781, 23.986459732055664, -13.649532318115234, -1.7978897094726562, -14.436946868896484, 14.617996215820312, -30.552413940429688, 23.856918334960938, 45.65401840209961, 34.19219970703125, 15.180000305175781, 0.4336204528808594, 55.40144348144531, 16.458587646484375, 5.123085021972656, -9.44913101196289, 39.818328857421875, -13.835739135742188, 46.964813232421875, -4.922178268432617, 17.76152992248535, 10.223798751831055, -14.938339233398438, 22.50666046142578, -0.9596099853515625, 25.93206787109375, -14.934642791748047, 12.644805908203125, 11.894241333007812, -5.950716018676758, -29.753690719604492, -2.387115478515625, -44.396636962890625, 10.673660278320312, 6.099143981933594, 43.31806182861328], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000208.npy"} +{"epoch": 0.3144368858654573, "step": 209, "batch_size": 64, "mean": 18.138729095458984, "std": 26.70542335510254, "min": -58.63734436035156, "p10": -4.867845153808593, "median": 14.943488121032715, "p90": 51.71173934936524, "max": 74.3055648803711, "pos_frac": 0.75, "sample": [48.10102462768555, 49.29785919189453, 6.899658203125, 18.21567153930664, -8.360496520996094, 62.053619384765625, 14.270589828491211, 43.91822814941406, 11.300971984863281, 59.462005615234375, -1.4340744018554688, 3.7999954223632812, -30.225250244140625, 45.85377502441406, 4.35235595703125, 15.616386413574219, -4.18756103515625, -2.6087417602539062, -2.582408905029297, 66.25514221191406, 4.6109619140625, -3.350128173828125, -0.7886924743652344, 29.692703247070312, 5.364265441894531, 8.687530517578125, 31.388084411621094, 25.480453491210938, 54.96142578125, 20.064132690429688, 25.460424423217773, 28.443695068359375, 10.42715835571289, 48.69792938232422, 52.09569549560547, -1.827789306640625, 50.81584167480469, 26.461105346679688, -58.63734436035156, 3.93072509765625, -11.959342956542969, 4.2052459716796875, -4.6870880126953125, -4.9453125, 43.61579895019531, 13.60555648803711, 74.3055648803711, 43.7265625, 18.82757568359375, 41.17844772338867, 10.694551467895508, -29.55405044555664, 6.510103225708008, 24.952529907226562, 10.358428955078125, 4.118814468383789, 28.89761734008789, -54.02093505859375, 18.840057373046875, 24.158451080322266, 48.94294738769531, 53.97385787963867, 33.477317810058594, -0.32109832763671875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000209.npy"} +{"epoch": 0.31594860166288735, "step": 210, "batch_size": 64, "mean": 17.608631134033203, "std": 24.584627151489258, "min": -29.342666625976562, "p10": -16.780210685729976, "median": 13.578474044799805, "p90": 54.67536773681641, "max": 65.02630615234375, "pos_frac": 0.796875, "sample": [57.35771942138672, 10.439834594726562, 13.347381591796875, 18.82891845703125, -2.629180908203125, 28.625213623046875, 65.02630615234375, 25.780426025390625, 59.27238464355469, 55.39910888671875, 3.8861351013183594, 58.74320983886719, 53.9703369140625, 9.194686889648438, 54.97752380371094, 3.679473876953125, -28.765975952148438, -25.979244232177734, 48.48027038574219, -19.80438232421875, 47.81333923339844, 15.158798217773438, 10.12150764465332, -4.94976806640625, 46.66864776611328, 3.7477874755859375, 0.042209625244140625, 8.866722106933594, 49.31188201904297, -1.6633682250976562, 49.61640167236328, 16.38420867919922, 19.86407470703125, 9.713638305664062, 15.048927307128906, -2.4289016723632812, 3.1692047119140625, -10.646434783935547, 0.12726593017578125, 48.19065856933594, -19.408971786499023, 29.940155029296875, 18.330612182617188, 5.626930236816406, 34.673797607421875, -0.6240100860595703, 17.345312118530273, 8.687484741210938, 13.716896057128906, 5.032886505126953, 13.440052032470703, 35.687843322753906, 16.164287567138672, -27.044710159301758, 5.037010192871094, 60.817726135253906, 34.50450134277344, 26.042266845703125, 35.63469696044922, -29.342666625976562, 3.008596420288086, -20.477806091308594, 12.962554931640625, 33.209983825683594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000210.npy"} +{"epoch": 0.31746031746031744, "step": 211, "batch_size": 64, "mean": 16.591938018798828, "std": 23.04530906677246, "min": -31.267784118652344, "p10": -8.78426284790039, "median": 10.791126251220703, "p90": 51.078378295898446, "max": 83.72442626953125, "pos_frac": 0.765625, "sample": [0.9473705291748047, -31.267784118652344, 24.211219787597656, 4.231027603149414, 0.19660186767578125, -0.21329307556152344, -8.250167846679688, -0.558807373046875, 23.12139892578125, 4.580488204956055, 16.775680541992188, -2.4545555114746094, 24.33441925048828, 48.677154541015625, 6.904499053955078, 29.19290542602539, 1.2148609161376953, -0.6674232482910156, 48.33567428588867, -11.02315902709961, 9.430992126464844, -15.76165771484375, 25.509967803955078, -16.50152587890625, 7.914608001708984, -12.859235763549805, 0.6108512878417969, 16.879776000976562, 57.95553207397461, 12.770378112792969, 22.64539337158203, 12.151260375976562, 15.435522079467773, 2.4551620483398438, 52.45887756347656, 18.39395523071289, 13.3311767578125, 7.6041717529296875, -9.013160705566406, 25.048721313476562, 8.1199951171875, 83.72442626953125, 69.170166015625, 2.317403793334961, -3.8663253784179688, 30.117794036865234, 52.06690979003906, 28.010086059570312, 22.20665740966797, 56.45741271972656, -10.378334045410156, 20.139850616455078, 48.77180480957031, 44.17790222167969, 35.35602569580078, 45.92167663574219, 8.878021240234375, 33.1948356628418, -8.13886833190918, 54.44804382324219, 5.7886199951171875, -4.7508544921875, 9.341087341308594, 6.0607452392578125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000211.npy"} +{"epoch": 0.31897203325774753, "step": 212, "batch_size": 64, "mean": 17.505916595458984, "std": 25.33898162841797, "min": -60.134918212890625, "p10": -10.054711532592773, "median": 17.73275375366211, "p90": 54.67212448120118, "max": 67.75814819335938, "pos_frac": 0.734375, "sample": [55.806304931640625, 29.638622283935547, 34.29895782470703, 49.66523361206055, -3.377573013305664, 6.613067626953125, 64.90470886230469, 27.477140426635742, -9.830909729003906, 41.709571838378906, -6.062046051025391, -60.134918212890625, 41.44603729248047, 67.75814819335938, 7.193870544433594, 42.219200134277344, 36.91871643066406, 26.403169631958008, -15.635566711425781, 25.310129165649414, 20.157440185546875, 3.675323486328125, 0.2658405303955078, 18.91088104248047, -35.04234313964844, -0.7961273193359375, 28.93353271484375, 3.2802257537841797, 52.02570343017578, 58.06986999511719, 25.442943572998047, 33.90663146972656, 26.37201690673828, 14.172065734863281, 16.55462646484375, 9.395713806152344, -9.983043670654297, 24.21588897705078, 1.1614303588867188, 12.581981658935547, -2.1130828857421875, 9.421546936035156, -0.3667335510253906, -5.3553924560546875, 20.746530532836914, 32.16785430908203, 22.58043098449707, 59.47215270996094, -14.778850555419922, -13.173538208007812, -2.7364673614501953, 2.6627120971679688, 28.194435119628906, -10.085426330566406, 32.426605224609375, 55.848175048828125, 44.109642028808594, 59.165748596191406, 36.723785400390625, 1.754730224609375, 7.8329620361328125, 12.91937255859375, -22.38006591796875, -0.28098297119140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000212.npy"} +{"epoch": 0.3204837490551776, "step": 213, "batch_size": 64, "mean": 19.930387496948242, "std": 27.206741333007812, "min": -61.01996612548828, "p10": -10.855122756958007, "median": 17.35070037841797, "p90": 56.660162353515624, "max": 91.68264770507812, "pos_frac": 0.796875, "sample": [37.70473861694336, 26.588455200195312, 7.34759521484375, 47.11260986328125, 25.60704803466797, 12.090906143188477, -15.79833984375, -10.424007415771484, -11.039886474609375, 42.73957443237305, 57.64747619628906, 3.5836868286132812, 12.569320678710938, -9.078609466552734, -61.01996612548828, -16.495407104492188, 35.25450134277344, 91.68264770507812, -4.532196044921875, 30.08441925048828, 43.71848678588867, -29.258663177490234, 53.83257293701172, 71.1690902709961, 43.08067321777344, 13.506072998046875, -4.546573638916016, -26.697105407714844, 5.486457824707031, 10.111154556274414, -13.14120101928711, 19.6116943359375, 20.45142364501953, 14.517169952392578, 26.920394897460938, 24.207611083984375, 4.299617767333984, 32.19172668457031, 53.10936737060547, 7.61932373046875, 9.8758544921875, 19.449424743652344, 57.13815689086914, 2.2071399688720703, 43.03375244140625, 21.135986328125, 3.925952911376953, 38.1673469543457, 59.48399353027344, 4.956443786621094, -0.6252365112304688, 31.21129608154297, -8.336227416992188, 0.7596282958984375, 5.436859130859375, 20.70545196533203, 12.122161865234375, 56.448974609375, 15.251976013183594, 3.937744140625, 49.888580322265625, 56.75067138671875, 42.67797088623047, 58.127071380615234], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000213.npy"} +{"epoch": 0.3219954648526077, "step": 214, "batch_size": 64, "mean": 20.214689254760742, "std": 27.888322830200195, "min": -37.30230712890625, "p10": -12.53691997528076, "median": 17.456165313720703, "p90": 56.80301971435547, "max": 81.45387268066406, "pos_frac": 0.6875, "sample": [35.54425048828125, 27.83514404296875, -4.296905517578125, 14.492023468017578, 17.552734375, 46.16395568847656, 4.185138702392578, 13.322214126586914, 34.580177307128906, 46.18531036376953, 55.84656524658203, 41.95315933227539, 26.006376266479492, -1.0379180908203125, 43.77173614501953, 46.19630432128906, 36.72718811035156, -37.30230712890625, 32.298866271972656, 32.464359283447266, -2.707183837890625, 31.110301971435547, 12.191925048828125, -5.4560546875, -0.9284191131591797, 44.672454833984375, -18.885513305664062, 23.364164352416992, 61.52439498901367, 41.553428649902344, 17.359596252441406, -6.168479919433594, -12.007226943969727, 3.7900161743164062, 31.47077178955078, 45.80574035644531, -25.434539794921875, -8.894973754882812, 57.212928771972656, 81.45387268066406, -2.515289306640625, -12.763931274414062, 53.52930450439453, 38.50640106201172, 63.71394729614258, 73.6346435546875, 4.924015045166016, 0.679229736328125, 12.869060516357422, -7.798236846923828, -20.47735595703125, 65.2577133178711, 10.498586654663086, -5.164752960205078, 6.034517288208008, -1.1667594909667969, 66.66055297851562, 16.429840087890625, -36.473968505859375, 35.4766845703125, 34.079551696777344, 38.602962493896484, -4.473613739013672, -19.83856773376465], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000214.npy"} +{"epoch": 0.3235071806500378, "step": 215, "batch_size": 64, "mean": 20.5859317779541, "std": 28.928173065185547, "min": -43.705726623535156, "p10": -16.899303245544434, "median": 15.504276275634766, "p90": 55.56245307922364, "max": 77.50411987304688, "pos_frac": 0.734375, "sample": [21.761127471923828, -24.802230834960938, -43.705726623535156, 27.343826293945312, 19.559463500976562, -27.48351287841797, 10.153457641601562, -3.164093017578125, 52.83912658691406, 55.78622055053711, 9.3780517578125, -2.9396629333496094, -21.3787841796875, 16.71477508544922, 22.975021362304688, 59.7998046875, 3.2257766723632812, 51.48802185058594, 2.4573593139648438, 0.8575592041015625, 14.293777465820312, 6.880989074707031, -3.804851531982422, 35.904991149902344, 50.56134796142578, 3.2115650177001953, -1.9784164428710938, 44.945098876953125, 48.12776184082031, -16.24747657775879, 0.4951820373535156, 51.24823760986328, 4.138591766357422, -14.156585693359375, -13.272491455078125, -23.37213134765625, 43.28443908691406, 34.58965301513672, 39.50382995605469, 70.9381103515625, 14.100555419921875, 12.131217956542969, -0.270904541015625, -1.0528182983398438, 47.6610107421875, 55.04032897949219, 65.48961639404297, 65.09529113769531, 48.40516662597656, 77.50411987304688, 28.13370132446289, 54.894248962402344, 41.959442138671875, -17.17865753173828, 12.00257682800293, 3.3659496307373047, 22.74200439453125, 69.40476989746094, 43.54033660888672, -1.2213306427001953, 43.51439666748047, 3.400707244873047, 45.127357482910156, -22.446670532226562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000215.npy"} +{"epoch": 0.3250188964474679, "step": 216, "batch_size": 64, "mean": 21.47696304321289, "std": 25.634645462036133, "min": -47.528587341308594, "p10": -5.1634498596191385, "median": 20.817537307739258, "p90": 53.54847793579102, "max": 79.27835083007812, "pos_frac": 0.78125, "sample": [5.2393341064453125, 51.96327209472656, 45.56640625, 47.46409606933594, 31.023035049438477, 11.76730728149414, 19.213817596435547, 8.925460815429688, 32.59808349609375, 50.32067108154297, 38.13170623779297, 29.11566162109375, 5.502571105957031, 8.29534912109375, 24.86688232421875, -9.215988159179688, 8.126197814941406, 20.22528076171875, -2.7276458740234375, 65.77603149414062, 31.552520751953125, 59.52760314941406, 28.96851348876953, 45.56182098388672, 30.95185089111328, 18.296337127685547, 61.57196807861328, 1.9937705993652344, 3.2062911987304688, 61.05165100097656, 46.010169982910156, -47.528587341308594, 15.06357192993164, 27.343074798583984, 16.660919189453125, 29.589385986328125, -24.286224365234375, 1.011545181274414, 22.638469696044922, -3.0831642150878906, -2.517345428466797, 79.27835083007812, 54.22785186767578, -16.556602478027344, 11.479438781738281, -17.467010498046875, 21.409793853759766, 2.902515411376953, 1.5048904418945312, 37.272308349609375, 69.18275451660156, -25.508434295654297, -5.8951873779296875, -0.03800392150878906, 51.50884246826172, -0.9816150665283203, 14.234052658081055, 35.40367889404297, -3.4560623168945312, 49.967010498046875, -2.20050048828125, 44.73710632324219, 28.298721313476562, 29.459976196289062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000216.npy"} +{"epoch": 0.32653061224489793, "step": 217, "batch_size": 64, "mean": 22.724578857421875, "std": 27.873289108276367, "min": -36.34539031982422, "p10": -9.644093704223632, "median": 16.94437026977539, "p90": 56.77318267822266, "max": 87.02664184570312, "pos_frac": 0.75, "sample": [39.8564453125, 53.747589111328125, -10.309967041015625, -2.9244041442871094, -1.1627025604248047, -7.418628692626953, 4.683784484863281, 87.02664184570312, -8.187347412109375, 14.29156494140625, 74.98567199707031, 76.32929992675781, 8.197105407714844, -10.268413543701172, 14.3447265625, 6.433998107910156, 55.62580871582031, 31.786643981933594, 10.0689697265625, 56.14588928222656, 15.993341445922852, 29.062856674194336, 9.537429809570312, 50.76704406738281, 13.581428527832031, 52.9099006652832, -36.34539031982422, -2.5137252807617188, 3.451457977294922, 17.868717193603516, 56.03010177612305, 23.420677185058594, 22.986114501953125, -12.85760498046875, 35.39509582519531, -19.000293731689453, 8.614486694335938, 35.64574432373047, -0.239990234375, -22.596694946289062, -31.579483032226562, 46.896514892578125, 29.562774658203125, -2.509124755859375, -0.90826416015625, 8.912940979003906, 13.113433837890625, 14.663177490234375, 38.28929138183594, 78.3714599609375, 24.152847290039062, 49.975685119628906, 16.020023345947266, 2.6737537384033203, 62.53068542480469, 39.87202453613281, 63.73680877685547, 32.70970916748047, 28.504676818847656, 53.2308235168457, 36.16115951538086, 57.042022705078125, 20.611854553222656, -2.6251983642578125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000217.npy"} +{"epoch": 0.328042328042328, "step": 218, "batch_size": 64, "mean": 13.889861106872559, "std": 31.380884170532227, "min": -76.06334686279297, "p10": -20.506337738037107, "median": 14.634086608886719, "p90": 55.14914016723634, "max": 82.22662353515625, "pos_frac": 0.671875, "sample": [6.609901428222656, 1.1317138671875, 20.29418182373047, 29.99427604675293, 4.16497802734375, -12.303634643554688, 10.40374755859375, -0.54888916015625, -2.72625732421875, 51.329612731933594, 15.714401245117188, 14.617568969726562, 57.17719268798828, -47.61515808105469, -20.77458953857422, -34.96757507324219, 8.920272827148438, 61.635162353515625, -37.05418395996094, -8.088603973388672, 30.789390563964844, 22.344192504882812, 7.108909606933594, 17.656414031982422, 35.492733001708984, 82.22662353515625, 56.32825469970703, 74.597412109375, 23.41744041442871, 31.937576293945312, -0.6305694580078125, 31.805999755859375, 28.7548828125, -13.705928802490234, -14.198467254638672, -19.880416870117188, 7.532958984375, 21.705564498901367, -0.82220458984375, 46.44574737548828, 50.13439178466797, 31.230682373046875, -4.941112518310547, 6.9042510986328125, 19.28652572631836, -19.676097869873047, 37.130332946777344, -0.6142406463623047, -37.242469787597656, -13.579757690429688, 52.39787292480469, -46.27253723144531, 20.968063354492188, 0.2857933044433594, 18.813087463378906, 44.09014892578125, 6.434238433837891, 65.82054901123047, -76.06334686279297, -5.8652801513671875, 26.043724060058594, 14.650604248046875, 41.83721923828125, 70.35784912109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000218.npy"} +{"epoch": 0.3295540438397581, "step": 219, "batch_size": 64, "mean": 14.903000831604004, "std": 24.777393341064453, "min": -41.011253356933594, "p10": -14.907868194580077, "median": 11.254783630371094, "p90": 50.01106147766114, "max": 65.69242095947266, "pos_frac": 0.71875, "sample": [11.488876342773438, 56.082218170166016, 37.487709045410156, 10.786828994750977, 27.270858764648438, -0.22747039794921875, 3.9104347229003906, 1.8168468475341797, 15.997314453125, -15.693145751953125, -4.932538986206055, 65.26360321044922, 34.871917724609375, -27.972126007080078, -24.892784118652344, 28.792083740234375, 24.43720245361328, 2.8612442016601562, 19.33932113647461, 2.2594165802001953, 2.8524608612060547, -13.00799560546875, -13.075553894042969, 15.223834991455078, -16.160720825195312, 2.8592529296875, 7.291236877441406, -1.6956424713134766, 22.123703002929688, 11.02069091796875, 41.86389923095703, 55.530426025390625, 56.39021301269531, 59.283470153808594, 26.986839294433594, 49.795379638671875, -6.2415924072265625, 4.88264274597168, -5.202766418457031, 22.59603500366211, 28.143125534057617, 15.6676025390625, -41.011253356933594, 27.803977966308594, -5.801414489746094, -3.7178726196289062, 33.223876953125, 2.9395751953125, 23.248443603515625, 65.69242095947266, 38.009246826171875, 45.316131591796875, 14.853267669677734, -4.341667175292969, -37.408817291259766, 4.551158905029297, 9.670692443847656, 7.34381103515625, 39.39002990722656, -1.6136856079101562, 50.10349655151367, -19.97747802734375, 44.277259826660156, 25.16656494140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000219.npy"} +{"epoch": 0.3310657596371882, "step": 220, "batch_size": 64, "mean": 17.65694808959961, "std": 30.0477237701416, "min": -53.57484817504883, "p10": -13.331594848632813, "median": 16.024919509887695, "p90": 57.403983306884776, "max": 84.443115234375, "pos_frac": 0.65625, "sample": [21.03911781311035, -9.252716064453125, 27.00800323486328, 11.750228881835938, 4.480354309082031, 29.521209716796875, 79.60171508789062, 19.158981323242188, 9.998584747314453, 8.855117797851562, -7.7477569580078125, 69.14717102050781, 5.338228225708008, -33.102386474609375, -13.527435302734375, -12.370048522949219, 55.77886199951172, -1.8533401489257812, -4.885257720947266, 1.048858642578125, 44.31171417236328, 15.797637939453125, -5.182201385498047, -38.901641845703125, -28.92542266845703, -15.146821975708008, -6.028827667236328, -16.89532470703125, -12.8746337890625, 35.762939453125, 39.85223388671875, 25.859359741210938, 30.8134765625, 52.464256286621094, 58.1004638671875, 6.6055450439453125, 47.567626953125, 31.637794494628906, 44.16425323486328, -5.603813171386719, 4.506492614746094, 32.29457473754883, -8.694572448730469, 28.216060638427734, 84.443115234375, -6.038238525390625, 63.01190948486328, -0.3153247833251953, 21.010194778442383, 58.76387023925781, 49.64769744873047, -5.993797302246094, 51.336578369140625, -2.3934974670410156, 17.11144256591797, 16.66968536376953, -53.57484817504883, 16.252201080322266, 42.37298583984375, 2.5936031341552734, 81.65151977539062, -8.35323715209961, 50.77336502075195, 31.386789321899414], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000220.npy"} +{"epoch": 0.3325774754346183, "step": 221, "batch_size": 64, "mean": 19.449796676635742, "std": 29.804393768310547, "min": -46.71910095214844, "p10": -17.8038516998291, "median": 12.565549850463867, "p90": 61.05582733154301, "max": 90.53543090820312, "pos_frac": 0.75, "sample": [10.499212265014648, -16.992572784423828, 20.553871154785156, 22.6240234375, -1.7359962463378906, 52.33892822265625, -5.282575607299805, 12.43841552734375, 29.676074981689453, -26.04035186767578, -2.88800048828125, 15.116012573242188, 12.692684173583984, 17.53296661376953, -20.05266571044922, 10.836450576782227, 1.1198272705078125, -2.0721092224121094, 33.16827392578125, 31.08047103881836, 50.53746795654297, 50.77388000488281, 12.294902801513672, 46.568572998046875, 90.53543090820312, 6.2067413330078125, 44.70379638671875, 76.8277587890625, -4.738441467285156, 10.67881965637207, 31.652297973632812, 64.79164123535156, 3.9655113220214844, 28.207672119140625, 80.10514068603516, 9.689151763916016, 40.004852294921875, -20.529388427734375, 26.919525146484375, 49.655609130859375, 37.11969757080078, -18.15154266357422, 4.625480651855469, -0.8209037780761719, 0.6807117462158203, -0.9071502685546875, 1.276407241821289, 72.16766357421875, 5.043617248535156, 6.230342864990234, -27.760665893554688, -46.71910095214844, 3.1849632263183594, 79.23968505859375, 44.854705810546875, -29.775197982788086, 13.686195373535156, 24.52063751220703, 81.73408508300781, 44.44580078125, 1.3064804077148438, -0.249603271484375, 41.07954788208008, 14.511314392089844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000221.npy"} +{"epoch": 0.3340891912320484, "step": 222, "batch_size": 64, "mean": 26.194103240966797, "std": 30.851490020751953, "min": -39.84600830078125, "p10": -9.535285758972167, "median": 25.46910858154297, "p90": 62.7867000579834, "max": 100.99746704101562, "pos_frac": 0.765625, "sample": [-3.0590858459472656, -34.21807098388672, 28.93218994140625, 10.708709716796875, 51.55465316772461, 52.547523498535156, 29.34061050415039, -10.254207611083984, 55.27113342285156, 68.93827056884766, 33.983154296875, 6.488849639892578, -28.06330108642578, 4.013206481933594, 45.56993865966797, 5.692291259765625, 11.805854797363281, 9.179153442382812, 8.03231430053711, 44.872825622558594, 36.90215301513672, -0.265380859375, 46.211883544921875, 59.481300354003906, -4.413673400878906, 63.46006774902344, -11.905006408691406, 96.28414916992188, -2.381898880004883, 40.39508056640625, 21.24814796447754, 20.988388061523438, 62.27507019042969, 54.961578369140625, 17.990768432617188, 38.252166748046875, 40.47882080078125, -5.7146148681640625, -7.85780143737793, -3.1743011474609375, -39.84600830078125, 30.60985565185547, 22.006027221679688, 17.512557983398438, 3.6522979736328125, 100.99746704101562, 13.678688049316406, -32.68302917480469, 3.6512374877929688, 46.522254943847656, 53.693138122558594, -1.3456611633300781, 53.46708679199219, 73.3479995727539, 36.654518127441406, 12.719108581542969, 63.0059700012207, 56.06158447265625, 9.68670654296875, 57.01847839355469, 39.80253601074219, 39.649383544921875, 72.91082763671875, -10.903244018554688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000222.npy"} +{"epoch": 0.3356009070294785, "step": 223, "batch_size": 64, "mean": 21.540252685546875, "std": 28.409948348999023, "min": -28.907073974609375, "p10": -11.733687019348144, "median": 18.851890563964844, "p90": 60.18026428222659, "max": 85.13412475585938, "pos_frac": 0.71875, "sample": [38.70435333251953, 9.269233703613281, 45.68206024169922, 8.765228271484375, -5.967063903808594, 37.97347640991211, -2.6652679443359375, 25.985565185546875, 10.731548309326172, 32.72212600708008, 2.3661537170410156, 70.86155700683594, 42.14897918701172, 47.897003173828125, 6.994037628173828, -16.751949310302734, -1.6657600402832031, 45.873321533203125, 7.93963623046875, -8.699974060058594, 54.04579544067383, 27.144981384277344, -16.97882080078125, 37.11906433105469, -15.045394897460938, 2.34356689453125, -6.105409622192383, 49.08815002441406, -6.75261116027832, -20.09014129638672, 47.27055740356445, 14.762916564941406, -28.907073974609375, 6.100223541259766, 1.74493408203125, 72.50096893310547, 47.75177001953125, 33.210628509521484, -11.736587524414062, -24.902698516845703, -10.130836486816406, -11.726919174194336, 29.30821990966797, 41.07616424560547, 69.03509521484375, 14.969364166259766, 31.607513427734375, 44.55491638183594, 17.027984619140625, 62.809322357177734, 84.50191497802734, -10.362922668457031, 85.13412475585938, 63.12848663330078, 43.47748565673828, 27.028045654296875, 47.07600402832031, 46.2945556640625, 20.675796508789062, -3.496173858642578, -0.5450897216796875, 22.355316162109375, 3.066631317138672, 0.9821395874023438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000223.npy"} +{"epoch": 0.3371126228269085, "step": 224, "batch_size": 64, "mean": 12.420958518981934, "std": 29.1590633392334, "min": -56.11946487426758, "p10": -26.215832328796385, "median": 7.004047393798828, "p90": 51.46282463073732, "max": 85.13006591796875, "pos_frac": 0.671875, "sample": [22.808330535888672, 85.13006591796875, 21.443880081176758, 25.030075073242188, 8.028488159179688, 62.15866470336914, 32.889198303222656, 35.4488525390625, -1.8174362182617188, 5.64251708984375, 46.378726959228516, 7.842153549194336, 42.909019470214844, 56.62785720825195, -28.635894775390625, -1.3474693298339844, 7.936735153198242, 15.895984649658203, 29.96044158935547, 2.2006683349609375, 5.762489318847656, 25.484664916992188, -1.2467498779296875, -43.30487823486328, -8.644134521484375, -0.23422622680664062, -12.624786376953125, -12.31378173828125, 20.725311279296875, 7.103759765625, 37.954071044921875, -56.11946487426758, -24.2534122467041, -17.203460693359375, -3.9770126342773438, 0.1316509246826172, -3.3912200927734375, -42.154808044433594, 6.904335021972656, 25.976181030273438, -28.469741821289062, 26.591049194335938, 44.267784118652344, 6.034217834472656, -27.056869506835938, 6.55364990234375, 16.371017456054688, 31.078685760498047, -28.074539184570312, -9.690910339355469, -4.887886047363281, 25.143495559692383, 42.314125061035156, 53.6417236328125, 80.14314270019531, 25.460617065429688, 4.948211669921875, 13.198760986328125, 0.9705600738525391, 65.89915466308594, -7.927337646484375, 70.57089233398438, 3.30120849609375, 3.454967498779297], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000224.npy"} +{"epoch": 0.3386243386243386, "step": 225, "batch_size": 64, "mean": 23.1850643157959, "std": 30.624958038330078, "min": -43.01141357421875, "p10": -7.990974998474117, "median": 16.050302505493164, "p90": 68.48686065673829, "max": 91.19357299804688, "pos_frac": 0.765625, "sample": [3.8475284576416016, 27.678634643554688, 5.32421875, -0.623199462890625, 5.00372314453125, 45.25323486328125, -1.6562309265136719, -0.538665771484375, 30.81883430480957, 15.182621002197266, 7.103691101074219, 53.96502685546875, 9.572731018066406, 66.62348937988281, -16.594005584716797, 5.071323394775391, 16.917984008789062, 11.729133605957031, 47.75497055053711, 67.62353515625, 71.31053924560547, 30.69849967956543, 85.16063690185547, 35.744293212890625, 91.19357299804688, 17.754146575927734, 3.447662353515625, 49.24378204345703, 68.85685729980469, -3.990083694458008, 0.2427520751953125, -24.457275390625, 37.87059783935547, -11.333717346191406, 77.15635681152344, 38.3575439453125, 2.275676727294922, 17.228485107421875, 39.707489013671875, 13.407341003417969, 4.358711242675781, 11.44610595703125, 63.73529815673828, -1.8880023956298828, 39.719512939453125, -43.01141357421875, -29.453643798828125, -3.7960586547851562, 25.01214599609375, 14.028831481933594, 51.542579650878906, -0.14318275451660156, 6.053886413574219, 77.67098999023438, 54.08414077758789, -1.9826679229736328, 10.142135620117188, 22.178001403808594, 73.0184326171875, 31.396265029907227, -35.661773681640625, 29.23602294921875, 55.92974090576172, -9.705642700195312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000225.npy"} +{"epoch": 0.3401360544217687, "step": 226, "batch_size": 64, "mean": 18.544370651245117, "std": 33.095645904541016, "min": -55.92768859863281, "p10": -23.79973754882812, "median": 18.817094802856445, "p90": 61.54630279541016, "max": 78.43881225585938, "pos_frac": 0.71875, "sample": [9.418342590332031, -26.73827362060547, 30.234909057617188, 28.53255271911621, 22.956329345703125, 26.469268798828125, 32.01612091064453, 3.3831024169921875, 41.21223449707031, -13.52774429321289, 52.42439270019531, 14.351945877075195, 37.01799774169922, 57.235599517822266, -40.55494689941406, -1.3366546630859375, 5.495077133178711, -55.92768859863281, 62.31587600708008, 36.567955017089844, 69.32212829589844, -7.656394958496094, 52.69536590576172, 5.759574890136719, 32.55371856689453, 0.42333030700683594, 8.206687927246094, 60.43065643310547, 48.963172912597656, 42.361183166503906, -13.108701705932617, 52.54545593261719, 14.757366180419922, 21.90728759765625, 69.44636535644531, 14.26275634765625, 28.665054321289062, -47.10221862792969, -6.519895553588867, 3.618295669555664, 0.7275238037109375, 22.903976440429688, -16.943153381347656, -48.95586395263672, 70.06951904296875, 78.43881225585938, -41.10154724121094, 21.00732421875, -43.255577087402344, 33.85298156738281, 15.148265838623047, 6.770685195922852, 16.62686538696289, 25.844934463500977, -5.2364349365234375, 75.18397521972656, 58.8873291015625, 62.024436950683594, -9.445770263671875, -5.649164199829102, 49.37476348876953, -1.6274032592773438, -7.124650955200195, 56.2403564453125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000226.npy"} +{"epoch": 0.3416477702191988, "step": 227, "batch_size": 64, "mean": 19.442760467529297, "std": 34.534671783447266, "min": -61.1021728515625, "p10": -16.071001434326167, "median": 11.483623504638672, "p90": 69.16846389770508, "max": 81.747314453125, "pos_frac": 0.71875, "sample": [46.88810729980469, 19.53873634338379, 1.4035568237304688, 60.39628601074219, -0.675994873046875, 0.20514678955078125, 41.909461975097656, 76.20794677734375, -59.43855285644531, -4.492824554443359, 81.747314453125, -12.203224182128906, -2.8338260650634766, 70.5266342163086, 17.029510498046875, 14.308151245117188, 5.261011123657227, -2.8817367553710938, 65.74605560302734, -12.513114929199219, 37.740478515625, 56.660438537597656, 5.337318420410156, 5.542173385620117, 80.84966278076172, 27.575180053710938, -2.2158355712890625, 41.61643981933594, -5.029611587524414, -4.1786346435546875, 40.34736633300781, 78.7420654296875, 29.029800415039062, 7.4673614501953125, 2.4290313720703125, 44.4053955078125, 81.02023315429688, 4.786872863769531, 29.736007690429688, 69.95230865478516, 4.087257385253906, 17.844268798828125, -17.595809936523438, 20.84375, 56.562347412109375, 9.5311279296875, 5.33074951171875, 5.591241836547852, -27.622055053710938, 0.6479911804199219, -44.05120086669922, 36.123512268066406, 35.05316162109375, 43.06903076171875, 1.6474895477294922, -61.1021728515625, 13.436119079589844, -1.4539604187011719, 67.33949279785156, -6.2695465087890625, -46.109710693359375, -23.204002380371094, 54.878150939941406, 61.816734313964844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000227.npy"} +{"epoch": 0.3431594860166289, "step": 228, "batch_size": 64, "mean": 21.414390563964844, "std": 31.206031799316406, "min": -48.263851165771484, "p10": -14.514068603515623, "median": 23.108272552490234, "p90": 68.07125701904299, "max": 89.5245361328125, "pos_frac": 0.75, "sample": [-1.6972217559814453, 54.44102478027344, 3.6064300537109375, 72.33409881591797, 24.594833374023438, 21.553009033203125, 22.907257080078125, 75.43749237060547, 12.878265380859375, -38.37877655029297, 30.934019088745117, 7.0162200927734375, 6.85736083984375, -48.263851165771484, 23.309288024902344, 3.504047393798828, 50.302833557128906, -14.950042724609375, 15.852245330810547, 28.947885513305664, 2.099794387817383, 75.019287109375, -33.185577392578125, 27.540122985839844, -13.311203002929688, 53.46249008178711, 42.36753845214844, 89.5245361328125, 17.267595291137695, 48.503456115722656, -8.964832305908203, -13.496795654296875, 50.490596771240234, 2.5374374389648438, 40.25285339355469, -5.958147048950195, 28.254478454589844, -2.5302257537841797, -21.011627197265625, -10.451164245605469, 17.848190307617188, 39.32183074951172, 44.424041748046875, -34.294654846191406, 32.19145202636719, 5.091562271118164, 72.8378677368164, 76.97628021240234, -29.873504638671875, 6.2169036865234375, -3.3791275024414062, 18.540233612060547, 43.86979675292969, 32.611610412597656, -6.617851257324219, 25.25751495361328, 63.46856689453125, 70.04383850097656, 57.621238708496094, 27.724868774414062, 2.9552764892578125, 25.272872924804688, 35.3941650390625, 27.42095184326172], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000228.npy"} +{"epoch": 0.34467120181405897, "step": 229, "batch_size": 64, "mean": 18.325944900512695, "std": 35.071048736572266, "min": -68.69827270507812, "p10": -17.958324432373043, "median": 13.720224380493164, "p90": 61.8668758392334, "max": 95.97457885742188, "pos_frac": 0.71875, "sample": [28.984222412109375, 60.1407470703125, 41.04724884033203, 31.566421508789062, 10.600715637207031, 25.035980224609375, 47.836402893066406, 20.035215377807617, 16.839733123779297, -32.21281433105469, 52.747215270996094, 35.955169677734375, 55.707733154296875, -2.3638839721679688, 27.01300048828125, 7.520910263061523, -59.31805419921875, -10.40566635131836, 57.879600524902344, 60.80543899536133, 16.981571197509766, 2.4884262084960938, 17.315673828125, 34.036842346191406, -38.365234375, 8.87350845336914, -18.93987274169922, -1.7585773468017578, 6.532663345336914, -11.480384826660156, -0.5849761962890625, 95.97457885742188, -68.69827270507812, 59.189788818359375, -15.668045043945312, 6.884954452514648, 53.25700378417969, -45.413028717041016, 5.5477447509765625, 26.098724365234375, 62.32177734375, 34.39137268066406, 0.2513923645019531, -3.8339176177978516, 49.18879318237305, 2.7232131958007812, 69.61043548583984, 28.5180721282959, 63.07148742675781, 9.785404205322266, -0.5892868041992188, -2.097705841064453, 31.81548309326172, -8.301925659179688, 73.80484008789062, 6.451263427734375, 1.0211639404296875, -0.03428077697753906, 63.999881744384766, 83.52850341796875, 58.85163879394531, 3.0132904052734375, 1.9881439208984375, -64.30702209472656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000229.npy"} +{"epoch": 0.34618291761148906, "step": 230, "batch_size": 64, "mean": 21.908802032470703, "std": 32.590457916259766, "min": -67.70857238769531, "p10": -3.032050895690918, "median": 13.899380683898926, "p90": 67.22787399291992, "max": 111.7711181640625, "pos_frac": 0.859375, "sample": [-5.1052703857421875, 17.215011596679688, 53.019630432128906, 2.4010963439941406, 17.69670867919922, -59.6597900390625, 4.911264419555664, 2.1703567504882812, 14.557998657226562, 73.82234191894531, 21.3280029296875, 74.38835144042969, 62.46074676513672, 71.51545715332031, 15.3294677734375, 25.49825096130371, 28.228618621826172, 64.15234375, -19.22974395751953, 4.6696014404296875, -67.70857238769531, 5.890144348144531, 26.691558837890625, 37.13492202758789, 39.29015350341797, 1.9935455322265625, 68.24639129638672, 11.088241577148438, 61.89360809326172, 48.715309143066406, 34.485107421875, 5.514247894287109, -2.735879898071289, 5.681182861328125, 10.505538940429688, 15.824012756347656, 5.269783020019531, 9.212440490722656, 111.7711181640625, 17.1158447265625, 11.294166564941406, 7.402336120605469, 2.181713104248047, 19.74175262451172, 93.83724212646484, 43.97040557861328, -25.301176071166992, 70.84246063232422, 10.361083984375, 2.680492401123047, 64.85133361816406, -32.14796447753906, 61.745635986328125, 38.81016540527344, 23.79705810546875, 11.188365936279297, 3.556215286254883, -0.1535358428955078, 13.240762710571289, 3.2212257385253906, 8.285749435424805, 48.56401062011719, -3.1589813232421875, 8.103679656982422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000230.npy"} +{"epoch": 0.3476946334089191, "step": 231, "batch_size": 64, "mean": 32.709712982177734, "std": 33.16936111450195, "min": -64.5330810546875, "p10": -4.9789482116699215, "median": 36.89725112915039, "p90": 73.50893478393556, "max": 92.44654846191406, "pos_frac": 0.828125, "sample": [62.45356750488281, 18.416099548339844, 55.576900482177734, 71.45647430419922, 4.4334259033203125, 19.22020721435547, 2.8217430114746094, 64.27862548828125, 17.02765655517578, 9.207275390625, 41.285003662109375, 1.2563018798828125, 43.8250732421875, -5.008991241455078, -5.7417144775390625, 40.50957489013672, 28.969696044921875, 66.58216094970703, 25.035293579101562, -3.9603805541992188, 43.79588317871094, -4.908847808837891, 41.6341552734375, 58.212825775146484, 7.804126739501953, 84.46380615234375, -6.816864013671875, -31.40097427368164, 79.55426025390625, 42.481014251708984, 73.98453521728516, -43.34010696411133, 39.81805419921875, 72.02865600585938, 55.16237258911133, 2.817962646484375, 5.663593292236328, 31.07938003540039, 4.4051513671875, -3.0388412475585938, 92.44654846191406, 5.815185546875, 37.49397277832031, 39.771087646484375, 33.641029357910156, 17.84993553161621, 55.57335662841797, -13.885822296142578, 22.624034881591797, -3.759632110595703, 65.63433837890625, 81.98037719726562, 36.30052947998047, 53.071617126464844, 59.641883850097656, 75.84090423583984, 46.432037353515625, 56.13494873046875, 35.02012634277344, 60.98066711425781, -64.5330810546875, 35.49128723144531, 72.39920043945312, 80.4129638671875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000231.npy"} +{"epoch": 0.3492063492063492, "step": 232, "batch_size": 64, "mean": 21.717304229736328, "std": 39.99732971191406, "min": -108.30191040039062, "p10": -18.12575798034668, "median": 14.854707717895508, "p90": 72.78762283325196, "max": 132.42984008789062, "pos_frac": 0.703125, "sample": [2.0569381713867188, 71.2198486328125, 46.52972412109375, 82.83660125732422, 8.417060852050781, 43.74409484863281, 16.956443786621094, 72.1219253540039, -0.5887527465820312, -17.743873596191406, -18.180004119873047, 5.7763824462890625, -7.633460998535156, 15.443546295166016, 27.078815460205078, 68.67637634277344, -1.1871490478515625, 5.1212158203125, 45.18196105957031, 6.513561248779297, -2.5113906860351562, 40.34913635253906, 54.18414306640625, 32.12507629394531, 10.634063720703125, 40.41991424560547, -9.676958084106445, 81.20486450195312, -11.595569610595703, 20.54071807861328, 36.60069274902344, 73.07292175292969, -21.802791595458984, -3.057962417602539, 18.04833984375, 4.490997314453125, 1.9043903350830078, -44.964385986328125, 86.08120727539062, 25.488479614257812, -1.6834487915039062, 69.98318481445312, -10.79718017578125, 112.0740966796875, 82.21112060546875, 132.42984008789062, -17.999183654785156, -21.51569366455078, -7.946453094482422, 13.130685806274414, 18.001564025878906, 66.75061798095703, 51.868896484375, 14.265869140625, 8.329769134521484, -36.36164855957031, 1.1638069152832031, 70.7685546875, 11.212547302246094, 19.395030975341797, -18.758201599121094, -108.30191040039062, 19.176559448242188, 18.631921768188477], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000232.npy"} +{"epoch": 0.3507180650037793, "step": 233, "batch_size": 64, "mean": 16.842357635498047, "std": 33.443668365478516, "min": -54.82306671142578, "p10": -20.448489189147946, "median": 6.582165718078613, "p90": 55.43459930419922, "max": 96.37751770019531, "pos_frac": 0.65625, "sample": [90.95958709716797, 5.389533996582031, 65.8849868774414, -24.371227264404297, 10.836963653564453, 31.245277404785156, 29.93584442138672, 19.731693267822266, -7.422061920166016, -9.772575378417969, 12.257522583007812, 96.37751770019531, -3.901927947998047, -0.7897567749023438, -5.638328552246094, 26.916839599609375, 53.9073600769043, 6.979631423950195, -3.4608688354492188, 4.045326232910156, 65.79168701171875, 6.184700012207031, 55.590545654296875, 55.07072448730469, -32.16693115234375, 20.658218383789062, -14.32470703125, 35.13141632080078, -30.391677856445312, -21.41168975830078, 50.611968994140625, 3.111654281616211, 49.90034484863281, 31.605403900146484, 52.05792999267578, -54.82306671142578, 18.31444549560547, 3.3831863403320312, -4.516937255859375, 0.6829338073730469, 9.744155883789062, -46.31354522705078, 43.834930419921875, -1.0116424560546875, 40.70642852783203, -11.880149841308594, -5.008781433105469, 28.970855712890625, 50.38903045654297, 47.32074737548828, -16.95590591430664, -18.201021194458008, 3.909402847290039, 87.93123626708984, 48.71876525878906, 84.73735046386719, 4.594614028930664, -11.937564849853516, 53.08949279785156, 3.3253021240234375, 26.028209686279297, -9.965339660644531, -23.797170639038086, 0.1100311279296875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000233.npy"} +{"epoch": 0.35222978080120937, "step": 234, "batch_size": 64, "mean": 16.384502410888672, "std": 36.10811233520508, "min": -51.242393493652344, "p10": -29.309519195556636, "median": 8.95009994506836, "p90": 67.85909423828126, "max": 86.24002838134766, "pos_frac": 0.671875, "sample": [8.933753967285156, -47.33244323730469, 0.721923828125, -32.29962158203125, 29.961578369140625, -0.7095527648925781, 2.7232189178466797, -31.60607147216797, 52.992095947265625, -17.178268432617188, 23.258438110351562, 28.909061431884766, 55.32953643798828, 21.29402732849121, 74.33695983886719, 54.63511276245117, -21.584243774414062, -47.333194732666016, 31.97857666015625, -4.494749069213867, 9.535409927368164, 2.2944068908691406, 66.99063110351562, 86.24002838134766, -0.39742088317871094, -8.741172790527344, 69.11518859863281, 1.0794658660888672, -51.242393493652344, 12.106330871582031, 55.151641845703125, 80.52009582519531, 75.1904296875, 58.33878707885742, -3.136516571044922, -51.03654479980469, -0.7318572998046875, -0.7735595703125, 7.129144668579102, -23.081188201904297, 61.01885223388672, 34.24895477294922, 8.966445922851562, 47.228309631347656, 57.63493347167969, 5.913541793823242, 6.357963562011719, 43.6490478515625, 68.23129272460938, -20.412126541137695, -5.077392578125, 22.19150733947754, -23.950897216796875, 30.764278411865234, -48.30202102661133, 2.316570281982422, 44.047332763671875, 7.459663391113281, 9.332672119140625, 8.373790740966797, 18.028968811035156, 81.50513458251953, 45.269020080566406, -23.274734497070312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000234.npy"} +{"epoch": 0.35374149659863946, "step": 235, "batch_size": 64, "mean": 29.62804412841797, "std": 32.200523376464844, "min": -48.724403381347656, "p10": -5.136475753784179, "median": 26.174182891845703, "p90": 69.62090377807617, "max": 93.2527847290039, "pos_frac": 0.84375, "sample": [1.2595596313476562, 26.524490356445312, 12.256370544433594, 31.576068878173828, 37.69697570800781, 24.869522094726562, 20.29759979248047, 93.2527847290039, 89.19638061523438, 51.95478820800781, 12.21240234375, 51.88496398925781, 21.015628814697266, 30.94074821472168, 67.10981750488281, 61.696109771728516, 33.554100036621094, 8.697673797607422, 60.286556243896484, 70.20655822753906, 9.786239624023438, 9.896385192871094, 13.345001220703125, 68.32291412353516, 69.63086700439453, 48.21739196777344, -5.406944274902344, -9.315414428710938, 70.66841125488281, -48.724403381347656, 47.64649963378906, 3.1368465423583984, 8.965185165405273, 19.427459716796875, 69.59765625, 14.329103469848633, 32.40229415893555, 6.97747802734375, 49.61248779296875, -32.72904968261719, -17.588048934936523, 54.3836669921875, 41.398284912109375, 13.075263977050781, 62.16294860839844, 5.412776947021484, -3.6080245971679688, 65.08151245117188, 88.58163452148438, 11.720359802246094, 25.823875427246094, -7.2731781005859375, 80.17112731933594, 27.128021240234375, 2.2200088500976562, -35.26045227050781, 58.15668487548828, 65.79915618896484, 68.07852172851562, 3.65594482421875, 40.755401611328125, -4.505382537841797, 0.49738311767578125, -1.9481945037841797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000235.npy"} +{"epoch": 0.35525321239606955, "step": 236, "batch_size": 64, "mean": 22.264503479003906, "std": 37.58650588989258, "min": -80.91139221191406, "p10": -12.208569145202636, "median": 14.399649620056152, "p90": 75.71823806762696, "max": 106.21070861816406, "pos_frac": 0.734375, "sample": [60.06900405883789, -6.596466064453125, 1.6419601440429688, 54.36850357055664, 13.991506576538086, 8.931503295898438, 61.126983642578125, 36.94020080566406, -10.619819641113281, 11.313095092773438, 30.375244140625, 12.97906494140625, -10.77070426940918, 5.8323211669921875, -12.356775283813477, 6.472862243652344, 50.95793914794922, 60.12284851074219, 39.039825439453125, 74.69778442382812, -3.7409400939941406, -6.023246765136719, 10.737106323242188, -0.8177528381347656, 14.807792663574219, 16.64484405517578, 42.041465759277344, 54.110443115234375, 78.62925720214844, 48.602333068847656, 75.03694152832031, 1.1970291137695312, 8.495529174804688, 13.346546173095703, 75.37843322753906, -25.000534057617188, 2.3654022216796875, 106.21070861816406, 18.41025161743164, 18.718229293823242, -47.448997497558594, 25.841236114501953, 57.339813232421875, 75.9955062866211, 33.48872375488281, 28.279542922973633, -2.359771728515625, -20.51026153564453, 77.86074829101562, 4.082386016845703, 2.076305389404297, -80.13436889648438, -80.91139221191406, 78.84297180175781, 77.63563537597656, 67.52667999267578, 17.904190063476562, -13.92176628112793, -11.862754821777344, -4.223812103271484, 75.8638687133789, -4.033027648925781, 17.927000045776367, 12.002975463867188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000236.npy"} +{"epoch": 0.35676492819349964, "step": 237, "batch_size": 64, "mean": 26.60751724243164, "std": 38.99484634399414, "min": -80.4775390625, "p10": -12.408360290527343, "median": 25.46572494506836, "p90": 72.3487434387207, "max": 106.31558227539062, "pos_frac": 0.78125, "sample": [64.81393432617188, 62.76604461669922, 18.520767211914062, 83.7627182006836, -5.0946197509765625, -12.898941040039062, 17.32459259033203, 24.151588439941406, 11.912853240966797, 59.99205017089844, 44.952606201171875, 46.22920227050781, -11.263671875, 4.4304962158203125, 61.47998046875, 28.924644470214844, -3.4279441833496094, 41.10717010498047, -32.1875, 63.92675018310547, -68.43150329589844, 55.562740325927734, 26.779861450195312, 49.38762283325195, 96.21977233886719, -5.122001647949219, 49.300201416015625, 58.22618103027344, -8.766448974609375, 18.954681396484375, 72.54280090332031, 13.442039489746094, 14.651969909667969, -80.4775390625, 39.19244384765625, 4.665805816650391, 7.258766174316406, -71.80182647705078, 104.52471923828125, 8.88947868347168, 34.40647888183594, 28.14513397216797, 13.390655517578125, 33.95143127441406, 6.159156799316406, 0.11612319946289062, 44.5616455078125, 48.63636779785156, 41.15618896484375, 69.8794937133789, 71.89594268798828, 15.658462524414062, 78.37437438964844, 106.31558227539062, -31.720733642578125, 11.985729217529297, -2.740884780883789, 60.17451477050781, 5.725181579589844, 32.797279357910156, -9.11141586303711, 22.772964477539062, -13.929023742675781, 79.8579330444336], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000237.npy"} +{"epoch": 0.35827664399092973, "step": 238, "batch_size": 64, "mean": 26.61792755126953, "std": 36.98060989379883, "min": -50.50526428222656, "p10": -21.5973388671875, "median": 26.805984497070312, "p90": 75.98388671875, "max": 92.95640563964844, "pos_frac": 0.71875, "sample": [-16.410053253173828, 9.820274353027344, 68.38328552246094, -20.081932067871094, 67.24703216552734, 76.71363067626953, 3.862651824951172, 20.844078063964844, 74.2811508178711, -24.348154067993164, 25.58068084716797, -15.040542602539062, 79.1587905883789, 11.580223083496094, 37.47607421875, 28.031288146972656, -1.6993541717529297, -11.618459701538086, 41.16777038574219, 79.83548736572266, 55.26929473876953, 85.17485046386719, 60.785865783691406, 48.22119140625, 6.3899688720703125, 68.83946228027344, 30.327880859375, -38.81200408935547, -30.516090393066406, 52.99305725097656, 53.95733642578125, 51.14387130737305, 3.4156360626220703, 70.21997833251953, -2.8802146911621094, 13.13448715209961, 47.746002197265625, -2.6587963104248047, 78.97630310058594, 67.9564208984375, 4.464290618896484, -7.506500244140625, -1.1973075866699219, 42.493560791015625, 59.91514587402344, 25.53936767578125, 92.95640563964844, 51.38523864746094, 34.622520446777344, 43.365234375, 11.43402099609375, 45.666770935058594, 72.09465026855469, -20.591323852539062, -11.658294677734375, 1.3320732116699219, -50.50526428222656, 7.816535949707031, 82.57758331298828, -22.028488159179688, 40.44586181640625, -23.73248291015625, -33.48769760131836, 3.677011489868164], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000238.npy"} +{"epoch": 0.35978835978835977, "step": 239, "batch_size": 64, "mean": 26.155561447143555, "std": 39.08329772949219, "min": -65.5430908203125, "p10": -18.10002212524414, "median": 24.270248413085938, "p90": 78.5378791809082, "max": 106.09187316894531, "pos_frac": 0.765625, "sample": [15.621868133544922, 5.720855712890625, 42.85115051269531, 0.09389877319335938, 91.47465515136719, 14.54461669921875, -8.12994384765625, 3.2993545532226562, -13.977828979492188, 27.289878845214844, -18.41423797607422, 24.299560546875, 3.145000457763672, 83.72816467285156, 60.39164733886719, 11.570236206054688, -32.43246078491211, -34.59996032714844, 21.3387451171875, 72.54632568359375, 4.011295318603516, 25.706321716308594, 70.02754974365234, 78.68840789794922, 78.1866455078125, 25.067834854125977, 40.202354431152344, 48.890926361083984, 35.169036865234375, 20.284141540527344, 72.75376892089844, 27.248201370239258, -24.35240936279297, -14.57423210144043, 23.200668334960938, 69.93499755859375, -3.2702980041503906, 10.277593612670898, -17.366851806640625, 27.246475219726562, -3.242870330810547, 22.558807373046875, 20.94359588623047, 25.777130126953125, -58.50669860839844, 40.52581787109375, 103.90027618408203, 102.69430541992188, 106.09187316894531, -53.05526351928711, -0.26583099365234375, 8.951278686523438, -65.5430908203125, 69.13841247558594, 56.26617431640625, 53.565521240234375, 80.77735137939453, -3.732433319091797, 24.240936279296875, 64.88442993164062, 3.9932403564453125, 41.287864685058594, 38.63573455810547, 26.375381469726562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000239.npy"} +{"epoch": 0.36130007558578986, "step": 240, "batch_size": 64, "mean": 33.40362548828125, "std": 38.86969757080078, "min": -75.88787078857422, "p10": -10.2266845703125, "median": 34.09905815124512, "p90": 84.28110046386719, "max": 106.81700134277344, "pos_frac": 0.796875, "sample": [41.58956527709961, -15.237251281738281, 79.25717163085938, -1.1143035888671875, 43.23521423339844, 106.81700134277344, 39.32379150390625, 49.526161193847656, -35.350303649902344, -25.848304748535156, 4.088813781738281, -3.5793590545654297, 51.6783332824707, 31.73493766784668, 66.18316650390625, 84.46549224853516, 54.47264099121094, -19.577299118041992, 83.8508529663086, 34.365509033203125, -9.44437026977539, 66.55453491210938, 33.83260726928711, -34.85828399658203, 34.97541809082031, 55.321922302246094, 33.64839172363281, 70.56492614746094, 101.28897094726562, 31.303611755371094, 71.4889907836914, 100.78955078125, 7.648826599121094, 23.540313720703125, 3.148468017578125, 66.70632934570312, 16.75048065185547, 58.409820556640625, 78.71968078613281, 4.045259475708008, 71.62997436523438, 14.290424346923828, -10.561962127685547, 50.601036071777344, 91.06745147705078, -75.88787078857422, -2.7447071075439453, 0.20725631713867188, 34.62287902832031, 3.5340118408203125, 36.70698165893555, 81.69862365722656, -2.7778396606445312, 11.375015258789062, 1.6626052856445312, 16.49596405029297, 86.56838989257812, 91.92579650878906, 55.198768615722656, 17.60874366760254, 60.565635681152344, 7.6540985107421875, -6.355735778808594, 18.429336547851562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000240.npy"} +{"epoch": 0.36281179138321995, "step": 241, "batch_size": 64, "mean": 21.52923011779785, "std": 38.40837478637695, "min": -72.27718353271484, "p10": -21.672070312499997, "median": 13.905441284179688, "p90": 74.00965805053711, "max": 105.67350006103516, "pos_frac": 0.6875, "sample": [-11.75537109375, -26.792648315429688, 52.880653381347656, -23.207468032836914, 55.70049285888672, -18.814712524414062, 12.120407104492188, 51.15289306640625, 64.22664642333984, 52.75712585449219, -6.164947509765625, 60.784324645996094, -10.272697448730469, 26.288713455200195, 15.144584655761719, 70.3600082397461, 2.263294219970703, 3.879732131958008, 7.478492736816406, 75.48854064941406, 53.20832824707031, 40.73675537109375, -7.56732177734375, 2.2995071411132812, 16.745895385742188, -4.572683334350586, 54.896183013916016, -4.346590042114258, -12.073295593261719, -22.896652221679688, 74.72472381591797, 98.61927795410156, 94.34352111816406, 10.537284851074219, -4.994606018066406, -39.501190185546875, -7.90728759765625, 34.5439453125, 24.669708251953125, 3.7171592712402344, -72.27718353271484, 3.4280433654785156, 0.1671314239501953, 80.21994018554688, 18.650758743286133, 29.694847106933594, -56.845703125, 105.67350006103516, 33.923065185546875, -31.895187377929688, 80.334228515625, 12.666297912597656, 58.81224060058594, 15.589401245117188, 72.34117126464844, -7.628215789794922, 3.7710494995117188, 65.15516662597656, 58.204856872558594, 41.618682861328125, 4.132013320922852, 17.883018493652344, -11.54881477355957, -2.900358200073242], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000241.npy"} +{"epoch": 0.36432350718065004, "step": 242, "batch_size": 64, "mean": 28.31048583984375, "std": 40.97209548950195, "min": -78.35444641113281, "p10": -6.945840835571287, "median": 19.703784942626953, "p90": 85.66906814575195, "max": 136.55563354492188, "pos_frac": 0.78125, "sample": [-55.84103775024414, 18.72815704345703, 32.11072540283203, 5.685009002685547, 38.84247589111328, -29.745044708251953, 84.94866180419922, 58.09673309326172, 29.145736694335938, 51.413665771484375, 37.282371520996094, 53.62644577026367, 0.15751075744628906, 107.01444244384766, 80.30319213867188, -8.831130981445312, 85.97781372070312, -5.570068359375, 1.6000442504882812, -7.535457611083984, 17.61994171142578, 40.977439880371094, 86.97723388671875, 5.27556037902832, -1.9669265747070312, 23.543899536132812, 20.679412841796875, -1.37884521484375, 63.396934509277344, 46.915496826171875, 55.456459045410156, 0.8356113433837891, 103.32723999023438, 13.338083267211914, 62.14728546142578, 11.704597473144531, -0.6906108856201172, 0.09992599487304688, 136.55563354492188, 11.34714126586914, -37.00636291503906, 46.827491760253906, 45.27961730957031, 2.6322669982910156, 42.714820861816406, 1.60406494140625, 56.93865966796875, 10.173316955566406, 62.14973449707031, 72.636474609375, 90.70005798339844, 48.43147277832031, 107.28384399414062, -4.519197463989258, -0.5352649688720703, 36.030799865722656, 53.984283447265625, 0.4557209014892578, 8.466438293457031, -78.35444641113281, 2.8315811157226562, -5.027095794677734, -41.72783660888672, 16.3290958404541], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000242.npy"} +{"epoch": 0.36583522297808013, "step": 243, "batch_size": 64, "mean": 26.324024200439453, "std": 37.974300384521484, "min": -62.084625244140625, "p10": -21.325096511840812, "median": 21.997230529785156, "p90": 78.34377059936524, "max": 94.59002685546875, "pos_frac": 0.75, "sample": [4.304988861083984, 71.69245910644531, 60.84973907470703, -31.239730834960938, 61.49787139892578, 4.309907913208008, -62.084625244140625, -0.8007736206054688, 62.70629119873047, -2.8989791870117188, 57.540557861328125, 31.70915985107422, 6.534759521484375, 17.872528076171875, 20.302978515625, 88.23666381835938, -0.7648372650146484, 9.757682800292969, 82.90277099609375, -9.71759033203125, 2.4113006591796875, 89.48617553710938, 41.19044494628906, -5.488489151000977, 54.82514953613281, 38.92584228515625, 9.772865295410156, 45.06658172607422, 75.31944274902344, 40.75465393066406, -49.613250732421875, -32.27560043334961, 48.41815185546875, -6.921289443969727, 74.66339874267578, 41.736297607421875, 66.85112762451172, 76.52535247802734, -40.106689453125, 23.691482543945312, 94.59002685546875, 35.14947509765625, 32.17198181152344, 89.7111587524414, 12.23590087890625, 0.5008201599121094, 1.6836509704589844, 8.474264144897461, 79.12309265136719, 39.02898406982422, -1.7272186279296875, 19.870895385742188, 7.3717041015625, 74.3932113647461, -25.329547882080078, 36.30479431152344, 33.886722564697266, 7.081508636474609, -11.981376647949219, -10.138336181640625, -31.052268981933594, 84.63766479492188, 10.0809326171875, 30.724700927734375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000243.npy"} +{"epoch": 0.3673469387755102, "step": 244, "batch_size": 64, "mean": 34.653926849365234, "std": 37.80606460571289, "min": -69.8133773803711, "p10": -1.6973220825195312, "median": 26.684513092041016, "p90": 87.08038635253907, "max": 100.09657287597656, "pos_frac": 0.84375, "sample": [12.078971862792969, 43.42444610595703, 29.419967651367188, 19.88237762451172, -6.42352294921875, 29.26180076599121, -2.95184326171875, 82.63334655761719, 34.463340759277344, -21.44391632080078, 16.35519790649414, 67.03147888183594, 13.371932983398438, 73.28157043457031, 34.00132751464844, -2.233154296875, 58.113548278808594, 81.4043960571289, -69.8133773803711, 80.968017578125, 25.350509643554688, 12.259540557861328, -46.661521911621094, 56.87306213378906, 12.206710815429688, 77.63788604736328, 62.17216491699219, 72.38214111328125, 86.57494354248047, 13.857019424438477, 94.86085510253906, 43.98986053466797, -1.0275745391845703, -1.5685501098632812, -1.512664794921875, 18.780046463012695, 0.184478759765625, 70.81324768066406, 79.92578125, 100.09657287597656, 2.9354286193847656, 88.87713623046875, 1.0004119873046875, 9.98193359375, 2.3389892578125, 88.05795288085938, 28.018516540527344, 64.9204330444336, 4.032482147216797, 20.12063980102539, 3.764474868774414, 12.154312133789062, 81.12420654296875, 34.489845275878906, 94.45210266113281, 36.061866760253906, -1.7525100708007812, 19.9522705078125, 10.042186737060547, 2.3977127075195312, 67.80645751953125, 17.640050888061523, 87.29700469970703, 92.11709594726562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000244.npy"} +{"epoch": 0.3688586545729403, "step": 245, "batch_size": 64, "mean": 39.84870910644531, "std": 38.20399856567383, "min": -63.08111572265625, "p10": -3.5440979003906232, "median": 40.8222713470459, "p90": 88.04446411132812, "max": 103.95121002197266, "pos_frac": 0.875, "sample": [54.577430725097656, 61.498565673828125, 58.33407974243164, 88.1632080078125, 21.73628807067871, 6.568359375, 4.254001617431641, 78.35090637207031, 67.98223114013672, 54.28917694091797, 2.391773223876953, 29.543670654296875, 76.010498046875, 38.25165939331055, 37.43054962158203, 83.52503967285156, 10.333511352539062, 76.76007080078125, -32.046142578125, 103.95121002197266, 98.11725616455078, 4.214286804199219, -1.915008544921875, 45.96338653564453, 77.04281616210938, 35.755096435546875, 50.674041748046875, -4.242279052734375, 65.45484924316406, 2.144346237182617, 86.24699401855469, -45.556861877441406, 1.4462509155273438, 48.892974853515625, 11.869987487792969, 57.45671081542969, 3.7975616455078125, 31.391122817993164, 62.42116928100586, 102.53137969970703, 36.991668701171875, 4.8873748779296875, 84.46723937988281, 4.122398376464844, -5.341394424438477, 40.84392547607422, 90.3347396850586, 85.36270904541016, 6.787506103515625, -6.180511474609375, 54.33934020996094, 71.29385375976562, -9.636566162109375, 57.967288970947266, 95.86767578125, 40.80061721801758, -63.08111572265625, 89.72023010253906, 32.991825103759766, 17.134258270263672, 5.100128173828125, 87.76739501953125, 30.435718536376953, 41.7290153503418], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000245.npy"} +{"epoch": 0.37037037037037035, "step": 246, "batch_size": 64, "mean": 30.170146942138672, "std": 48.89647674560547, "min": -85.21586608886719, "p10": -23.76462478637695, "median": 20.517555236816406, "p90": 87.1149513244629, "max": 145.24893188476562, "pos_frac": 0.75, "sample": [72.3570556640625, 81.20089721679688, 87.26289367675781, 84.18193054199219, 10.749313354492188, 6.661746978759766, -76.46163940429688, 85.58808898925781, 30.090866088867188, -15.846818923950195, 82.91380310058594, 80.87738037109375, 44.05755615234375, -6.148160934448242, 50.51036071777344, 67.13154602050781, 13.318809509277344, -7.360189437866211, -9.442390441894531, -1.287689208984375, 22.5753173828125, 57.263832092285156, -0.9008407592773438, 90.59001159667969, 103.61096954345703, -47.88627624511719, 26.801101684570312, 145.24893188476562, -26.221435546875, 11.029998779296875, 12.597375869750977, 81.501708984375, 15.523666381835938, 3.8687191009521484, -37.272857666015625, 54.14436340332031, -77.20606231689453, 13.128984451293945, 86.7697525024414, 4.248565673828125, 47.18141174316406, -62.703041076660156, -18.032066345214844, 93.11449432373047, 45.4684944152832, 0.1250457763671875, 61.395172119140625, 76.39018249511719, 88.50961303710938, -85.21586608886719, 2.75830078125, 17.54631805419922, 62.05720520019531, 108.04834747314453, 9.235492706298828, -2.742156982421875, 75.09976196289062, 75.56494903564453, -5.65362548828125, 2.185089111328125, 33.591407775878906, 18.459793090820312, 63.48951721191406, 5.2444000244140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000246.npy"} +{"epoch": 0.37188208616780044, "step": 247, "batch_size": 64, "mean": 19.326343536376953, "std": 41.74576187133789, "min": -81.29138946533203, "p10": -37.17328643798828, "median": 19.149724006652832, "p90": 70.31873016357422, "max": 133.8326416015625, "pos_frac": 0.734375, "sample": [-53.063629150390625, 69.41036224365234, 36.11334228515625, 20.228797912597656, 5.081806182861328, -12.247421264648438, 4.5355987548828125, 86.9981689453125, 88.10446166992188, -1.2926177978515625, 63.44389343261719, 31.4107666015625, 70.7080307006836, 31.44353675842285, 17.72845458984375, 80.49920654296875, 56.41499328613281, 27.365306854248047, -8.302162170410156, -66.33895874023438, 133.8326416015625, 80.79719543457031, -63.835655212402344, -18.141199111938477, 5.951324462890625, 18.2681884765625, 44.87489700317383, -4.092063903808594, -44.18055725097656, 53.651092529296875, 25.203094482421875, 19.74669647216797, 34.17742919921875, 4.73291015625, 26.385406494140625, 13.096351623535156, 55.980552673339844, -81.29138946533203, -38.4593505859375, 1.657358169555664, 0.09357070922851562, 13.381731033325195, 0.301361083984375, 76.62250518798828, 54.7281494140625, 18.06412124633789, 0.20856857299804688, -23.60102081298828, 20.729267120361328, 51.63885498046875, 23.087936401367188, 45.35661315917969, -17.728713989257812, 18.552751541137695, -60.77875518798828, 46.559356689453125, 60.132450103759766, 60.47894287109375, -6.461029052734375, -34.17247009277344, -14.85943603515625, 48.66349792480469, 21.32317352294922, 17.96760368347168], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000247.npy"} +{"epoch": 0.37339380196523053, "step": 248, "batch_size": 64, "mean": 31.508869171142578, "std": 47.85458755493164, "min": -56.607208251953125, "p10": -29.22377490997314, "median": 20.516719818115234, "p90": 94.47240753173828, "max": 121.94037628173828, "pos_frac": 0.734375, "sample": [6.30609130859375, 66.44932556152344, -45.011932373046875, -53.112945556640625, 102.94129180908203, 80.05672454833984, 82.44844055175781, 68.10751342773438, -0.3131580352783203, -19.413057327270508, 1.5248889923095703, 90.18263244628906, 32.200042724609375, -30.41225242614746, 86.18011474609375, 43.34376525878906, 107.18527221679688, -21.73717498779297, -51.08223342895508, 25.935531616210938, -26.450660705566406, 8.636077880859375, 19.433868408203125, 9.307756423950195, 86.30595397949219, 62.36966323852539, 83.13208770751953, 17.002952575683594, 48.023929595947266, 95.90814208984375, -49.224754333496094, 82.22816467285156, -4.20440673828125, -9.274410247802734, 93.05628967285156, 84.5379638671875, 18.652435302734375, 21.599571228027344, 24.194414138793945, 30.674896240234375, 67.26713562011719, 73.61709594726562, 15.616125106811523, 105.30450439453125, 105.00248718261719, 33.80582809448242, 7.774177551269531, -0.4045600891113281, 8.880311965942383, 70.055908203125, 121.94037628173828, 7.111133575439453, 70.17033386230469, 6.718177795410156, -56.607208251953125, 7.739252090454102, -24.296875, 95.07931518554688, 75.04657745361328, -1.1036300659179688, 3.4571704864501953, 7.825443267822266, -38.3931884765625, -12.727142333984375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000248.npy"} +{"epoch": 0.3749055177626606, "step": 249, "batch_size": 64, "mean": 12.360498428344727, "std": 44.955291748046875, "min": -102.89512634277344, "p10": -46.74131622314453, "median": 10.749309539794922, "p90": 74.83503036499025, "max": 96.58171844482422, "pos_frac": 0.6875, "sample": [13.359947204589844, -36.6993408203125, 8.31985855102539, 45.315277099609375, 16.259342193603516, -34.12226867675781, -58.76787567138672, 39.81183624267578, 42.38818359375, 42.857818603515625, 32.625389099121094, 65.36283874511719, 6.151771545410156, 72.04883575439453, -78.98995971679688, -17.288711547851562, 36.99920654296875, -41.279762268066406, -46.71443176269531, -35.209983825683594, 9.667497634887695, -4.165435791015625, -49.93341827392578, 10.465110778808594, 37.41474914550781, 10.337394714355469, 0.7033786773681641, -12.310478210449219, 89.59989929199219, -30.699066162109375, -14.938423156738281, 78.038818359375, 8.300846099853516, 30.25248146057129, 51.16703414916992, -73.85406494140625, 11.197181701660156, 6.0949859619140625, 15.643449783325195, -46.752838134765625, 8.651865005493164, 90.69096374511719, 66.32437133789062, 85.62602233886719, 27.33685302734375, 9.30141830444336, -59.44392395019531, 53.485530853271484, 27.296852111816406, 11.03350830078125, 35.79358673095703, 76.02911376953125, 41.95965576171875, 0.5895919799804688, 21.846792221069336, 22.133773803710938, -25.91575813293457, 62.753387451171875, 96.58171844482422, -102.89512634277344, 80.19108581542969, -39.24353790283203, -4.028594970703125, 6.315673828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000249.npy"} +{"epoch": 0.3764172335600907, "step": 250, "batch_size": 64, "mean": 32.52125549316406, "std": 44.06401443481445, "min": -108.55470275878906, "p10": -10.889102554321289, "median": 26.81318473815918, "p90": 85.6246322631836, "max": 129.91873168945312, "pos_frac": 0.78125, "sample": [39.7982177734375, 14.565099716186523, -1.8613834381103516, 12.236810684204102, 3.175994873046875, 39.99247741699219, 47.255123138427734, 104.26750183105469, 85.88224792480469, -0.44647216796875, 70.06320190429688, -20.183143615722656, 70.05079650878906, 15.51092529296875, 60.76030731201172, 6.106756210327148, -2.26605224609375, -108.55470275878906, 68.90708923339844, 18.60466766357422, 40.613006591796875, -10.540477752685547, 16.943431854248047, -56.02527618408203, 75.85303497314453, 19.078582763671875, 93.69151306152344, 32.072410583496094, 6.3662109375, 41.255279541015625, -11.295581817626953, 48.384857177734375, 85.02352905273438, 0.9696693420410156, 32.93390655517578, 14.429161071777344, 0.5967674255371094, 68.00056457519531, 111.14649200439453, 39.94427490234375, -55.012115478515625, -1.5823249816894531, 39.88552474975586, 2.8303756713867188, 116.26899719238281, 67.84854125976562, 76.81625366210938, 68.86373901367188, 70.70454406738281, 78.54522705078125, -11.03851318359375, -18.55030059814453, 89.59065246582031, 4.995258331298828, 12.76275634765625, 11.621124267578125, 129.91873168945312, 72.89179229736328, 21.553958892822266, -0.2907695770263672, -5.115047454833984, 83.14192199707031, 33.632789611816406, 17.770553588867188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000250.npy"} +{"epoch": 0.3779289493575208, "step": 251, "batch_size": 64, "mean": 20.47119903564453, "std": 43.782081604003906, "min": -85.29487609863281, "p10": -40.44852523803711, "median": 19.402865409851074, "p90": 73.66767807006836, "max": 115.39974212646484, "pos_frac": 0.6875, "sample": [3.5843677520751953, 95.48900604248047, 97.9461441040039, -1.3193683624267578, 28.66790771484375, 49.32701873779297, -85.29487609863281, 24.782093048095703, 58.20087432861328, 115.39974212646484, 6.024131774902344, -65.03668975830078, 13.842880249023438, -14.650230407714844, 18.742412567138672, -28.380634307861328, 62.25876998901367, 100.55618286132812, 14.487554550170898, -71.39067077636719, -33.83075714111328, 96.49987030029297, -0.1374492645263672, -47.38893127441406, 17.582366943359375, -20.11054229736328, 20.95409393310547, 50.12109375, -19.43675994873047, -2.2517623901367188, 67.6308364868164, 61.82978820800781, 13.609508514404297, 23.736276626586914, 43.72057342529297, 24.670684814453125, 60.01636505126953, 40.275115966796875, -42.543304443359375, -0.7599563598632812, 49.93136215209961, 1.192779541015625, 73.2314224243164, 18.066303253173828, 17.31621551513672, 30.3800048828125, 27.155181884765625, 14.252830505371094, 41.78221130371094, 58.49310302734375, 73.85464477539062, 4.8914794921875, 58.22128677368164, -23.3206787109375, -4.666542053222656, -1.7148075103759766, 52.39278030395508, -42.370704650878906, 26.26026725769043, -49.244606018066406, -35.96343994140625, 44.784820556640625, 77.74366760253906, 20.063318252563477], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000251.npy"} +{"epoch": 0.3794406651549509, "step": 252, "batch_size": 64, "mean": 17.26245880126953, "std": 47.788272857666016, "min": -101.45217895507812, "p10": -55.972418975830074, "median": 15.613492965698242, "p90": 80.35558319091798, "max": 115.96031188964844, "pos_frac": 0.71875, "sample": [37.90441131591797, -85.74742126464844, -15.782632827758789, -86.00445556640625, 50.01470947265625, 1.2991104125976562, 17.408069610595703, 65.07688903808594, 1.7496833801269531, 89.5817642211914, 81.17850494384766, 50.472267150878906, 22.655227661132812, 4.129203796386719, 103.09020233154297, -13.655311584472656, 98.58463287353516, -60.26915740966797, 19.91315460205078, -1.2206363677978516, -58.432640075683594, 17.48179054260254, 36.24726867675781, 15.434947967529297, 17.596572875976562, 9.855438232421875, 14.14306640625, -10.066749572753906, 78.43543243408203, -0.04145050048828125, 51.530250549316406, 115.96031188964844, 67.86288452148438, 7.4846954345703125, 31.39130401611328, 5.9979248046875, 31.318313598632812, 11.760175704956055, 31.14951515197754, -25.640247344970703, 36.528324127197266, -22.29686737060547, -0.084320068359375, 63.97389602661133, 0.4238433837890625, 115.5791015625, -50.231903076171875, 4.6898345947265625, -101.45217895507812, -68.87887573242188, -14.184785842895508, 15.792037963867188, 52.301910400390625, -60.45270538330078, 9.707313537597656, 84.96549224853516, 10.257148742675781, 72.7698745727539, 17.3135986328125, 29.13774871826172, 60.96405029296875, 30.3907470703125, -22.656885147094727, 10.393974304199219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000252.npy"} +{"epoch": 0.38095238095238093, "step": 253, "batch_size": 64, "mean": 24.230724334716797, "std": 41.131431579589844, "min": -68.18624114990234, "p10": -24.115024566650387, "median": 18.43200397491455, "p90": 78.67312622070314, "max": 112.19766235351562, "pos_frac": 0.703125, "sample": [62.00696563720703, -1.294952392578125, 96.99430847167969, 9.158302307128906, -1.8097152709960938, 23.254314422607422, 28.632041931152344, 75.84913635253906, 65.890625, 33.87548828125, 60.892051696777344, -3.8842239379882812, 66.38746643066406, 4.44378662109375, -1.9955883026123047, -63.54214096069336, -19.12348175048828, 35.77899932861328, -14.4349365234375, 51.77983856201172, 70.70945739746094, 45.38842010498047, -60.427860260009766, 52.63275146484375, 19.04184913635254, 5.93768310546875, 79.88340759277344, 27.90863037109375, 2.7300796508789062, 43.71846008300781, 17.822158813476562, 12.481246948242188, 74.29269409179688, -3.710704803466797, 11.996185302734375, 112.19766235351562, 29.21612548828125, -68.18624114990234, 15.99267578125, 27.141939163208008, 11.439750671386719, -11.987869262695312, 26.736114501953125, -9.081947326660156, 90.7978744506836, -26.672945022583008, -12.015768051147461, 32.28242492675781, 96.99205780029297, 26.12980842590332, 16.333328247070312, 83.84130859375, 107.86078643798828, 11.642738342285156, 73.56394958496094, -26.254257202148438, 37.197113037109375, -33.09764862060547, 61.933311462402344, -40.120513916015625, -15.932777404785156, -2.2280826568603516, 13.365921020507812, 12.416736602783203], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000253.npy"} +{"epoch": 0.382464096749811, "step": 254, "batch_size": 64, "mean": 25.899559020996094, "std": 42.4937858581543, "min": -69.0812759399414, "p10": -17.104741859436036, "median": 14.372123718261719, "p90": 91.37611618041994, "max": 102.28266143798828, "pos_frac": 0.6875, "sample": [-2.464019775390625, 23.422576904296875, 98.49774169921875, 14.403701782226562, -9.564453125, 60.46055603027344, 68.52565002441406, 76.87953186035156, 4.673494338989258, 0.09405708312988281, -7.04022216796875, 12.71578598022461, 49.429908752441406, 71.33181762695312, 75.20409393310547, 78.16380310058594, 97.98583984375, 23.55225372314453, -23.133689880371094, 62.913841247558594, -8.736320495605469, 102.28266143798828, -30.61090087890625, 93.5205078125, -16.162574768066406, -69.0812759399414, -27.466049194335938, 94.67861938476562, 24.61781883239746, -2.0984458923339844, 99.59538269042969, -8.660186767578125, 7.1976776123046875, 0.5143852233886719, -3.1748619079589844, 14.340545654296875, 2.282825469970703, 74.68113708496094, 1.58831787109375, 39.472503662109375, 14.448554992675781, -7.746669769287109, 16.823535919189453, -28.560043334960938, -17.508527755737305, 93.94527435302734, -1.8713226318359375, 86.3725357055664, 49.260406494140625, 24.66225242614746, 15.547195434570312, -13.833564758300781, -15.177055358886719, 69.08689880371094, 80.50112915039062, -7.096382141113281, 35.31464385986328, 4.10725212097168, 65.61553192138672, 66.58561706542969, 6.2699737548828125, 10.248504638671875, 3.910003662109375, -58.168006896972656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000254.npy"} +{"epoch": 0.3839758125472411, "step": 255, "batch_size": 64, "mean": 32.5498046875, "std": 46.4442024230957, "min": -76.26533508300781, "p10": -12.91929244995117, "median": 19.629122734069824, "p90": 101.86907196044922, "max": 127.29446411132812, "pos_frac": 0.765625, "sample": [93.92770385742188, 52.76359558105469, 127.29446411132812, 55.359222412109375, 73.30729675292969, 30.378326416015625, -8.407051086425781, -8.910575866699219, 10.611064910888672, 75.86750793457031, -52.260223388671875, -1.6632251739501953, 14.640098571777344, 78.70293426513672, -18.694372177124023, 11.667095184326172, 48.452232360839844, 11.869087219238281, 10.426368713378906, -76.26533508300781, 91.48500061035156, 8.516197204589844, 21.564208984375, 9.486656188964844, 106.60079956054688, 72.53873443603516, -22.08942413330078, 16.852787017822266, 109.21842193603516, -10.629547119140625, 103.36250305175781, 71.9911117553711, -13.900611877441406, 29.783489227294922, 24.791717529296875, 17.69403648376465, 8.573869705200195, 65.52862548828125, 104.75399017333984, 17.44307518005371, 3.5762767791748047, 71.02474975585938, 83.7464599609375, -8.625625610351562, 12.807256698608398, -3.2008209228515625, 31.70018768310547, 114.38314819335938, -43.49311065673828, 40.15552520751953, 1.4764785766601562, 100.92031860351562, 9.684028625488281, 102.27568054199219, 37.80450439453125, 61.395355224609375, 4.432811737060547, 58.440547943115234, 73.2669677734375, -73.71737670898438, -1.32757568359375, 1.8911666870117188, 50.106048583984375, -8.167396545410156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000255.npy"} +{"epoch": 0.3854875283446712, "step": 256, "batch_size": 64, "mean": 29.04998779296875, "std": 50.365257263183594, "min": -98.77123260498047, "p10": -24.37005233764648, "median": 23.724624633789062, "p90": 95.55722579956056, "max": 146.76611328125, "pos_frac": 0.6875, "sample": [-28.58368682861328, 17.192398071289062, 57.889705657958984, 39.29013442993164, 71.61863708496094, -31.73163604736328, -14.749670028686523, 101.01618957519531, 32.560951232910156, -11.794408798217773, -48.025146484375, 3.0439586639404297, -10.516876220703125, 108.80143737792969, 22.618316650390625, 106.67610931396484, -0.37316131591796875, 6.6213836669921875, -98.77123260498047, 57.94523620605469, 4.933284759521484, 72.21749877929688, -10.461935043334961, 20.319625854492188, -25.958389282226562, -76.11447143554688, 41.481807708740234, -4.749961853027344, 22.206703186035156, 63.198448181152344, 2.2955474853515625, 43.25569152832031, 46.508155822753906, 86.10346984863281, 80.59231567382812, 56.74378204345703, 90.22918701171875, 79.17291259765625, -6.80206298828125, 101.4208984375, 25.463340759277344, 33.03157043457031, 122.040771484375, 0.4182281494140625, 91.75398254394531, 12.435012817382812, 76.34028625488281, 5.322898864746094, 46.37091827392578, 146.76611328125, -18.09516143798828, 78.66136932373047, -0.94390869140625, 4.312103271484375, 71.021728515625, -16.485923767089844, 52.163604736328125, -8.578712463378906, -3.923768997192383, 97.18718719482422, -79.44735717773438, 24.8309326171875, -20.66393280029297, 51.89672088623047], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000256.npy"} +{"epoch": 0.3869992441421013, "step": 257, "batch_size": 64, "mean": 34.765472412109375, "std": 50.34027862548828, "min": -86.24866485595703, "p10": -16.421791839599603, "median": 20.66988754272461, "p90": 104.14242782592774, "max": 166.48690795898438, "pos_frac": 0.75, "sample": [-0.6863365173339844, 14.457229614257812, -18.731536865234375, 166.48690795898438, 111.20613098144531, 46.27357864379883, 3.265249252319336, 71.03240203857422, 22.313095092773438, 72.27396392822266, 101.0870361328125, 19.02667999267578, 6.726114273071289, -7.0215301513671875, 85.97113037109375, 79.11913299560547, 97.91363525390625, -1.4816436767578125, -38.558868408203125, -2.5146408081054688, 2.971414566040039, 49.21105194091797, 40.73443603515625, 12.00714111328125, 44.47156524658203, 3.23968505859375, -1.0115699768066406, 104.55304718017578, 84.41979217529297, -1.8855743408203125, 77.93824768066406, 101.52650451660156, 37.1563720703125, 6.518516540527344, 40.319602966308594, 27.056907653808594, 12.412628173828125, 94.70938110351562, 114.60357666015625, -66.83053588867188, -86.24866485595703, 133.8173828125, 29.535240173339844, 17.04895782470703, -5.236480712890625, -35.96294403076172, 14.024177551269531, 2.5428466796875, 43.73204803466797, 56.582618713378906, 81.04052734375, 14.820281982421875, 104.42255401611328, 14.778095245361328, -43.466156005859375, 105.9302978515625, -4.356658935546875, -25.148948669433594, 103.48880004882812, 11.337890625, 53.05735397338867, 12.766159057617188, 25.237411499023438, -11.032386779785156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000257.npy"} +{"epoch": 0.3885109599395314, "step": 258, "batch_size": 64, "mean": 27.98311424255371, "std": 36.487125396728516, "min": -69.34129333496094, "p10": -1.1522834777831987, "median": 24.757946968078613, "p90": 78.62808380126955, "max": 116.10360717773438, "pos_frac": 0.890625, "sample": [51.0087890625, 8.549747467041016, 30.268692016601562, -3.030385971069336, 11.509040832519531, 86.52164459228516, 110.73982238769531, 56.015228271484375, 51.184104919433594, 3.2299556732177734, 16.53143882751465, 23.592376708984375, -46.97462463378906, 19.418169021606445, 32.57404327392578, 73.69314575195312, 24.58154296875, -35.15274429321289, 37.64398193359375, -69.34129333496094, 3.8921241760253906, 40.91736602783203, -50.333946228027344, 19.861373901367188, 20.091873168945312, 38.25023651123047, 14.705192565917969, 51.085296630859375, 15.795642852783203, 15.934677124023438, 29.148834228515625, 4.082996368408203, 36.00371551513672, 63.415077209472656, 24.934350967407227, 18.14971923828125, 5.8412322998046875, 16.805816650390625, 34.728179931640625, 116.10360717773438, 30.60309600830078, -20.16351318359375, 101.27433776855469, 48.48237609863281, 31.332000732421875, 91.92311096191406, 53.73027038574219, 50.47270584106445, 5.376304626464844, 80.7876205444336, 4.698844909667969, 17.934814453125, 44.502830505371094, 27.375839233398438, 17.978858947753906, 6.893041610717773, 41.28814697265625, -55.73980712890625, 7.8208770751953125, 3.8283252716064453, 43.317779541015625, 62.48126220703125, 80.74305725097656, 12.001142501831055], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000258.npy"} +{"epoch": 0.3900226757369615, "step": 259, "batch_size": 64, "mean": 41.544677734375, "std": 49.04655456542969, "min": -60.50257873535156, "p10": -28.878215789794904, "median": 49.23664665222168, "p90": 102.45923461914063, "max": 128.90969848632812, "pos_frac": 0.78125, "sample": [-2.027069091796875, -58.906768798828125, -60.42578125, 76.10578918457031, 44.81744384765625, 80.15982055664062, 97.35655212402344, 96.40028381347656, 54.971092224121094, -60.50257873535156, 63.82133483886719, -2.0494766235351562, 29.303308486938477, 101.45550537109375, 64.66783142089844, -5.944122314453125, -36.760643005371094, 4.434417724609375, 113.73843383789062, 31.439987182617188, 48.68929672241211, 78.28846740722656, 90.44105529785156, 96.89469909667969, 59.183937072753906, -8.26126480102539, -49.17076110839844, 18.227310180664062, 13.433204650878906, 13.120607376098633, 77.88003540039062, 68.76884460449219, -6.889217376708984, 24.986900329589844, 62.267242431640625, 49.78399658203125, 123.3341293334961, -10.485885620117188, 81.52952575683594, 83.88999938964844, 102.889404296875, 51.43416213989258, 12.554580688476562, 128.90969848632812, 10.507865905761719, 5.88714599609375, -37.66082763671875, -6.156499862670898, -54.81245422363281, 3.7362213134765625, 118.97035217285156, 103.76416015625, 76.059326171875, 59.795501708984375, 59.419677734375, 66.0932388305664, 36.018218994140625, 33.935462951660156, 14.72735595703125, 38.99090576171875, 72.36451721191406, 105.99890899658203, 59.230751037597656, 48.23420715332031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000259.npy"} +{"epoch": 0.3915343915343915, "step": 260, "batch_size": 64, "mean": 33.04047393798828, "std": 50.7944221496582, "min": -81.30026245117188, "p10": -32.55564918518066, "median": 27.79305076599121, "p90": 100.43629531860353, "max": 110.33708190917969, "pos_frac": 0.703125, "sample": [101.49856567382812, -42.155609130859375, 80.53623962402344, -23.291576385498047, 1.7502326965332031, 110.33708190917969, 43.17655944824219, 30.20813751220703, 104.00495910644531, -50.550872802734375, 92.73338317871094, 64.49345397949219, 87.87565612792969, 68.78898620605469, 83.02157592773438, -34.91072463989258, 96.82489013671875, 65.79576873779297, 22.044126510620117, 109.08332824707031, 78.70267486572266, 3.9931488037109375, 101.64160919189453, 104.24085235595703, -9.185508728027344, 25.37796401977539, 88.48435974121094, 97.9576644897461, 0.48828125, -12.401138305664062, 14.752265930175781, 20.600296020507812, 96.5309829711914, 35.021270751953125, -0.5268306732177734, 42.014766693115234, 24.98326873779297, -22.560317993164062, -81.30026245117188, 22.88262176513672, 3.841470718383789, 60.6868896484375, -1.1618976593017578, -4.577117919921875, 16.02233123779297, 48.665626525878906, 107.7962875366211, -17.728477478027344, 95.92575073242188, -18.590682983398438, -49.775779724121094, 50.08324432373047, 35.24437713623047, 11.46533203125, 73.9079360961914, 52.950462341308594, -15.64208984375, 73.18568420410156, 82.23583984375, -30.90764617919922, 0.07440567016601562, -65.75353240966797, -33.26193618774414, -3.0582962036132812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000260.npy"} +{"epoch": 0.3930461073318216, "step": 261, "batch_size": 64, "mean": 28.170169830322266, "std": 44.352500915527344, "min": -56.51527404785156, "p10": -23.45346984863281, "median": 21.256797790527344, "p90": 96.03213958740236, "max": 114.84336853027344, "pos_frac": 0.71875, "sample": [1.1423530578613281, 21.163650512695312, 32.0806884765625, 0.2794933319091797, -20.660903930664062, 58.11249542236328, -2.5257644653320312, 102.93252563476562, 25.57470703125, -4.055673599243164, -24.650283813476562, -17.169692993164062, -7.7758636474609375, 103.51582336425781, 64.36270141601562, -15.006118774414062, -1.3686752319335938, 114.84336853027344, 7.218545913696289, 99.112060546875, 8.079666137695312, 25.173721313476562, -12.279666900634766, -44.518768310546875, 96.90463256835938, 58.70728302001953, 114.22750091552734, 41.445865631103516, -4.295127868652344, 35.55790710449219, 49.681583404541016, 73.15457153320312, 49.04289245605469, 93.99632263183594, 38.768287658691406, 10.087175369262695, 99.01531982421875, -51.23333740234375, -30.562965393066406, 65.08443450927734, 45.30872344970703, 10.500600814819336, 76.2177505493164, 65.2002944946289, 13.224067687988281, -56.51527404785156, 2.4653873443603516, -35.288726806640625, -39.713134765625, 11.005542755126953, 26.000259399414062, -7.460601806640625, 75.52053833007812, 89.4930419921875, 14.987655639648438, -16.493507385253906, 38.70820236206055, 21.349945068359375, 0.70703125, 92.72123718261719, 17.566925048828125, 77.67512512207031, 25.685577392578125, 0.8613910675048828], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000261.npy"} +{"epoch": 0.3945578231292517, "step": 262, "batch_size": 64, "mean": 27.859447479248047, "std": 42.421966552734375, "min": -62.416847229003906, "p10": -24.461809158325195, "median": 25.483367919921875, "p90": 84.98135986328126, "max": 111.70481872558594, "pos_frac": 0.734375, "sample": [-36.99131774902344, 43.95825958251953, 20.534339904785156, -0.8877658843994141, 8.573654174804688, 81.88783264160156, 7.936798095703125, 2.952545166015625, 29.34685516357422, 91.74382781982422, -13.64358139038086, 70.0941390991211, -38.103729248046875, 4.558122634887695, 60.310001373291016, -43.76231002807617, 30.3106632232666, 86.39533996582031, 58.56707763671875, 53.683841705322266, -62.416847229003906, -2.4140281677246094, 7.387565612792969, -1.1284637451171875, 24.489952087402344, 77.62576293945312, 9.7325439453125, 111.70481872558594, -43.372955322265625, 6.81220817565918, 85.79563903808594, 53.72966766357422, 31.157913208007812, 74.34378051757812, -19.087806701660156, 96.59159088134766, 5.09111213684082, 31.46927261352539, 110.60110473632812, 5.660087585449219, -16.463407516479492, -13.19903564453125, -22.877033233642578, 53.25946044921875, 65.71743774414062, 39.137176513671875, 43.694175720214844, 9.805925369262695, -37.91267395019531, 27.334583282470703, 61.273590087890625, 0.33740997314453125, 76.15495300292969, -1.2778797149658203, 31.049795150756836, 26.476783752441406, 73.58242797851562, 90.52249145507812, 5.02093505859375, 83.08137512207031, 20.24401092529297, -9.529533386230469, 81.47518157958984, -25.14099884033203], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000262.npy"} +{"epoch": 0.3960695389266818, "step": 263, "batch_size": 64, "mean": 25.826818466186523, "std": 43.09117889404297, "min": -86.85318756103516, "p10": -18.12960739135742, "median": 22.76093292236328, "p90": 77.79038848876954, "max": 105.97714233398438, "pos_frac": 0.6875, "sample": [37.59395217895508, 60.55476760864258, -34.34923553466797, -15.874252319335938, -7.797983169555664, -6.398139953613281, 73.5745849609375, -3.9489288330078125, 75.6895751953125, 76.43794250488281, 46.51922607421875, 4.686239242553711, -14.328994750976562, 46.6013069152832, 3.1878509521484375, -55.56724548339844, 76.91744995117188, -6.808837890625, 25.374847412109375, -10.503211975097656, 54.774261474609375, 78.16450500488281, 99.69894409179688, 16.682636260986328, 15.5045166015625, 3.3804092407226562, 82.64165496826172, 44.115325927734375, 79.2918930053711, 64.27079772949219, 101.0164794921875, 21.842178344726562, -18.515472412109375, 19.046463012695312, -11.029422760009766, 29.662811279296875, -79.841796875, 76.19340515136719, 33.42639923095703, 75.94279479980469, 23.6796875, -11.372856140136719, -17.22925567626953, 75.70752716064453, -28.130340576171875, -3.2401123046875, 30.849502563476562, 76.20320892333984, 55.913429260253906, 15.222274780273438, 6.6870269775390625, 105.97714233398438, -4.4983367919921875, 4.197223663330078, 37.05645751953125, -7.575414657592773, 28.370269775390625, 70.40287780761719, 20.199520111083984, -22.57265281677246, 8.944107055664062, -86.85318756103516, 88.26705932617188, 28.88146209716797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000263.npy"} +{"epoch": 0.3975812547241119, "step": 264, "batch_size": 64, "mean": 30.485029220581055, "std": 47.556827545166016, "min": -88.39399719238281, "p10": -25.53769378662109, "median": 24.92467498779297, "p90": 96.46225738525393, "max": 127.18118286132812, "pos_frac": 0.734375, "sample": [55.48304748535156, -24.076095581054688, 18.24298858642578, 1.2161846160888672, 1.7931900024414062, -11.313364028930664, 3.1642608642578125, 1.5814895629882812, 83.07818603515625, 21.782943725585938, -40.433265686035156, 5.331016540527344, -88.39399719238281, 64.16068267822266, -19.25336456298828, 48.50273132324219, 56.80369567871094, 48.97355651855469, 8.575782775878906, 101.82246398925781, 77.07147979736328, 51.52359390258789, 79.19676208496094, 43.54412841796875, 54.448760986328125, 113.06777954101562, -1.1844310760498047, 24.976394653320312, -7.1735992431640625, 51.86882019042969, 15.780380249023438, -9.674354553222656, 89.7166976928711, 5.2395477294921875, -13.426227569580078, 24.872955322265625, 106.0062026977539, -18.569374084472656, 67.6181411743164, 98.76524353027344, -26.164093017578125, -18.100311279296875, 26.61444854736328, 118.10893249511719, 64.5420913696289, 79.4447021484375, -59.71148681640625, 62.649749755859375, -36.85398864746094, 3.202392578125, -42.30096435546875, 6.955863952636719, 109.78056335449219, 44.933231353759766, 49.43271255493164, -32.7206916809082, 22.73505401611328, 59.471282958984375, 29.393630981445312, -1.2023162841796875, 8.125091552734375, 127.18118286132812, 73.72511291503906, 91.088623046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000264.npy"} +{"epoch": 0.39909297052154197, "step": 265, "batch_size": 64, "mean": 32.10042190551758, "std": 53.8140983581543, "min": -95.24935913085938, "p10": -35.356951141357406, "median": 27.436251640319824, "p90": 102.85817260742188, "max": 113.84188842773438, "pos_frac": 0.75, "sample": [12.164077758789062, 2.7096385955810547, 4.295951843261719, -42.01617431640625, 10.764612197875977, -8.087669372558594, 49.75928497314453, 28.867530822753906, -64.00178527832031, 102.57025146484375, 27.497920989990234, 0.959259033203125, 50.55677795410156, 47.20634460449219, -95.24935913085938, -19.818763732910156, 46.706336975097656, 4.1529693603515625, 27.374582290649414, -85.78532409667969, 22.71396255493164, 102.9815673828125, 95.33365631103516, 20.116483688354492, 3.744600296020508, -7.352519989013672, 79.94661712646484, -2.4400558471679688, 32.896240234375, 3.7086849212646484, 109.68817138671875, 113.84188842773438, -14.869277954101562, 99.32561492919922, 72.46481323242188, 106.70563507080078, 6.111234664916992, 20.947521209716797, -0.8762664794921875, -19.463401794433594, 39.27970886230469, 89.37043762207031, 91.5687484741211, 106.6294937133789, 95.67169952392578, 76.91120910644531, 108.78123474121094, 40.72877502441406, 16.301864624023438, -48.67298889160156, 24.384506225585938, 47.0283203125, -18.203487396240234, 101.61831665039062, 98.18301391601562, 96.17613220214844, 105.97938537597656, -69.3409423828125, 44.524452209472656, -8.120929718017578, 62.534095764160156, 6.275444030761719, 72.1312026977539, -71.46420288085938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000265.npy"} +{"epoch": 0.40060468631897206, "step": 266, "batch_size": 64, "mean": 31.350914001464844, "std": 47.237945556640625, "min": -99.0143051147461, "p10": -16.806063461303708, "median": 19.32813262939453, "p90": 98.15975494384766, "max": 133.63766479492188, "pos_frac": 0.75, "sample": [-17.653213500976562, 98.83920288085938, 97.47700500488281, 9.609010696411133, 50.879615783691406, -1.356557846069336, -1.1564407348632812, -35.847625732421875, 7.846574783325195, 42.53559875488281, 35.75840377807617, 9.700408935546875, 7.9921722412109375, 53.654388427734375, 72.35990142822266, 59.8383903503418, 5.24853515625, 133.63766479492188, -14.82938003540039, -9.309173583984375, 104.83418273925781, 16.732070922851562, 4.3491973876953125, 99.7846908569336, 45.43585968017578, 118.94044494628906, -3.6565704345703125, 98.45236206054688, 53.79057312011719, -20.681106567382812, 88.93346405029297, 27.81121826171875, 96.5713119506836, -9.395553588867188, 44.150779724121094, -12.076499938964844, 42.24909973144531, 72.12875366210938, 86.88676452636719, 0.23592758178710938, 2.5628585815429688, -34.15757751464844, -32.19252014160156, 8.61142349243164, -99.0143051147461, 10.464935302734375, 18.118545532226562, 21.684112548828125, 37.201515197753906, 57.081932067871094, -63.547264099121094, 9.683492660522461, -4.72216796875, 20.5377197265625, 91.09488677978516, 51.22832107543945, 114.90058135986328, -10.429523468017578, 54.49413299560547, 10.374740600585938, 76.78944396972656, 8.336935043334961, 90.70549011230469, 5.949489593505859], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000266.npy"} +{"epoch": 0.4021164021164021, "step": 267, "batch_size": 64, "mean": 24.608699798583984, "std": 50.22145462036133, "min": -109.30638122558594, "p10": -28.850992393493648, "median": 19.572982788085938, "p90": 92.36011505126956, "max": 114.67431640625, "pos_frac": 0.6875, "sample": [70.52412414550781, 4.403493881225586, 5.419643402099609, -84.93344116210938, 8.257369995117188, -25.296100616455078, 72.11512756347656, 103.51573181152344, 70.08998107910156, 4.915245056152344, -13.963773727416992, 57.38410949707031, 2.569721221923828, 114.58777618408203, 7.408927917480469, -53.10151672363281, 32.121551513671875, -59.263370513916016, -11.351806640625, -88.19442749023438, -30.3745174407959, -24.435150146484375, -2.2254714965820312, 60.23755645751953, 73.10987854003906, 96.80001831054688, -1.144989013671875, 18.13461685180664, 81.83099365234375, -16.910362243652344, 34.547630310058594, 1.437051773071289, 86.18325805664062, 65.0660400390625, -20.090126037597656, 23.83298110961914, 39.310325622558594, -13.795623779296875, 4.4792633056640625, 114.67431640625, 30.914154052734375, -0.05609321594238281, 103.94134521484375, -3.471080780029297, 84.74382781982422, 61.18606185913086, 94.95380401611328, 25.00621795654297, -109.30638122558594, 86.30817413330078, 42.46636199951172, -36.40716552734375, -2.4834442138671875, 21.011348724365234, 9.11328125, 6.965724945068359, 63.91171646118164, 55.88172912597656, 96.37199401855469, 38.21897888183594, 9.500530242919922, 66.79122924804688, 23.667030334472656, -2.148651123046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000267.npy"} +{"epoch": 0.4036281179138322, "step": 268, "batch_size": 64, "mean": 28.344114303588867, "std": 41.492061614990234, "min": -63.73664855957031, "p10": -12.35407848358154, "median": 15.022745132446289, "p90": 90.34244232177734, "max": 127.72628784179688, "pos_frac": 0.75, "sample": [13.63995361328125, 110.60306549072266, 1.1234016418457031, -5.803131103515625, 65.87480163574219, 96.1392593383789, 27.023040771484375, -1.7196502685546875, -13.644229888916016, 24.702533721923828, 86.84439086914062, 0.8701171875, 0.021310806274414062, 5.871929168701172, 13.581321716308594, 14.016227722167969, 33.121864318847656, -21.736892700195312, -0.8952865600585938, 89.89021301269531, 71.67570495605469, 90.5362548828125, -3.378377914428711, 1.3631134033203125, -13.847633361816406, 30.332733154296875, 15.155776977539062, 67.34512329101562, 24.103851318359375, -4.1494598388671875, 82.13703918457031, 7.240055084228516, 19.311702728271484, 18.050552368164062, -17.807403564453125, 74.93246459960938, -6.185523986816406, -16.337940216064453, -49.287384033203125, 14.889713287353516, 59.558502197265625, 8.515253067016602, 2.8381881713867188, 77.58261108398438, 70.19771575927734, 34.76622009277344, 102.86874389648438, -9.343725204467773, 11.252105712890625, -63.73664855957031, -5.0567626953125, -6.407814025878906, 48.51202392578125, 1.4213809967041016, 127.72628784179688, 59.97892761230469, 18.047988891601562, 31.685684204101562, 99.14540100097656, 35.36063003540039, 1.1662425994873047, 113.0885009765625, 44.96799087524414, 4.283203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000268.npy"} +{"epoch": 0.4051398337112623, "step": 269, "batch_size": 64, "mean": 33.835933685302734, "std": 45.128963470458984, "min": -90.38407897949219, "p10": -7.07512092590332, "median": 20.007545471191406, "p90": 96.3263038635254, "max": 125.6972885131836, "pos_frac": 0.796875, "sample": [-4.35400390625, -28.564743041992188, 13.946670532226562, 82.20419311523438, 52.818634033203125, -7.204891204833984, 20.295852661132812, 93.79366302490234, 15.029670715332031, -6.7723236083984375, -13.493911743164062, 23.623626708984375, 53.7984619140625, 38.863868713378906, 97.33927917480469, 79.73158264160156, 0.4729499816894531, 41.95946502685547, 125.6972885131836, -65.59156036376953, 19.71923828125, 3.229217529296875, 89.41205596923828, 13.91522216796875, 12.53570556640625, 96.64447021484375, -20.175546646118164, 121.05987548828125, 45.58134460449219, 95.58391571044922, 18.497045516967773, 13.177398681640625, -6.130147933959961, 55.061492919921875, 7.6606292724609375, 3.9177303314208984, 6.330829620361328, 39.40217590332031, -1.592437744140625, 94.02144622802734, 98.65777587890625, 55.28030776977539, 21.73542022705078, 9.26394271850586, 91.70134735107422, -19.175399780273438, 49.211647033691406, 16.201522827148438, 1.0252532958984375, 2.7590789794921875, 118.226806640625, -0.4288368225097656, 109.62968444824219, 15.980499267578125, -0.33402252197265625, -90.38407897949219, 5.900787353515625, 67.78549194335938, 27.527496337890625, 56.83671569824219, 70.96244049072266, 26.905868530273438, 90.98245239257812, 17.802059173583984], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000269.npy"} +{"epoch": 0.40665154950869237, "step": 270, "batch_size": 64, "mean": 27.584157943725586, "std": 44.98433303833008, "min": -91.86714172363281, "p10": -11.742106628417966, "median": 21.551910400390625, "p90": 92.73197021484377, "max": 115.26485443115234, "pos_frac": 0.78125, "sample": [45.63861083984375, 102.87161254882812, -9.290771484375, 111.28662109375, 36.32966232299805, 106.82684326171875, 14.399618148803711, 28.247669219970703, 56.127044677734375, 19.827041625976562, 115.26485443115234, 78.76073455810547, 26.336585998535156, 71.14871978759766, 4.294410705566406, -35.18620300292969, 37.46598815917969, 63.737030029296875, 11.915576934814453, 63.48670959472656, 23.500137329101562, 62.0179443359375, 8.518272399902344, -41.39388656616211, 4.948280334472656, 13.438644409179688, 77.09159851074219, -80.75173950195312, 19.63424301147461, 11.63735580444336, 26.55816650390625, 23.276779174804688, 7.793983459472656, 54.31768035888672, -0.33984375, 8.459148406982422, 97.02310943603516, -12.792678833007812, 16.74178695678711, -91.86714172363281, 109.367431640625, 74.18628692626953, 75.517822265625, -5.469987869262695, 15.76559829711914, 42.260520935058594, -3.7106857299804688, 3.659332275390625, 88.44437408447266, 46.6810302734375, 94.56951141357422, 0.7122421264648438, -28.430648803710938, 46.13896179199219, 3.09222412109375, -6.490211486816406, -1.3281478881835938, -82.01525115966797, 44.1431884765625, 9.365768432617188, 31.08447265625, -3.7019577026367188, 9.264823913574219, 24.979278564453125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000270.npy"} +{"epoch": 0.40816326530612246, "step": 271, "batch_size": 64, "mean": 22.469223022460938, "std": 53.712581634521484, "min": -78.07442474365234, "p10": -29.810458946228025, "median": 6.9714460372924805, "p90": 99.51278686523438, "max": 163.72747802734375, "pos_frac": 0.640625, "sample": [25.351943969726562, 40.735107421875, -10.399658203125, 1.1902618408203125, 105.66289520263672, 93.28572082519531, 13.684967041015625, 3.5036373138427734, 99.72702026367188, -30.251312255859375, 65.59033203125, -10.931493759155273, 133.88848876953125, -22.98149871826172, 49.187744140625, 96.34114074707031, 3.0151424407958984, -20.076309204101562, 2.8854846954345703, 113.54109191894531, 11.415168762207031, 7.176990509033203, 85.53730773925781, -14.469476699829102, -20.289093017578125, 0.52886962890625, -14.426132202148438, 56.324676513671875, -9.188400268554688, -28.781801223754883, 6.765901565551758, 68.00827026367188, 12.0501708984375, -72.58016967773438, -3.4139404296875, 97.06708526611328, 18.094379425048828, 2.8797378540039062, 88.19168090820312, 97.90533447265625, 2.5837554931640625, -56.44603729248047, 163.72747802734375, -43.44835662841797, -10.93194580078125, 27.323272705078125, -4.585849761962891, -78.07442474365234, -68.10521697998047, 7.417152404785156, 12.191059112548828, -22.67249298095703, 99.01290893554688, 100.78451538085938, 59.26275634765625, 3.97088623046875, -39.65960693359375, 47.91712188720703, -3.1722946166992188, 10.040897369384766, -17.699617385864258, -19.565292358398438, 116.66571044921875, 9.746742248535156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000271.npy"} +{"epoch": 0.40967498110355255, "step": 272, "batch_size": 64, "mean": 41.11281204223633, "std": 41.209903717041016, "min": -65.44352722167969, "p10": -4.301744842529297, "median": 41.97307205200195, "p90": 106.59646301269532, "max": 115.42097473144531, "pos_frac": 0.84375, "sample": [18.40050506591797, -3.9478683471679688, -15.197616577148438, 62.94234848022461, 44.161155700683594, 109.313232421875, 32.975830078125, 83.56237030029297, 113.34290313720703, 15.326675415039062, 72.03873443603516, 45.47536087036133, 20.75200653076172, -4.262336730957031, 56.956817626953125, 38.25251770019531, 59.41119384765625, 5.97747802734375, 58.156341552734375, 55.85847854614258, 94.88847351074219, 13.063003540039062, 71.36830139160156, 54.13340759277344, 115.42097473144531, 12.722297668457031, 46.50189971923828, -33.847923278808594, 9.113388061523438, 105.44429779052734, 50.320274353027344, 111.48143005371094, 74.4564208984375, 0.36801719665527344, 61.53459930419922, 12.515460968017578, 7.452411651611328, 1.2379570007324219, 34.240966796875, -65.44352722167969, 75.09754180908203, 110.68750762939453, 114.87506866455078, 39.78498840332031, 2.7763290405273438, 15.124469757080078, 81.43757629394531, 62.69055938720703, 62.22636795043945, 72.16814422607422, 33.22615051269531, 80.79873657226562, -19.172988891601562, -4.318634033203125, 5.631996154785156, 38.106536865234375, 49.744850158691406, 56.016510009765625, -12.626544952392578, -1.2855186462402344, -6.965089797973633, 5.4415130615234375, 107.09024810791016, 16.19523811340332], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000272.npy"} +{"epoch": 0.41118669690098264, "step": 273, "batch_size": 64, "mean": 30.509675979614258, "std": 55.367435455322266, "min": -105.77188110351562, "p10": -38.564067840576165, "median": 30.4300594329834, "p90": 93.18349685668946, "max": 168.49496459960938, "pos_frac": 0.75, "sample": [0.09842681884765625, 45.22832489013672, 90.22552490234375, -40.424888610839844, 87.340576171875, -21.523765563964844, -52.662841796875, 74.0242919921875, -68.61579895019531, 41.31230163574219, 51.18876647949219, -34.22215270996094, 40.74199676513672, -2.668203353881836, 16.11975860595703, 26.700199127197266, 102.25786590576172, 16.90314483642578, 92.43929290771484, 71.8907699584961, 82.07128143310547, 11.49539566040039, -1.6659202575683594, -9.978191375732422, -105.77188110351562, 80.0672836303711, 49.2999267578125, 4.124076843261719, -24.904794692993164, 4.651432037353516, 55.94842529296875, 168.49496459960938, 93.50244140625, -91.23666381835938, 6.4886932373046875, 56.59745788574219, 64.26741027832031, 57.102848052978516, 3.4998855590820312, 81.709716796875, -59.076393127441406, 34.15991973876953, 76.03496551513672, -11.268302917480469, 40.333126068115234, 154.07862854003906, 114.5635757446289, 60.46165466308594, 15.880218505859375, 62.58034133911133, 0.06444740295410156, 21.21894073486328, 1.479940414428711, -15.960235595703125, 17.43795394897461, 106.95613861083984, 1.651458740234375, 43.098960876464844, 22.465099334716797, -20.948875427246094, 74.83416748046875, 108.7401351928711, -68.32022094726562, 50.036102294921875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000273.npy"} +{"epoch": 0.4126984126984127, "step": 274, "batch_size": 64, "mean": 33.16278076171875, "std": 52.246578216552734, "min": -98.51477813720703, "p10": -27.132769584655758, "median": 28.860288619995117, "p90": 105.1793167114258, "max": 125.27327728271484, "pos_frac": 0.765625, "sample": [43.45452117919922, -27.912841796875, -9.042137145996094, 3.6413421630859375, -14.012420654296875, -74.81736755371094, 91.27110290527344, 97.8341064453125, 22.18976593017578, 10.642667770385742, 57.677040100097656, 86.78734588623047, 0.769561767578125, -18.61444091796875, 54.13678741455078, 112.94593811035156, 108.93173217773438, -67.28982543945312, 7.489109039306641, 26.85822105407715, 102.16319274902344, 93.51683044433594, 51.10603713989258, 98.87806701660156, 57.18629455566406, 2.7993831634521484, 106.38037872314453, 107.96115112304688, 33.30779266357422, 8.5228271484375, 6.955226898193359, 11.186065673828125, 82.84698486328125, -1.054351806640625, -12.403055191040039, 51.179649353027344, -55.541786193847656, -28.76793670654297, 84.66663360595703, 4.181396484375, -25.31260108947754, 45.1085205078125, 19.270679473876953, 28.083480834960938, -10.902566909790039, 34.24481201171875, 27.849945068359375, -98.51477813720703, 34.5621337890625, 29.637096405029297, 107.39661407470703, 88.18991088867188, 4.122280120849609, 32.74336242675781, 12.802688598632812, -17.396257400512695, -54.0312385559082, 12.179370880126953, 109.60215759277344, 102.37683868408203, 68.01272583007812, 39.248085021972656, 125.27327728271484, 89.86036682128906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000274.npy"} +{"epoch": 0.41421012849584277, "step": 275, "batch_size": 64, "mean": 33.73168182373047, "std": 45.6679801940918, "min": -91.94196319580078, "p10": -16.007207679748525, "median": 26.09314727783203, "p90": 103.7429397583008, "max": 125.52397918701172, "pos_frac": 0.796875, "sample": [36.587127685546875, 22.59372901916504, -26.128684997558594, 52.871788024902344, 96.93761444091797, 19.208282470703125, 42.9019775390625, -91.94196319580078, 109.32520294189453, 87.8760986328125, 11.805084228515625, 14.168258666992188, -0.9234085083007812, 107.97677612304688, -2.6457767486572266, 4.522449493408203, 82.210205078125, 47.8952522277832, 93.530517578125, -24.613319396972656, -79.9320068359375, 112.95701599121094, 8.764602661132812, 10.189720153808594, 59.372108459472656, 2.359375, -26.49441146850586, 5.620536804199219, 3.174915313720703, 17.593780517578125, 38.72596740722656, 125.52397918701172, 22.716087341308594, 36.650726318359375, 106.65950775146484, 44.534423828125, 60.22370910644531, 22.53316307067871, -3.3710784912109375, -5.158653259277344, 35.98789978027344, 6.3500518798828125, 29.47020721435547, 1.1084785461425781, 10.494569778442383, 112.47368621826172, 55.09916687011719, 79.78612518310547, -21.742019653320312, 53.59934616088867, 5.588077545166016, 11.281562805175781, -5.359579086303711, 17.00933837890625, 106.68817901611328, 91.45638275146484, -7.391994476318359, 61.753334045410156, 55.687408447265625, 82.97254180908203, 44.91344451904297, 35.12347412109375, -19.69944190979004, 69.3766860961914], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000275.npy"} +{"epoch": 0.41572184429327286, "step": 276, "batch_size": 64, "mean": 32.57639694213867, "std": 43.78650665283203, "min": -70.2720718383789, "p10": -10.684268951416014, "median": 23.671632766723633, "p90": 94.62132110595705, "max": 122.02627563476562, "pos_frac": 0.828125, "sample": [91.34111785888672, 8.944381713867188, 7.740137100219727, 48.43505096435547, 8.276285171508789, 17.374977111816406, 122.02627563476562, -54.70494842529297, 50.8905143737793, 13.054792404174805, 17.703258514404297, 21.526391983032227, 41.86189270019531, 62.115325927734375, -11.225997924804688, 108.17402648925781, -1.6324539184570312, 4.687858581542969, 20.034042358398438, 3.004383087158203, 30.630313873291016, 78.71186065673828, 82.6581039428711, 114.34933471679688, 20.268142700195312, -54.20416259765625, 72.79077911376953, -14.622261047363281, 42.672157287597656, 96.0271224975586, 8.495128631591797, 15.805374145507812, -25.267372131347656, -70.2720718383789, 66.88906860351562, -9.076141357421875, 78.52307891845703, 0.28995513916015625, 39.1044921875, 65.26789855957031, -62.20832824707031, 27.75933837890625, 105.53604125976562, 2.001861572265625, -8.470458984375, 23.157257080078125, 83.80457305908203, 41.16691589355469, 84.72438049316406, 40.59266662597656, -9.420234680175781, 6.2932281494140625, 12.737876892089844, 24.18600845336914, 22.4832763671875, 116.8704833984375, 101.57649993896484, 47.28053665161133, 44.377769470214844, 47.15087127685547, 16.547014236450195, 54.673370361328125, 42.31301498413086, 1.0872268676757812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000276.npy"} +{"epoch": 0.41723356009070295, "step": 277, "batch_size": 64, "mean": 18.530241012573242, "std": 46.672607421875, "min": -83.49005126953125, "p10": -35.07578048706054, "median": 13.974435806274414, "p90": 81.98902816772461, "max": 122.80328369140625, "pos_frac": 0.640625, "sample": [81.34347534179688, -69.76103210449219, 71.30762481689453, -0.28905487060546875, 62.51214599609375, -53.954532623291016, 15.89498519897461, 17.51715087890625, 82.26569366455078, 20.758331298828125, -30.60681915283203, -12.739524841308594, 19.281692504882812, 0.6240692138671875, -23.564132690429688, 34.43791961669922, 28.77094841003418, -5.5172882080078125, 4.597930908203125, 22.057994842529297, 43.55181884765625, 44.352073669433594, 6.420753479003906, 12.053886413574219, -7.663616180419922, -9.4140625, -11.217857360839844, -36.00847625732422, -16.370010375976562, 78.6702880859375, 0.35330772399902344, 19.684906005859375, -32.89949035644531, 93.99919128417969, 28.944128036499023, 84.74874877929688, -18.56658935546875, -68.71208953857422, 44.22944641113281, 34.516658782958984, -1.6727142333984375, -43.89901351928711, 87.906005859375, 70.80596923828125, 31.164306640625, 10.547523498535156, -14.058753967285156, 56.33765411376953, -66.10871124267578, 122.80328369140625, 52.93705749511719, -19.712732315063477, 101.7462158203125, 44.52104187011719, -7.549552917480469, 1.3102989196777344, 78.49024963378906, -83.49005126953125, 72.11663818359375, 107.83554077148438, -26.902671813964844, 8.595714569091797, 0.44838523864746094, 46.15312957763672], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000277.npy"} +{"epoch": 0.41874527588813304, "step": 278, "batch_size": 64, "mean": 33.54290771484375, "std": 49.240379333496094, "min": -87.10670471191406, "p10": -22.008595848083495, "median": 30.127193450927734, "p90": 104.049609375, "max": 128.1458282470703, "pos_frac": 0.796875, "sample": [-22.72905921936035, -58.67681884765625, 81.31231689453125, 48.72001647949219, 4.1375885009765625, -5.375724792480469, -87.10670471191406, 32.51899719238281, 113.46161651611328, 128.1458282470703, 26.505691528320312, 0.9887237548828125, 103.34517669677734, 104.35150909423828, 30.816505432128906, -10.026365280151367, 20.50381088256836, 66.84365844726562, 64.56558227539062, 70.77908325195312, 50.61650848388672, 48.849334716796875, 22.303016662597656, 7.432838439941406, -73.08259582519531, 118.77813720703125, -31.932357788085938, 82.45989990234375, 35.4168701171875, 11.587188720703125, 14.393077850341797, 53.22541046142578, -9.54107666015625, -20.3275146484375, 71.26541137695312, 10.580223083496094, 88.55210876464844, 29.437881469726562, 59.775455474853516, 66.29474639892578, 108.31266021728516, 119.71571350097656, -10.65170669555664, 59.18913269042969, 39.268821716308594, 34.52881622314453, 12.358062744140625, 4.034482955932617, -46.538963317871094, 8.640182495117188, 39.105499267578125, 79.69764709472656, -69.9188232421875, -3.9120216369628906, 9.310279846191406, 106.88272094726562, 27.665802001953125, 101.15480041503906, 41.467830657958984, 19.648773193359375, 14.683530807495117, 4.085247039794922, 80.667236328125, 18.184219360351562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000278.npy"} +{"epoch": 0.42025699168556313, "step": 279, "batch_size": 64, "mean": 43.09828567504883, "std": 43.83491516113281, "min": -78.67098999023438, "p10": -6.478665924072264, "median": 41.32652282714844, "p90": 103.00316162109375, "max": 128.8107147216797, "pos_frac": 0.84375, "sample": [-0.9430446624755859, 6.024349212646484, 117.31532287597656, 22.00494384765625, -78.67098999023438, 93.33491516113281, 17.656841278076172, -5.052299499511719, -13.362213134765625, 59.97300338745117, 21.57917022705078, 92.85584259033203, 45.137046813964844, 100.95832824707031, 52.42487716674805, 128.8107147216797, 40.857513427734375, 63.813899993896484, -26.67909812927246, 4.613086700439453, -27.81678009033203, 91.38998413085938, 46.109413146972656, 43.97724151611328, 16.170181274414062, 41.7955322265625, 26.664636611938477, -1.9449234008789062, 24.875343322753906, 79.56898498535156, 14.5626220703125, 67.86226654052734, 114.7612075805664, 27.983741760253906, -13.862884521484375, 87.21220397949219, 46.438331604003906, 53.45222473144531, -7.0899658203125, 115.10479736328125, 101.96334075927734, 13.969722747802734, 102.14956665039062, 11.967208862304688, 20.295913696289062, 38.719886779785156, 8.280597686767578, 9.111335754394531, 70.53005981445312, 104.5126953125, 63.94290542602539, -18.288970947265625, 54.5572395324707, 103.36898803710938, 2.466968536376953, 16.234695434570312, 31.26837158203125, 11.40887451171875, 84.26953125, 75.87873077392578, 72.51162719726562, 65.18467712402344, 112.16781616210938, 11.95211410522461], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000279.npy"} +{"epoch": 0.4217687074829932, "step": 280, "batch_size": 64, "mean": 45.48133087158203, "std": 43.62464141845703, "min": -22.431926727294922, "p10": -1.526358795166015, "median": 28.95522117614746, "p90": 110.5740074157715, "max": 153.95196533203125, "pos_frac": 0.859375, "sample": [76.9354248046875, 112.53738403320312, 6.908052444458008, 69.16050720214844, -4.5776824951171875, 112.34207153320312, 2.1691761016845703, -2.5041351318359375, 27.70933723449707, 75.60685729980469, 26.12451171875, 23.044700622558594, 78.37969970703125, 74.88748168945312, 103.4979248046875, 101.27816772460938, 51.328468322753906, 35.567874908447266, 100.13406372070312, 24.93195343017578, 4.870208740234375, 9.08212661743164, -0.731109619140625, -0.2466411590576172, 113.74507141113281, 70.56156921386719, 11.290760040283203, 64.7187271118164, 104.06130981445312, 153.95196533203125, 27.912731170654297, 9.8878173828125, 18.374832153320312, 59.70997619628906, 6.828014373779297, 51.088714599609375, 126.76824951171875, 4.041168212890625, 114.38408660888672, 106.44852447509766, -20.77117156982422, -22.431926727294922, -1.8671798706054688, -11.238883972167969, 50.31003952026367, 33.24374771118164, 40.17109680175781, -5.066312789916992, 29.997711181640625, 12.316574096679688, 112.9068832397461, 23.80538558959961, 21.398265838623047, 93.71393585205078, 18.739286422729492, 13.5291748046875, 31.816909790039062, 18.080810546875, 20.103647232055664, 20.12939453125, 4.767341613769531, 94.41114807128906, 105.82125854492188, 74.70811462402344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000280.npy"} +{"epoch": 0.42328042328042326, "step": 281, "batch_size": 64, "mean": 39.685516357421875, "std": 50.116275787353516, "min": -76.30277252197266, "p10": -17.347862434387203, "median": 36.89564514160156, "p90": 104.72877807617188, "max": 124.4527587890625, "pos_frac": 0.75, "sample": [-31.515010833740234, 79.43118286132812, 10.940681457519531, -2.0008087158203125, 92.36163330078125, 63.330413818359375, 30.46317481994629, 75.94265747070312, 63.029632568359375, 115.01327514648438, 26.118873596191406, 109.48380279541016, 68.06797790527344, 58.050758361816406, -11.167434692382812, 7.875307083129883, 19.006052017211914, 103.13890075683594, -4.625753402709961, 93.5427017211914, 84.28428649902344, 3.969573974609375, -13.411880493164062, 45.474830627441406, 85.68008422851562, 7.075664520263672, 10.747032165527344, -10.940998077392578, 39.261497497558594, -76.30277252197266, 12.663040161132812, 9.040332794189453, -3.0074539184570312, 37.69226837158203, 104.37559509277344, -53.183380126953125, 72.01164245605469, 124.4527587890625, 9.922569274902344, -43.573001861572266, 111.83696746826172, 75.89115905761719, 114.00199127197266, 68.58047485351562, 111.26202392578125, 36.099021911621094, 91.99282836914062, 15.719623565673828, 98.5788803100586, 47.524574279785156, -5.715667724609375, 7.3574066162109375, 104.88014221191406, -51.6651725769043, 9.149757385253906, 95.70184326171875, 93.1719970703125, -19.149749755859375, 78.69998168945312, 72.11373901367188, -11.52437973022461, -12.444517135620117, 14.125144958496094, -19.034711837768555], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000281.npy"} +{"epoch": 0.42479213907785335, "step": 282, "batch_size": 64, "mean": 36.91607666015625, "std": 54.56476974487305, "min": -84.80996704101562, "p10": -28.62924346923828, "median": 28.449417114257812, "p90": 109.96043548583985, "max": 156.40093994140625, "pos_frac": 0.703125, "sample": [25.66791534423828, -26.942283630371094, -54.742897033691406, -0.4106292724609375, 10.6190185546875, 84.48013305664062, 62.59120559692383, 14.283092498779297, -7.453041076660156, 119.03285217285156, 73.34217071533203, 99.04850769042969, 21.295900344848633, 70.84071350097656, 106.66908264160156, 38.8623046875, 119.6195068359375, 57.613521575927734, -5.26025390625, 69.41751098632812, 31.230918884277344, 32.683746337890625, -2.423654556274414, 121.6463623046875, 20.07499885559082, -5.793994903564453, -44.96551513671875, 88.46441650390625, 107.49736022949219, 19.061824798583984, -21.017398834228516, -16.440492630004883, -84.80996704101562, 102.43213653564453, 7.88609504699707, -52.028099060058594, 110.34597778320312, 15.956445693969727, -35.37324523925781, 43.18617248535156, 81.55027770996094, 92.7731704711914, 6.6990814208984375, 61.293941497802734, 109.06083679199219, 156.40093994140625, 55.95339584350586, 1.8174800872802734, -7.331611633300781, 36.55470275878906, -17.560028076171875, -17.979339599609375, -24.814559936523438, 18.141193389892578, -29.35222625732422, 133.27915954589844, 120.10023498535156, 72.94634246826172, -39.292030334472656, 19.54052734375, 47.68940734863281, 60.51390838623047, 88.66786193847656, 19.78769302368164], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000282.npy"} +{"epoch": 0.42630385487528344, "step": 283, "batch_size": 64, "mean": 32.96443557739258, "std": 54.39464569091797, "min": -94.84585571289062, "p10": -33.01968078613281, "median": 17.778154373168945, "p90": 106.3696815490723, "max": 138.8465576171875, "pos_frac": 0.78125, "sample": [116.88877868652344, -66.85150909423828, -35.16966247558594, -42.11164855957031, 65.00599670410156, 50.68264389038086, 6.4227142333984375, -4.679985046386719, 81.1236572265625, 0.5860881805419922, -15.867294311523438, 69.88047790527344, 20.043075561523438, 18.623783111572266, 99.09791564941406, 13.403057098388672, 16.932525634765625, 110.3573989868164, -33.376251220703125, 41.856781005859375, 98.25658416748047, 65.70016479492188, 82.51631927490234, 0.09946441650390625, 51.60008239746094, 109.48615264892578, 81.66307830810547, 4.412330627441406, 129.21731567382812, 12.519615173339844, 3.6128768920898438, 97.48890686035156, -66.68529510498047, 19.496810913085938, 0.9005584716796875, 74.19369506835938, -74.26290130615234, 16.47198486328125, 45.50715637207031, 93.70573425292969, 111.37312316894531, -32.18768310546875, 93.16410827636719, 91.55165100097656, 12.86605453491211, 15.619152069091797, 25.570419311523438, -94.84585571289062, 4.77973747253418, -17.022918701171875, 86.19156646728516, 7.981075286865234, 138.8465576171875, 0.7305717468261719, 94.59942626953125, 61.59876251220703, -3.7502059936523438, -10.490970611572266, 8.351091384887695, 11.322433471679688, -28.342864990234375, 118.83172607421875, 10.590850830078125, 43.64691162109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000283.npy"} +{"epoch": 0.42781557067271353, "step": 284, "batch_size": 64, "mean": 35.21404266357422, "std": 47.9246711730957, "min": -96.74362182617188, "p10": -8.08647193908691, "median": 19.7674503326416, "p90": 102.90740966796876, "max": 133.43824768066406, "pos_frac": 0.8125, "sample": [-9.209243774414062, 7.611564636230469, 40.21666717529297, 23.005264282226562, 131.037841796875, 67.04035949707031, 3.4383907318115234, -11.120941162109375, 131.97789001464844, 7.486110687255859, 0.7461967468261719, 22.12594223022461, 1.5178413391113281, -3.4114837646484375, 82.07717895507812, -13.085189819335938, 7.264593124389648, 76.6302490234375, 0.17803955078125, 104.39788818359375, 8.247268676757812, 45.28645324707031, 11.318222045898438, -19.79198455810547, -22.834983825683594, 24.276397705078125, 11.570060729980469, 17.573509216308594, 31.693859100341797, -5.466670989990234, 99.42962646484375, 53.42369842529297, 67.5229263305664, 69.1229248046875, 18.81253433227539, 15.620628356933594, 81.62709045410156, 114.55612182617188, 119.84307861328125, 10.687660217285156, 90.02869415283203, 133.43824768066406, 9.760162353515625, 3.2855873107910156, -4.109975814819336, -0.08156394958496094, 83.07208251953125, 13.90322494506836, 56.275909423828125, 94.69390869140625, 3.9757461547851562, 51.40049362182617, 95.03933715820312, 20.722366333007812, 15.843421936035156, 59.14051818847656, 128.72544860839844, 34.86268615722656, 45.07244873046875, -96.74362182617188, 59.239341735839844, -67.55167388916016, 2.8744125366210938, -1.6121902465820312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000284.npy"} +{"epoch": 0.4293272864701436, "step": 285, "batch_size": 64, "mean": 30.66926383972168, "std": 49.257694244384766, "min": -74.9166488647461, "p10": -25.26895885467529, "median": 21.741992950439453, "p90": 105.22244186401369, "max": 116.004638671875, "pos_frac": 0.71875, "sample": [34.425132751464844, 6.835746765136719, -8.6761474609375, 97.58008575439453, 13.710678100585938, -40.586429595947266, -74.9166488647461, -1.1660003662109375, 53.13692092895508, -21.275026321411133, 46.094093322753906, 109.33702087402344, 94.7732925415039, 23.510887145996094, 99.34901428222656, -41.029754638671875, 52.19164276123047, 110.63813781738281, 1.8005256652832031, 7.834522247314453, 31.038551330566406, 2.0353317260742188, -33.292598724365234, -36.568477630615234, -2.0933837890625, -62.53834533691406, -15.246124267578125, 31.526473999023438, 47.049072265625, -20.02301025390625, -20.983200073242188, 114.59190368652344, -18.261924743652344, 100.52387237548828, 79.93479919433594, 58.72932052612305, 29.66558074951172, 20.382217407226562, 64.7908935546875, 93.77957153320312, 62.14928436279297, 2.7196426391601562, 5.340232849121094, 114.74525451660156, 84.84113311767578, 22.38147735595703, 2.6032142639160156, 116.004638671875, -16.294769287109375, -3.1844749450683594, 46.748252868652344, 81.34474182128906, 13.42169189453125, 71.20892333984375, 0.1284332275390625, 38.46356201171875, 114.9327163696289, 107.23611450195312, -26.98064422607422, 15.74554443359375, 0.640167236328125, 21.102508544921875, -6.05120849609375, 64.97834777832031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000285.npy"} +{"epoch": 0.4308390022675737, "step": 286, "batch_size": 64, "mean": 48.064430236816406, "std": 50.73775863647461, "min": -56.66770935058594, "p10": -1.3829555511474587, "median": 40.15768814086914, "p90": 119.9106544494629, "max": 165.42547607421875, "pos_frac": 0.890625, "sample": [48.84828186035156, 8.013574600219727, 4.540239334106445, 41.90727233886719, 15.3338623046875, 75.25991821289062, 11.248908996582031, 1.1348514556884766, 24.86893653869629, -2.3773040771484375, 42.43238830566406, 17.233856201171875, 38.408103942871094, 98.09803771972656, 106.7038345336914, 133.88385009765625, 94.38276672363281, 53.372833251953125, -26.478485107421875, 22.079063415527344, 59.65631866455078, -23.89037322998047, 25.46993637084961, 115.93182373046875, 0.9371910095214844, -44.92698669433594, 57.77428436279297, 50.51633071899414, -22.872589111328125, 64.01907348632812, 110.78258514404297, 79.46476745605469, 106.46601867675781, 124.31874084472656, 67.52461242675781, 153.60076904296875, 30.319095611572266, 93.51341247558594, -40.55989456176758, 10.046585083007812, 122.8663330078125, 165.42547607421875, 23.2288818359375, 10.383895874023438, 64.56455993652344, 19.858322143554688, 11.360490798950195, 37.342498779296875, 120.59175872802734, 116.68061828613281, 118.3214111328125, 38.163978576660156, 34.675777435302734, 11.747259140014648, 5.245357513427734, 45.65882873535156, 76.10974884033203, 20.955982208251953, -56.66770935058594, 134.0294952392578, 58.930419921875, 10.56850814819336, 57.74134826660156, 1.353668212890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000286.npy"} +{"epoch": 0.4323507180650038, "step": 287, "batch_size": 64, "mean": 47.355857849121094, "std": 53.72928237915039, "min": -93.02908325195312, "p10": -3.5314613342285157, "median": 38.775604248046875, "p90": 120.6083236694336, "max": 146.52584838867188, "pos_frac": 0.828125, "sample": [54.71215057373047, -59.44285583496094, 12.977958679199219, 92.70211791992188, 146.52584838867188, 111.68634033203125, 16.34783935546875, 36.5372314453125, 48.20104217529297, -3.576324462890625, 50.54302978515625, 23.79629135131836, 41.01397705078125, 47.339691162109375, 127.43934631347656, 132.33279418945312, 136.97140502929688, 56.954071044921875, 105.537841796875, 67.89932250976562, 46.387939453125, 31.935516357421875, 93.26937866210938, 5.381834030151367, 10.93301010131836, 92.03619384765625, -1.3995704650878906, -35.51288604736328, 89.38239288330078, 4.355258941650391, 89.50130462646484, 13.766494750976562, -93.02908325195312, 8.980293273925781, -2.815786361694336, 95.3041000366211, 16.604270935058594, 13.265331268310547, 19.93596649169922, 101.29541015625, 79.80313873291016, -21.83039093017578, 121.9034423828125, 113.02957153320312, -22.845130920410156, 12.32666015625, 125.92405700683594, 5.422420501708984, 104.45635223388672, 102.26919555664062, -0.35513877868652344, 14.616378784179688, 77.94974517822266, 10.125329971313477, 1.2431831359863281, 19.72425079345703, 113.12239074707031, 16.627784729003906, 73.80369567871094, -14.09848403930664, -3.4267807006835938, 133.79031372070312, 117.58638000488281, 3.5298843383789062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000287.npy"} +{"epoch": 0.43386243386243384, "step": 288, "batch_size": 64, "mean": 33.36609649658203, "std": 51.90345001220703, "min": -76.92802429199219, "p10": -33.20124359130859, "median": 31.056407928466797, "p90": 105.7457862854004, "max": 141.25808715820312, "pos_frac": 0.703125, "sample": [53.722900390625, 3.2476730346679688, -36.6356201171875, -76.92802429199219, 31.69556427001953, 15.72446060180664, 28.37611198425293, -22.731178283691406, 67.89585876464844, 46.453224182128906, 18.30087661743164, 65.73228454589844, 25.88982391357422, 104.18355560302734, -28.418548583984375, 69.30892944335938, -39.13163757324219, 52.808956146240234, -16.3197021484375, 40.22300338745117, -61.42041778564453, 106.41531372070312, 141.25808715820312, 109.03268432617188, -7.794036865234375, 124.866455078125, 30.450281143188477, 63.97077178955078, 10.884239196777344, 27.299997329711914, 125.63221740722656, -51.7122802734375, 53.953948974609375, 61.29569625854492, 95.88798522949219, 55.40031051635742, 38.41206359863281, -22.606521606445312, 28.70525360107422, -31.287437438964844, -34.021446228027344, -60.07562255859375, 118.54950714111328, -1.9593048095703125, 2.0375289916992188, -16.825241088867188, 88.55811309814453, -19.445465087890625, 84.863037109375, 88.8109130859375, 87.46022033691406, 0.91351318359375, 73.09405517578125, 13.555938720703125, -7.676361083984375, -2.138683319091797, 70.7405776977539, 27.042518615722656, -0.6728954315185547, 115.07965087890625, 31.662534713745117, 79.71826171875, 40.33549499511719, 53.78036880493164], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000288.npy"} +{"epoch": 0.43537414965986393, "step": 289, "batch_size": 64, "mean": 33.762855529785156, "std": 56.94797134399414, "min": -100.21513366699219, "p10": -27.850790977478024, "median": 19.562674522399902, "p90": 112.56386032104493, "max": 172.5660400390625, "pos_frac": 0.71875, "sample": [34.19342803955078, 17.115371704101562, 93.81501770019531, -17.824758529663086, -37.69921112060547, -22.7857666015625, -8.920269012451172, 39.318809509277344, 62.464317321777344, 37.129417419433594, 3.2093429565429688, 43.92462158203125, 87.03831481933594, 100.62590026855469, 24.71051025390625, 50.57105255126953, 132.76535034179688, -44.297332763671875, 7.940517425537109, 107.1546401977539, 12.737190246582031, 118.61474609375, 4.7313995361328125, -18.56072998046875, 95.7658462524414, 13.771408081054688, 111.96928405761719, 6.905460357666016, -12.50408935546875, 121.1971435546875, -2.3409576416015625, 27.770917892456055, -21.844127655029297, -100.21513366699219, 140.7601318359375, -11.212261199951172, 7.635690689086914, 172.5660400390625, 5.957237243652344, 20.447654724121094, 0.03788566589355469, 28.394607543945312, -29.996566772460938, 18.67769432067871, 59.910858154296875, -22.84398078918457, 41.09804916381836, -3.004009246826172, -36.4451904296875, -58.457820892333984, 83.68919372558594, 29.961517333984375, 7.06903076171875, 29.326583862304688, 112.70679473876953, 105.66769409179688, 96.16848754882812, 112.2303466796875, 117.39498901367188, 5.503082275390625, 3.836292266845703, -43.46025848388672, 106.38597106933594, -7.630741119384766], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000289.npy"} +{"epoch": 0.436885865457294, "step": 290, "batch_size": 64, "mean": 38.2220573425293, "std": 56.21426773071289, "min": -89.44570922851562, "p10": -9.127553558349609, "median": 32.19342613220215, "p90": 120.6957618713379, "max": 142.92807006835938, "pos_frac": 0.796875, "sample": [56.39289474487305, 34.94158172607422, 97.91138458251953, 142.92807006835938, 36.89039611816406, 7.470220565795898, -28.67558479309082, -1.1521472930908203, 10.04437255859375, 129.01351928710938, 42.08638000488281, 32.2583122253418, 21.627288818359375, -78.88980865478516, 40.18165588378906, 11.026519775390625, 2.6055984497070312, -9.177497863769531, 2.8686866760253906, -1.9682235717773438, 48.203460693359375, 12.411094665527344, 119.53922271728516, 121.55148315429688, 11.144752502441406, 14.942192077636719, 10.749874114990234, -9.011016845703125, 12.059194564819336, -74.80140686035156, 113.69205474853516, 124.50729370117188, 97.29955291748047, 43.3388557434082, 34.32054138183594, 132.85366821289062, 113.8891372680664, 61.4530029296875, 42.635475158691406, -45.0191650390625, 95.64543151855469, 86.59471130371094, 16.985546112060547, -89.44570922851562, -0.41870880126953125, -4.0032806396484375, -2.4558658599853516, 131.36512756347656, 111.94017791748047, 104.78997802734375, 20.982364654541016, 59.916961669921875, 1.470001220703125, 16.170333862304688, -86.89117431640625, 118.14151000976562, 22.918434143066406, 121.19142150878906, 39.88340759277344, 33.23723602294922, 26.267574310302734, 32.1285400390625, 53.036346435546875, 2.618499755859375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000290.npy"} +{"epoch": 0.4383975812547241, "step": 291, "batch_size": 64, "mean": 42.50508117675781, "std": 58.740379333496094, "min": -106.98513793945312, "p10": -19.233210372924805, "median": 21.360015869140625, "p90": 120.82523727416992, "max": 213.2677001953125, "pos_frac": 0.765625, "sample": [153.00103759765625, 118.32067108154297, 0.7669525146484375, -18.949783325195312, 32.36759948730469, 19.276611328125, -11.201606750488281, 3.896411895751953, 117.88301086425781, 2.383453369140625, 89.61370849609375, 74.29238891601562, -19.354679107666016, -1.893899917602539, 82.81391906738281, 105.5988540649414, -27.27043914794922, -18.42101287841797, 23.44342041015625, 78.3460464477539, -1.604156494140625, 1.0665206909179688, 48.031402587890625, 44.48651885986328, 67.50355529785156, 104.52317810058594, 119.231689453125, 1.2090911865234375, 127.1837158203125, 5.9608154296875, 63.50055694580078, 132.94891357421875, -0.7770042419433594, 5.392127990722656, -24.202880859375, 0.1697521209716797, 86.13096618652344, 2.3772430419921875, 127.99014282226562, 10.234077453613281, -5.3110198974609375, 121.50818634033203, -106.98513793945312, 32.19678497314453, 124.49382019042969, 56.25761413574219, 58.37060546875, 107.0550537109375, 52.9501953125, 213.2677001953125, -26.098758697509766, 18.681655883789062, -16.716777801513672, 15.685829162597656, -39.51172637939453, 8.171077728271484, 15.205963134765625, 117.03826141357422, 15.025001525878906, 75.47643280029297, 99.6181640625, 66.22781372070312, 13.150924682617188, -21.701515197753906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000291.npy"} +{"epoch": 0.4399092970521542, "step": 292, "batch_size": 64, "mean": 33.248558044433594, "std": 59.916481018066406, "min": -104.39608764648438, "p10": -46.82526779174805, "median": 27.11006736755371, "p90": 107.80049514770508, "max": 180.38327026367188, "pos_frac": 0.734375, "sample": [-104.39608764648438, -9.415519714355469, 95.05673217773438, 0.8422565460205078, 126.04142761230469, 70.38557434082031, 31.164615631103516, 180.38327026367188, 83.68486785888672, -34.75044250488281, -45.43775939941406, 5.495355606079102, 19.866846084594727, 13.237052917480469, -64.36441040039062, -2.3988189697265625, 58.52508544921875, 62.60115051269531, 89.67350769042969, 26.594406127929688, 40.128517150878906, 86.95965576171875, 82.9489517211914, -70.181396484375, 1.97003173828125, 6.911308288574219, 6.662448883056641, 108.37763214111328, -55.16618347167969, 65.97116088867188, 27.011070251464844, 77.35016632080078, 7.61070442199707, -9.35601806640625, -2.4071826934814453, -77.8017349243164, 106.45384216308594, -96.823486328125, -0.9618377685546875, 10.018943786621094, -14.69232177734375, 100.31946563720703, 82.93804168701172, -7.094079971313477, 127.19049072265625, 69.79782104492188, 21.240028381347656, 78.72771453857422, 27.209064483642578, 11.036270141601562, 129.13546752929688, 81.23269653320312, 4.272619247436523, 92.05624389648438, 47.721744537353516, 10.732490539550781, 55.27980422973633, 28.462848663330078, 119.73184204101562, 37.34062957763672, 44.44854736328125, -20.28826904296875, -47.41991424560547, 130.06295776367188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000292.npy"} +{"epoch": 0.4414210128495843, "step": 293, "batch_size": 64, "mean": 48.86211013793945, "std": 61.626182556152344, "min": -120.698486328125, "p10": -15.216847229003905, "median": 39.43608856201172, "p90": 123.65052337646485, "max": 166.58050537109375, "pos_frac": 0.796875, "sample": [5.687145233154297, 26.53705596923828, 17.02170181274414, 116.97720336914062, 71.28041076660156, 30.841228485107422, 1.3017768859863281, 18.692432403564453, 68.8210678100586, 11.070465087890625, 123.82731628417969, -11.96522331237793, 123.0584716796875, 89.56916809082031, 93.56886291503906, 12.971656799316406, 102.43882751464844, 74.26676940917969, 77.45940399169922, 104.71802520751953, 79.34852600097656, -33.4869270324707, -13.510276794433594, -70.47471618652344, 96.04086303710938, 3.8023223876953125, 80.23149108886719, -34.64625930786133, 25.339820861816406, 163.42779541015625, 5.209266662597656, 141.05685424804688, 134.76412963867188, -64.80616760253906, 87.49929809570312, 3.968189239501953, 118.07740020751953, -120.698486328125, -5.959735870361328, 5.484619140625, 35.44435119628906, 127.16984558105469, -36.706424713134766, -12.319320678710938, -11.765625, 4.586799621582031, 50.17962646484375, 102.57112884521484, 166.58050537109375, 39.82627868652344, 116.58509826660156, 24.420806884765625, 64.73436737060547, 5.691204071044922, 103.66378784179688, -15.948234558105469, 116.85139465332031, 34.856903076171875, 62.70880889892578, 126.27317810058594, 39.0458984375, -7.280887603759766, 107.95574951171875, 123.23800659179688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000293.npy"} +{"epoch": 0.4429327286470144, "step": 294, "batch_size": 64, "mean": 34.70924377441406, "std": 50.52445983886719, "min": -88.18043518066406, "p10": -9.514960861206054, "median": 17.56937026977539, "p90": 117.45863494873048, "max": 171.78717041015625, "pos_frac": 0.765625, "sample": [121.26007080078125, 27.745697021484375, 43.44367980957031, 38.50506591796875, 103.94708251953125, 22.09430694580078, 127.71891784667969, -30.625381469726562, -24.74382781982422, 8.463874816894531, 40.39697265625, -88.18043518066406, -7.556913375854492, 32.449615478515625, 19.52776527404785, 97.13142395019531, 117.91004943847656, 12.036079406738281, 116.40533447265625, 26.510887145996094, -4.1432952880859375, 16.28076934814453, 3.121469497680664, 60.86802673339844, -9.655982971191406, 129.85281372070312, -9.185909271240234, 58.51385498046875, -5.614952087402344, 171.78717041015625, 90.55026245117188, -11.233882904052734, 3.583902359008789, 139.9542694091797, 16.849252700805664, 6.4128875732421875, 2.7928314208984375, -4.9974517822265625, -5.248992919921875, 25.140182495117188, 11.319908142089844, 10.06085205078125, 113.87224578857422, 0.11265182495117188, 9.145223617553711, 61.83934783935547, 47.24714660644531, 38.2588996887207, 8.290634155273438, 129.1387939453125, -17.274478912353516, 49.26987075805664, 89.44284057617188, 7.051414489746094, 18.289487838745117, 55.30632019042969, 1.8620758056640625, -4.676698684692383, 15.78900146484375, 6.0066986083984375, 76.15702056884766, -24.80685043334961, 48.10224533081055, -8.48040771484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000294.npy"} +{"epoch": 0.4444444444444444, "step": 295, "batch_size": 64, "mean": 31.628929138183594, "std": 55.0975227355957, "min": -92.05537414550781, "p10": -26.684968566894522, "median": 15.818511962890625, "p90": 107.74636154174806, "max": 161.068359375, "pos_frac": 0.703125, "sample": [127.38345336914062, 15.127029418945312, -5.8380584716796875, -10.2235107421875, 65.37162780761719, 66.24681091308594, 108.54106903076172, 23.399921417236328, 16.509994506835938, 39.02565002441406, 136.77081298828125, -5.236675262451172, 161.068359375, 20.92224884033203, 8.771564483642578, 10.995201110839844, 3.019317626953125, 11.185234069824219, -13.431930541992188, 92.43215942382812, 113.00205993652344, -70.42317199707031, -3.187732696533203, 10.77668571472168, 89.25515747070312, 25.733673095703125, 6.63267707824707, -16.889572143554688, 105.89204406738281, 1.5539932250976562, -47.22050476074219, -7.173496246337891, 133.23829650878906, 96.95196533203125, 8.993789672851562, -70.19628143310547, 93.29653930664062, 22.25748062133789, 42.900630950927734, 121.61460876464844, 68.98985290527344, -92.05537414550781, -5.5738677978515625, -30.88299560546875, 83.82521057128906, 56.497154235839844, -39.415916442871094, -12.836189270019531, -34.86573791503906, 66.08172607421875, -6.32380485534668, 7.141719818115234, 19.772903442382812, 12.52191162109375, 23.6738224029541, 10.846357345581055, 84.62016296386719, -12.687484741210938, 24.599815368652344, 4.7678680419921875, 94.89116668701172, 87.84506225585938, 93.00399017333984, -9.235118865966797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000295.npy"} +{"epoch": 0.4459561602418745, "step": 296, "batch_size": 64, "mean": 39.71464538574219, "std": 60.18115234375, "min": -108.19680786132812, "p10": -36.072994995117185, "median": 34.92073440551758, "p90": 118.8950180053711, "max": 156.81820678710938, "pos_frac": 0.796875, "sample": [56.08001708984375, 116.77687072753906, 91.38865661621094, 11.837186813354492, 0.5973739624023438, 34.22499084472656, 3.4394054412841797, 156.81820678710938, -3.250701904296875, 81.93795776367188, 28.098751068115234, 12.261241912841797, -48.357391357421875, 119.80279541015625, 6.446102142333984, 46.6158447265625, 110.37113952636719, 71.63548278808594, 13.74639892578125, 50.29679870605469, 1.9725341796875, 27.27176284790039, 5.776763916015625, -86.83615112304688, -52.08270263671875, -28.984222412109375, 3.075042724609375, 49.58647155761719, 22.995277404785156, 35.616477966308594, 45.51405334472656, -52.70749282836914, 61.35247802734375, 8.6434326171875, 151.01290893554688, 33.57354736328125, 1.9014205932617188, -33.103641510009766, 99.0502700805664, -57.84037780761719, 48.652565002441406, 70.60101318359375, 130.76742553710938, -108.19680786132812, 116.18013000488281, 54.353729248046875, 97.09597778320312, 92.38470458984375, 78.91914367675781, 80.89090728759766, 106.859130859375, 10.801620483398438, 122.998046875, 18.211271286010742, 156.13812255859375, -7.46563720703125, 7.21826171875, 131.34188842773438, -15.723487854003906, -37.01641845703125, -33.871673583984375, 90.06048583984375, 75.37838745117188, 58.60338592529297], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000296.npy"} +{"epoch": 0.4474678760393046, "step": 297, "batch_size": 64, "mean": 40.172122955322266, "std": 51.102203369140625, "min": -77.87517547607422, "p10": -10.431658935546869, "median": 28.5865535736084, "p90": 114.40265045166016, "max": 133.37359619140625, "pos_frac": 0.84375, "sample": [88.39492797851562, -37.12910461425781, 18.774269104003906, 85.1316909790039, 32.267852783203125, 32.87043762207031, 16.56024932861328, 115.59683227539062, -4.2301177978515625, -77.87517547607422, 89.65090942382812, 5.0951385498046875, 21.043216705322266, 25.769298553466797, 4.83656120300293, 123.20650482177734, 21.736557006835938, 54.9307975769043, 13.388256072998047, 3.5992431640625, 39.10798645019531, 13.279891967773438, -58.50971984863281, -51.66748809814453, -63.188636779785156, 123.96471405029297, 37.904273986816406, 8.194000244140625, 94.46060180664062, 10.695640563964844, 110.64775848388672, 128.9407501220703, -5.020416259765625, 2.8912487030029297, 21.43613052368164, 15.635213851928711, 13.208755493164062, -12.750762939453125, 92.52061462402344, 84.12996673583984, 31.40380859375, 17.36243438720703, 91.94699096679688, 32.43202209472656, 23.400070190429688, 73.08222198486328, 54.516029357910156, 0.9598016738891602, -15.6715087890625, 111.61622619628906, 21.882678985595703, 88.10745239257812, 100.35568237304688, 82.56333923339844, -1.6560020446777344, 60.938697814941406, 126.75640869140625, 65.18032836914062, 6.1180572509765625, 133.37359619140625, 0.00318145751953125, 41.0943717956543, 125.72675323486328, 60.02430725097656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000297.npy"} +{"epoch": 0.4489795918367347, "step": 298, "batch_size": 64, "mean": 31.78000259399414, "std": 59.42924880981445, "min": -109.87554931640625, "p10": -44.21075668334961, "median": 17.936220169067383, "p90": 117.1938934326172, "max": 141.83261108398438, "pos_frac": 0.734375, "sample": [25.997291564941406, -78.84192657470703, 141.83261108398438, 17.82684326171875, 128.07077026367188, 14.222366333007812, 91.20527648925781, 13.737625122070312, -61.487518310546875, 82.43924713134766, 128.19866943359375, 107.38103485107422, -44.7884521484375, -3.063079833984375, 10.578330993652344, 41.45673751831055, 82.99752807617188, -24.153900146484375, 102.01557922363281, 78.65316772460938, 3.9840660095214844, -4.088657379150391, 107.55738067626953, 45.96136474609375, 43.081146240234375, 21.598358154296875, -79.21332550048828, 16.78011131286621, 70.35894775390625, 123.60210418701172, 5.059972763061523, 128.9049530029297, -6.7509918212890625, 21.361473083496094, 28.196033477783203, 90.61708068847656, 7.852872848510742, 117.99564361572266, 7.132654190063477, 4.780952453613281, 3.82525634765625, -11.573785781860352, -11.072090148925781, 20.479736328125, 22.634918212890625, 128.75448608398438, 94.1593246459961, -6.9595947265625, -10.55228042602539, 10.70794677734375, 44.15592575073242, 14.965362548828125, -42.86280059814453, -44.86248779296875, 3.6799774169921875, 91.13484954833984, -71.02789306640625, 67.43142700195312, -13.2724609375, -109.87554931640625, 115.3231430053711, 18.045597076416016, 1.9898147583007812, 109.64087677001953], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000298.npy"} +{"epoch": 0.4504913076341648, "step": 299, "batch_size": 64, "mean": 27.498905181884766, "std": 61.069374084472656, "min": -101.54492950439453, "p10": -56.19384307861328, "median": 16.771967887878418, "p90": 110.98894500732423, "max": 155.30877685546875, "pos_frac": 0.671875, "sample": [87.54824829101562, 82.396240234375, -8.16987419128418, -18.827308654785156, 12.821443557739258, 93.410400390625, 33.00236511230469, 62.07961654663086, 155.30877685546875, -0.3511505126953125, -55.06029510498047, 61.31175231933594, -101.54492950439453, 5.466331481933594, -79.80387878417969, -17.659889221191406, 12.788848876953125, 112.25386047363281, 51.511138916015625, -56.679649353027344, 108.0374755859375, -28.228435516357422, 28.071956634521484, 65.80659484863281, -61.16792297363281, -84.02362823486328, -0.214447021484375, 14.39725112915039, 140.2506866455078, -1.8919677734375, 117.06671142578125, 6.076286315917969, 35.23998260498047, -73.37033081054688, 12.226547241210938, 20.251312255859375, 36.49237060546875, 117.56318664550781, 16.904998779296875, 10.116752624511719, 37.49089050292969, -35.86760711669922, 92.00096893310547, 87.69737243652344, 146.21568298339844, -48.13977813720703, 16.63893699645996, 100.64347076416016, 74.53323364257812, 72.63345336914062, 1.2615833282470703, 31.25989532470703, 73.198974609375, -63.527496337890625, 7.573577880859375, 87.17469787597656, -3.312713623046875, 68.202880859375, -0.8359241485595703, 7.2512969970703125, -1.561807632446289, 20.131568908691406, -53.55978012084961, 131.4191131591797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000299.npy"} +{"epoch": 0.4520030234315949, "step": 300, "batch_size": 64, "mean": 35.40083312988281, "std": 58.41526794433594, "min": -91.35420227050781, "p10": -43.28495635986328, "median": 30.557811737060547, "p90": 122.98138809204102, "max": 146.4553985595703, "pos_frac": 0.75, "sample": [24.653806686401367, 106.75408172607422, 12.117233276367188, 41.12858581542969, -1.7158546447753906, 12.797500610351562, 86.61467742919922, 12.1263427734375, 8.567018508911133, -86.03965759277344, 129.7425994873047, 29.98249053955078, 87.55201721191406, 135.62547302246094, 130.38385009765625, 70.58389282226562, 123.91850280761719, -41.65141296386719, -14.026588439941406, 57.477020263671875, 1.2235889434814453, 57.98188018798828, 31.133132934570312, -20.014930725097656, -54.33296203613281, 63.72337341308594, 93.54000854492188, -28.111221313476562, 33.648460388183594, 45.95473861694336, 5.984157562255859, -91.35420227050781, 79.742431640625, 0.5346717834472656, -60.3089599609375, 52.301692962646484, 25.564496994018555, 135.91944885253906, 16.6507568359375, 123.6025161743164, 87.26620483398438, 36.79347610473633, 4.86334228515625, 146.4553985595703, 63.611061096191406, -43.98504638671875, -0.15761947631835938, 93.14071655273438, -10.3399658203125, 72.98959350585938, 66.4771728515625, 12.893943786621094, 39.117584228515625, 49.780494689941406, -10.314933776855469, -51.005577087402344, 21.694793701171875, 112.01747131347656, 86.70120239257812, -73.70630645751953, 5.297584533691406, 6.089317321777344, 121.53208923339844, -11.533302307128906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000300.npy"} +{"epoch": 0.45351473922902497, "step": 301, "batch_size": 64, "mean": 29.857980728149414, "std": 58.31682205200195, "min": -117.35735321044922, "p10": -36.327588653564455, "median": 24.079012870788574, "p90": 114.3900650024414, "max": 194.49514770507812, "pos_frac": 0.75, "sample": [96.30667877197266, 19.93311309814453, 45.243125915527344, 26.34365463256836, 11.620040893554688, -32.45869445800781, 68.13997650146484, 123.28816223144531, 78.41645812988281, 26.65087127685547, 21.81437110900879, 19.502573013305664, 28.435806274414062, -24.343097686767578, -97.36536407470703, 35.96177673339844, 15.792633056640625, 72.42851257324219, 86.81498718261719, 5.666095733642578, -49.57904052734375, 37.77629470825195, 118.29234313964844, -10.289161682128906, 52.28398895263672, 3.368804931640625, -4.37440299987793, 113.7769775390625, 63.44694519042969, -36.65418243408203, -33.5198860168457, 27.220436096191406, 49.322689056396484, 107.20028686523438, -23.773208618164062, 3.5324935913085938, -41.0389404296875, 194.49514770507812, -45.753326416015625, 18.98495101928711, -15.451070785522461, 33.61512756347656, 32.13611602783203, -75.35546875, 6.2708740234375, 83.41563415527344, 101.87808227539062, 44.98054504394531, 14.68798828125, 114.65281677246094, 37.54498291015625, 51.451995849609375, 70.62330627441406, -22.80868911743164, -35.56553649902344, 9.656070709228516, 115.95915222167969, 120.66291046142578, 21.502639770507812, 2.7812576293945312, 4.951789855957031, -117.35735321044922, 129.66452026367188, 8.102134704589844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000301.npy"} +{"epoch": 0.455026455026455, "step": 302, "batch_size": 64, "mean": 22.624004364013672, "std": 55.73525619506836, "min": -105.64839172363281, "p10": -44.58986873626708, "median": 19.904560089111328, "p90": 94.50794372558596, "max": 170.62063598632812, "pos_frac": 0.71875, "sample": [60.97040557861328, 138.258056640625, -3.935791015625, 170.62063598632812, 32.00151062011719, 5.234735488891602, 106.81924438476562, -22.54558563232422, 132.66421508789062, 11.347763061523438, 36.69929504394531, 20.88703155517578, 9.538183212280273, 4.704944610595703, 69.98249816894531, 118.37142944335938, 3.9621047973632812, 17.80792236328125, 0.7274398803710938, 25.777236938476562, 21.867839813232422, -89.2153091430664, -80.81889343261719, 39.27912902832031, 20.048416137695312, -16.768781661987305, 38.50969696044922, 39.673561096191406, 5.118541717529297, -10.716384887695312, -21.374778747558594, 76.22654724121094, 53.808685302734375, 16.94974708557129, -29.58637046813965, 97.1343994140625, 121.72747802734375, -19.955062866210938, 2.8380279541015625, 24.857158660888672, 67.07772827148438, 84.0434341430664, 6.088878631591797, 33.17201232910156, 56.50079345703125, 40.52742004394531, -97.81817626953125, -12.283546447753906, -14.39544677734375, 19.760704040527344, 73.79275512695312, 39.53111267089844, -14.271766662597656, 3.9243316650390625, 28.253192901611328, -70.08601379394531, -51.72900390625, 88.37954711914062, -18.3609619140625, -51.01993942260742, -105.64839172363281, 17.38897705078125, 68.54959106445312, 27.06215476989746], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000302.npy"} +{"epoch": 0.4565381708238851, "step": 303, "batch_size": 64, "mean": 43.9742317199707, "std": 63.64446258544922, "min": -96.96221923828125, "p10": -41.18609428405762, "median": 61.07869338989258, "p90": 125.04119262695313, "max": 171.8966064453125, "pos_frac": 0.703125, "sample": [-10.654220581054688, 67.13371276855469, 88.824951171875, 23.216184616088867, 128.2171630859375, 89.22793579101562, 83.16183471679688, -58.689697265625, 103.73912811279297, 60.53703308105469, 113.92997741699219, -40.27385711669922, 46.2103385925293, -6.273714065551758, -75.2998046875, -66.31887817382812, -56.83851623535156, 113.5413818359375, -96.96221923828125, -34.8094482421875, -0.0963592529296875, 13.96925163269043, 171.8966064453125, 73.65536499023438, -59.77775573730469, 69.85942077636719, 95.99014282226562, -36.384239196777344, -4.656642913818359, 20.985931396484375, 61.62035369873047, -2.2139129638671875, 11.235466003417969, 25.156494140625, 12.848960876464844, -5.727794647216797, 129.11123657226562, 8.392250061035156, 97.11697387695312, 78.39273071289062, 24.0728759765625, 96.68312072753906, 69.62781524658203, 126.23361206054688, 0.24318695068359375, 95.99067687988281, 135.87405395507812, 36.028167724609375, 66.40650939941406, 113.14144134521484, -27.46453857421875, -0.7619190216064453, -41.57705307006836, 85.28656005859375, 130.62265014648438, 82.40690612792969, 23.404314041137695, 72.9796142578125, 88.36384582519531, 108.54931640625, 122.25888061523438, -33.894447326660156, 71.69775390625, 135.18362426757812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000303.npy"} +{"epoch": 0.4580498866213152, "step": 304, "batch_size": 64, "mean": 44.965667724609375, "std": 50.294124603271484, "min": -104.4561767578125, "p10": -14.210608673095695, "median": 40.00384330749512, "p90": 111.0638442993164, "max": 134.59970092773438, "pos_frac": 0.796875, "sample": [122.22877502441406, -1.6622085571289062, 84.61624145507812, 106.06190490722656, 15.403900146484375, 53.35129928588867, 38.380577087402344, 50.04229736328125, -21.676755905151367, 38.83266830444336, 5.2915802001953125, 100.58268737792969, 92.64694213867188, 37.94276428222656, 111.19642639160156, 53.00067901611328, -2.8608627319335938, 53.83011245727539, 110.75448608398438, -104.4561767578125, 38.428436279296875, 99.74617004394531, 28.017837524414062, 29.150184631347656, -6.728233337402344, 12.382415771484375, 0.7126178741455078, 38.71853256225586, 49.16896057128906, 115.87981414794922, 70.16414642333984, -0.04394721984863281, 125.36801147460938, 63.61247253417969, 8.83489990234375, -60.44276428222656, 63.374794006347656, 87.15890502929688, 28.982177734375, 38.028564453125, 0.8387050628662109, -18.378023147583008, 134.59970092773438, 41.175018310546875, 2.87860107421875, 8.826034545898438, 47.325592041015625, 61.68604278564453, 105.2222671508789, 129.69314575195312, -20.377227783203125, -1.0355987548828125, 106.49703979492188, -6.871417999267578, 104.17668914794922, -17.355976104736328, 45.62816619873047, 124.0966567993164, 77.95417785644531, 28.492233276367188, 36.95429992675781, -27.24013900756836, 44.186004638671875, 94.80924987792969], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000304.npy"} +{"epoch": 0.4595616024187453, "step": 305, "batch_size": 64, "mean": 33.390316009521484, "std": 61.2466926574707, "min": -135.92825317382812, "p10": -50.01671829223633, "median": 29.25416851043701, "p90": 110.806893157959, "max": 143.39450073242188, "pos_frac": 0.734375, "sample": [99.58009338378906, 20.190574645996094, 13.3016357421875, -47.29071807861328, -10.263626098632812, 0.5826911926269531, 143.39450073242188, -56.21446990966797, 44.36767578125, 130.97398376464844, 12.991535186767578, 133.67799377441406, -52.616973876953125, 83.67425537109375, -76.12432861328125, -49.14898681640625, 28.458175659179688, 4.023929595947266, -52.17549133300781, 58.58885192871094, 23.87563705444336, 35.781959533691406, 20.981101989746094, 65.61929321289062, 57.555030822753906, 71.93019104003906, 53.39727783203125, 3.234588623046875, 69.0224609375, -135.92825317382812, -6.678680419921875, 56.02630615234375, 103.00149536132812, 104.97075653076172, -19.487289428710938, 17.606748580932617, 135.7884521484375, -27.12811279296875, 25.166372299194336, 35.833404541015625, 10.875274658203125, 23.208236694335938, 82.20240020751953, 128.8363800048828, 88.34650421142578, -11.111949920654297, 25.029808044433594, -45.24485778808594, 118.64898681640625, 82.95547485351562, 85.9344253540039, 33.995994567871094, 29.17074966430664, 103.23279571533203, 54.22712707519531, 112.07101440429688, -31.937942504882812, 40.67707824707031, -82.00018310546875, 107.8572769165039, -15.266363143920898, 29.337587356567383, 95.78300476074219, -50.38860321044922], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000305.npy"} +{"epoch": 0.46107331821617537, "step": 306, "batch_size": 64, "mean": 32.89083480834961, "std": 47.500335693359375, "min": -97.45838165283203, "p10": -12.514241409301755, "median": 28.3307466506958, "p90": 90.78329391479492, "max": 163.05136108398438, "pos_frac": 0.796875, "sample": [115.72396850585938, 52.69477081298828, 5.307126998901367, 120.04843139648438, 16.00531005859375, 77.7101821899414, 17.696819305419922, 35.67020034790039, 31.963136672973633, 62.223976135253906, 100.53800201416016, 83.2701416015625, -44.495079040527344, 18.39773941040039, -13.285091400146484, -97.45838165283203, 91.34251403808594, 49.847900390625, 42.61899185180664, 5.259098052978516, 0.08654022216796875, 62.58844757080078, 89.47844696044922, 10.578290939331055, 14.30158805847168, 11.486419677734375, -23.68373680114746, 62.36370849609375, 10.345924377441406, 35.27027893066406, -33.19773864746094, 83.40625, -3.4732513427734375, 7.11412239074707, 62.92503356933594, 42.18486785888672, 111.21849060058594, 146.6728057861328, 7.5788421630859375, 24.69835662841797, 32.861419677734375, 10.045625686645508, 11.993488311767578, 48.32731628417969, -55.10497283935547, 16.15875244140625, -7.714574813842773, 39.636444091796875, 7.868843078613281, 32.97221374511719, 81.35860443115234, 63.783058166503906, -7.3470611572265625, 2.56634521484375, 39.762908935546875, -2.746051788330078, 12.452491760253906, -10.715591430664062, 57.135963439941406, 163.05136108398438, -38.536224365234375, 32.59040832519531, 84.9222412109375, -3.3328895568847656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000306.npy"} +{"epoch": 0.46258503401360546, "step": 307, "batch_size": 64, "mean": 20.443254470825195, "std": 60.42987823486328, "min": -103.63569641113281, "p10": -51.63292388916015, "median": 8.152483940124512, "p90": 110.67835540771486, "max": 140.4525909423828, "pos_frac": 0.546875, "sample": [84.11742401123047, -24.058082580566406, 12.078693389892578, -34.34685516357422, -66.91258239746094, 76.20481872558594, 140.4525909423828, -32.456199645996094, 123.3472900390625, 67.40023803710938, -36.30397033691406, 31.019447326660156, 13.616973876953125, 123.39777374267578, -103.63569641113281, 56.58998107910156, 39.05497741699219, 0.25873565673828125, 83.36802673339844, -51.653106689453125, 60.34735107421875, -61.76652526855469, -10.41290283203125, -51.58583068847656, 35.01123046875, -64.07154083251953, -28.043167114257812, 49.68621826171875, 83.43574523925781, -1.9110298156738281, -15.271141052246094, 20.73145866394043, -1.6482734680175781, -41.441158294677734, -45.230918884277344, 62.813385009765625, -37.40748596191406, -5.168647766113281, 74.38792419433594, -25.825973510742188, 4.136203765869141, -25.50556182861328, -1.9240493774414062, 126.16458129882812, 112.08012390136719, -30.15886688232422, 44.01852798461914, 107.40756225585938, 117.53050994873047, 61.58361053466797, -81.47747802734375, 41.87024688720703, 97.07051086425781, 4.226274490356445, 72.67463684082031, 53.48828887939453, -3.4989776611328125, 120.24465942382812, -45.72991180419922, -18.94188690185547, -61.25844192504883, 35.80743408203125, 83.77416229248047, -3.38311767578125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000307.npy"} +{"epoch": 0.46409674981103555, "step": 308, "batch_size": 64, "mean": 32.54762649536133, "std": 58.17353439331055, "min": -123.61224365234375, "p10": -41.454301834106445, "median": 25.99996566772461, "p90": 110.91519927978518, "max": 140.62753295898438, "pos_frac": 0.734375, "sample": [125.2500228881836, 78.0649642944336, 79.12159729003906, -41.659786224365234, 105.36116027832031, 71.90750122070312, -18.26927947998047, 31.423416137695312, 30.30389404296875, -14.825019836425781, 103.33721923828125, 91.00381469726562, 113.29550170898438, 21.69603729248047, 6.054534912109375, -53.13212966918945, 33.137977600097656, 102.93539428710938, 87.16624450683594, 39.87434005737305, 66.31878662109375, -23.18670654296875, 131.67449951171875, 64.17472839355469, 32.723426818847656, 55.63871765136719, -1.1431140899658203, 16.496421813964844, 69.50216674804688, -72.58795166015625, 140.62753295898438, -10.141441345214844, 17.521259307861328, -44.58515548706055, 64.53453826904297, 1.2023773193359375, 78.59593963623047, -4.0025482177734375, 7.9799346923828125, -123.61224365234375, 12.6910400390625, 1.4305496215820312, 54.15522766113281, 122.8883056640625, 9.657459259033203, 37.27227783203125, 54.185508728027344, -40.97483825683594, 70.95504760742188, 1.5088081359863281, 101.46573638916016, 8.208099365234375, -16.20159912109375, 78.11376190185547, 134.68133544921875, 16.241310119628906, 123.80435943603516, -67.51834106445312, -40.907997131347656, 9.640676498413086, 5.797971725463867, -68.44612121582031, 15.035888671875, -0.41499900817871094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000308.npy"} +{"epoch": 0.4656084656084656, "step": 309, "batch_size": 64, "mean": 32.49545669555664, "std": 53.731441497802734, "min": -95.21755981445312, "p10": -23.250779724121095, "median": 33.015727043151855, "p90": 106.25049209594728, "max": 149.3380584716797, "pos_frac": 0.71875, "sample": [82.34168243408203, 141.11880493164062, 15.760322570800781, 95.84724426269531, 39.591453552246094, 4.177650451660156, 73.01436614990234, -17.93939208984375, 45.442169189453125, 5.147193908691406, 50.91731262207031, -1.5255508422851562, -53.98295211791992, -21.856718063354492, 16.001419067382812, -83.11624145507812, 22.54890251159668, 101.8084945678711, -45.481407165527344, -4.511285781860352, 4.553028106689453, 84.27487182617188, 108.15420532226562, 4.762205123901367, 65.29690551757812, 66.47731018066406, -11.253517150878906, 17.860227584838867, 1.1856918334960938, -3.5116729736328125, 8.822050094604492, -11.801498413085938, -17.939071655273438, 109.75418090820312, 63.70330810546875, 24.39797592163086, 41.55254364013672, 2.4715003967285156, -6.083993911743164, 57.670143127441406, -17.573440551757812, 131.4820556640625, 89.40534973144531, 34.58699035644531, 149.3380584716797, -95.21755981445312, 90.54004669189453, 42.595394134521484, 31.4444637298584, 57.16620635986328, -23.20172119140625, 7.7689361572265625, 43.408363342285156, 40.05989074707031, 121.07892608642578, 69.70439147949219, 49.19721984863281, 77.7226791381836, -33.70814514160156, -58.44940185546875, 46.16241455078125, -23.271804809570312, 44.25206756591797, 129.56797790527344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000309.npy"} +{"epoch": 0.4671201814058957, "step": 310, "batch_size": 64, "mean": 20.145675659179688, "std": 52.93830108642578, "min": -67.30021667480469, "p10": -42.72982635498047, "median": 11.932455062866211, "p90": 90.2706840515137, "max": 162.27703857421875, "pos_frac": 0.625, "sample": [92.36225891113281, -5.4452056884765625, 25.17855453491211, 43.93096160888672, 26.6785888671875, -53.86273956298828, -19.729766845703125, 78.32208251953125, 95.0457534790039, 0.7305393218994141, -36.10923767089844, -41.99339294433594, 44.24774932861328, 124.42082214355469, 8.97967529296875, -1.9369850158691406, 3.1413116455078125, 51.379364013671875, 140.17587280273438, -22.67974853515625, 11.586673736572266, -32.102054595947266, -67.1133804321289, 162.27703857421875, -22.43915557861328, -25.93964385986328, 64.77645111083984, -18.76593017578125, 27.731033325195312, 66.02478790283203, -67.30021667480469, 44.79133605957031, -6.4669036865234375, 85.07011413574219, -24.18292236328125, 40.481109619140625, 6.348236083984375, 71.0724868774414, 7.733421325683594, 65.13699340820312, 12.278236389160156, 18.575653076171875, -45.46478271484375, -43.045440673828125, 69.15479278564453, 23.977798461914062, -6.9877471923828125, 52.69657897949219, 2.84588623046875, -16.66656494140625, 14.887245178222656, 101.99645233154297, 85.39034271240234, -67.08964538574219, -1.455841064453125, -32.397560119628906, 17.8006591796875, 123.17037963867188, 34.266761779785156, -24.791748046875, -64.78108215332031, 72.37166595458984, 5.057615280151367, 15.977638244628906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000310.npy"} +{"epoch": 0.46863189720332576, "step": 311, "batch_size": 64, "mean": 35.264381408691406, "std": 58.27051544189453, "min": -136.1396026611328, "p10": -23.116149139404296, "median": 30.878334045410156, "p90": 100.68037567138673, "max": 274.3860778808594, "pos_frac": 0.765625, "sample": [84.45091247558594, 0.5096664428710938, 20.239601135253906, -8.864204406738281, -20.800277709960938, -26.027084350585938, 41.438358306884766, 100.28498077392578, 4.016756057739258, 75.06330108642578, 16.56079864501953, -136.1396026611328, 7.038398742675781, 79.2248764038086, 57.857818603515625, -6.29606819152832, 74.36123657226562, 31.36835479736328, 105.67190551757812, 39.491729736328125, 7.051239013671875, 44.70587158203125, 2.7628040313720703, 40.80705261230469, 100.8498306274414, 5.977878570556641, -23.70614242553711, -21.739498138427734, 0.0363922119140625, 37.176361083984375, -37.50819396972656, 139.36691284179688, 163.2719268798828, 38.54802703857422, 17.068344116210938, 55.045494079589844, 16.703636169433594, 76.83328247070312, 31.213958740234375, 61.17744445800781, 274.3860778808594, 15.351150512695312, -6.081489562988281, 94.37274169921875, -36.14872741699219, 15.748886108398438, 23.90289306640625, -7.2454071044921875, 58.863502502441406, 27.95221710205078, 132.87014770507812, 72.64651489257812, 54.42140197753906, -35.60149383544922, 34.282188415527344, 79.59466552734375, 3.5650405883789062, -46.50398254394531, -10.632492065429688, 30.542709350585938, -6.326210021972656, 34.37824249267578, 101.49482727050781, 55.99290466308594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000311.npy"} +{"epoch": 0.47014361300075586, "step": 312, "batch_size": 64, "mean": 43.10749435424805, "std": 48.30134201049805, "min": -62.13087463378906, "p10": -18.414965820312496, "median": 35.695037841796875, "p90": 112.14987106323248, "max": 146.81886291503906, "pos_frac": 0.859375, "sample": [31.10781478881836, 6.8482666015625, -20.54986572265625, 15.987319946289062, 36.88606262207031, 11.708076477050781, 44.0695686340332, -11.822723388671875, 25.797256469726562, 21.313133239746094, 132.94515991210938, 58.112945556640625, 90.97827911376953, 69.55814361572266, 2.9959144592285156, 70.54059600830078, 13.558448791503906, 4.745151519775391, 18.056371688842773, 99.04678344726562, 117.7654800415039, 27.082481384277344, 6.813533782958984, 32.78179168701172, 34.50401306152344, 123.54757690429688, 13.592353820800781, -21.601455688476562, 37.96330261230469, 93.91841125488281, 129.9950714111328, -62.13087463378906, 61.46062469482422, 88.26348876953125, -60.77954864501953, 38.930904388427734, 89.55851745605469, 29.569480895996094, 94.13006591796875, 146.81886291503906, 135.50289916992188, 3.092082977294922, 32.039085388183594, 57.04920959472656, 94.2177734375, 28.245849609375, 32.499717712402344, 98.67784118652344, 49.21942138671875, -26.419063568115234, -13.43353271484375, 71.33988952636719, 118.33836364746094, 56.00018310546875, 13.37884521484375, 60.24623107910156, 51.98992156982422, 39.77839660644531, -49.02090835571289, 93.4425048828125, 59.048423767089844, -22.79064178466797, 18.118480682373047, 14.251861572265625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000312.npy"} +{"epoch": 0.47165532879818595, "step": 313, "batch_size": 64, "mean": 23.641815185546875, "std": 53.048343658447266, "min": -92.57783508300781, "p10": -42.477140426635735, "median": 14.876091003417969, "p90": 94.55109786987305, "max": 173.90499877929688, "pos_frac": 0.671875, "sample": [-6.539506912231445, 26.735008239746094, 53.80305480957031, 14.96249008178711, 19.56951904296875, 42.44544982910156, 9.415538787841797, 26.025747299194336, 88.1153793334961, -48.68678283691406, 2.144620895385742, 34.421966552734375, 48.26377868652344, 23.361404418945312, 8.687797546386719, -6.2960357666015625, 0.40765380859375, -35.843570709228516, -19.490036010742188, -4.354621887207031, 46.944114685058594, 64.80815887451172, 4.460123062133789, 138.3601837158203, -85.55268859863281, -45.320098876953125, -7.333343505859375, 36.912322998046875, 92.8988037109375, 41.158531188964844, 129.03506469726562, 79.50135803222656, -66.706298828125, -5.124757766723633, 125.82865905761719, 39.406471252441406, 2.4512786865234375, 9.750446319580078, -8.614814758300781, 125.5788345336914, 30.164554595947266, 14.789691925048828, 59.08198547363281, -12.306930541992188, 173.90499877929688, 3.402313232421875, -11.396499633789062, -12.058952331542969, 28.123687744140625, 11.482170104980469, 95.25922393798828, 41.05023193359375, 34.02555847167969, -1.2983894348144531, -1.6502571105957031, -92.57783508300781, 63.370399475097656, -51.35954666137695, 98.712890625, -31.857574462890625, -48.59963607788086, 24.11865234375, 11.519386291503906, 91.58483123779297], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000313.npy"} +{"epoch": 0.47316704459561604, "step": 314, "batch_size": 64, "mean": 43.26057434082031, "std": 53.16264724731445, "min": -53.28810119628906, "p10": -8.862994003295897, "median": 37.480703353881836, "p90": 122.6002685546875, "max": 165.98660278320312, "pos_frac": 0.734375, "sample": [32.86829376220703, 14.01772689819336, 21.91712188720703, 122.00782775878906, 42.99831771850586, 57.888526916503906, 0.3557586669921875, 88.9522933959961, -39.22374725341797, 60.72637176513672, -0.7796630859375, -9.601024627685547, 153.6600341796875, 42.91145324707031, -7.140922546386719, 165.98660278320312, 53.78230667114258, 46.53856658935547, 104.98394012451172, -3.6561050415039062, 5.5435638427734375, -0.2660369873046875, 103.14939880371094, 122.85417175292969, 118.04193115234375, -53.28810119628906, 18.836219787597656, 129.7056884765625, 14.102401733398438, -4.385009765625, 83.51639556884766, 43.030181884765625, 24.479198455810547, -6.8658905029296875, 2.7440433502197266, 37.422122955322266, 69.12454223632812, -30.551162719726562, 23.681154251098633, 69.22026062011719, -5.816717147827148, -6.0066986083984375, 126.14278411865234, 42.77024459838867, 90.04530334472656, 19.49066162109375, 77.59310913085938, 116.07550811767578, -5.890129089355469, 123.4103775024414, 53.69105529785156, 115.40634155273438, 66.68099975585938, 12.663276672363281, 83.98773193359375, 22.645309448242188, -24.578018188476562, 37.539283752441406, 19.431228637695312, -2.0477523803710938, 46.90996551513672, -44.185569763183594, -45.154354095458984, 128.58404541015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000314.npy"} +{"epoch": 0.47467876039304613, "step": 315, "batch_size": 64, "mean": 33.62580871582031, "std": 49.026329040527344, "min": -89.85330200195312, "p10": -33.4709014892578, "median": 41.067378997802734, "p90": 99.28922424316407, "max": 137.26077270507812, "pos_frac": 0.734375, "sample": [-22.716796875, 65.43620300292969, 103.86412048339844, -3.3521595001220703, -3.7853317260742188, 28.947656631469727, -89.85330200195312, -2.062541961669922, -51.77758026123047, 45.378273010253906, -56.72486114501953, 41.41468811035156, -14.08773422241211, 111.91390228271484, -3.743877410888672, 49.17925262451172, 33.97998809814453, -17.203163146972656, 17.759769439697266, 1.3303241729736328, 40.720069885253906, 59.77803039550781, 1.627462387084961, 41.92859649658203, 26.827590942382812, 43.31863784790039, 42.7503662109375, -19.640655517578125, 33.81899642944336, 58.337440490722656, 45.34657287597656, 55.76712417602539, 99.50038146972656, 16.208572387695312, 23.518287658691406, 77.33303833007812, 84.27412414550781, -46.87721252441406, -38.079803466796875, 46.95564270019531, 93.45700073242188, 1.780487060546875, 84.90057373046875, 105.91759490966797, -15.792984008789062, 64.75991821289062, 58.112648010253906, 137.26077270507812, -42.75905227661133, 33.71617889404297, 55.88691711425781, 9.335174560546875, 95.93405151367188, 0.34063148498535156, 66.84724426269531, 12.816211700439453, 98.79652404785156, 47.86753845214844, 105.54232788085938, -44.605712890625, 85.00761413574219, -5.243932723999023, 121.66456604003906, 53.199188232421875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000315.npy"} +{"epoch": 0.47619047619047616, "step": 316, "batch_size": 64, "mean": 44.688846588134766, "std": 52.00922775268555, "min": -50.2003173828125, "p10": -17.286224937438963, "median": 40.170732498168945, "p90": 121.63944091796876, "max": 157.6485137939453, "pos_frac": 0.75, "sample": [-12.271400451660156, 11.52325439453125, 72.90028381347656, -28.644775390625, -43.15513610839844, -12.94012451171875, 57.59161376953125, 34.20268249511719, 19.344825744628906, 96.4250717163086, 124.33065032958984, 122.74444580078125, 78.721923828125, 125.65235900878906, 41.305999755859375, -29.250564575195312, -50.2003173828125, 17.956748962402344, -17.67670249938965, 72.41514587402344, 19.20488166809082, 119.06109619140625, 6.053703308105469, 21.267005920410156, 30.919769287109375, 36.60019302368164, 59.3514404296875, 11.190048217773438, -12.342777252197266, 29.693702697753906, 108.19145202636719, 109.32893371582031, 78.60565185546875, 157.6485137939453, -11.426004409790039, 64.4700927734375, -8.453689575195312, 89.9217300415039, 76.51470184326172, 77.03026580810547, 111.50357055664062, 50.97278594970703, 39.035465240478516, 0.5796394348144531, 124.03340148925781, 10.938371658325195, -0.7175941467285156, 132.5074462890625, -6.689735412597656, 52.095428466796875, -33.74433898925781, -32.255714416503906, 8.503768920898438, -16.375110626220703, 43.050209045410156, 26.851699829101562, -0.112518310546875, 115.81495666503906, 82.56434631347656, 86.44989776611328, 63.963478088378906, 53.823211669921875, 124.70640563964844, 78.78046417236328], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000316.npy"} +{"epoch": 0.47770219198790626, "step": 317, "batch_size": 64, "mean": 45.36719512939453, "std": 51.12873077392578, "min": -82.72000122070312, "p10": -15.726213073730468, "median": 42.963748931884766, "p90": 116.74709320068361, "max": 149.5123291015625, "pos_frac": 0.8125, "sample": [81.47412872314453, 83.23805236816406, 60.660892486572266, 101.6724853515625, 49.15544128417969, 149.5123291015625, -21.520912170410156, 41.97277069091797, -31.246641159057617, 37.78681182861328, 7.208732604980469, 33.43104934692383, -15.344917297363281, 2.8493423461914062, 45.091796875, 11.016773223876953, 96.67549133300781, 23.858642578125, 87.6602554321289, 130.89613342285156, -32.293212890625, -3.7721786499023438, 33.08375549316406, -53.56880187988281, 35.16912841796875, 43.95472717285156, 97.96102905273438, 58.95014953613281, 79.0259017944336, -82.72000122070312, 123.0551986694336, 12.164443969726562, 63.59911346435547, 135.61566162109375, 118.25263214111328, -45.79557800292969, 46.585906982421875, -0.004276275634765625, 57.16697692871094, 126.23529815673828, 29.790287017822266, 49.15034484863281, 135.08383178710938, -7.082817077636719, 24.99176025390625, 12.137332916259766, 21.67816925048828, 100.52212524414062, 21.719131469726562, 4.2843780517578125, 70.45806884765625, 24.476612091064453, 41.289466857910156, 113.23416900634766, -3.371490478515625, 58.31715393066406, -15.889625549316406, 56.65251159667969, 110.61553192138672, 93.81938171386719, 2.0012588500976562, 99.85479736328125, 23.807403564453125, 47.24623107910156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000317.npy"} +{"epoch": 0.47921390778533635, "step": 318, "batch_size": 64, "mean": 32.15528106689453, "std": 66.7603530883789, "min": -93.28560638427734, "p10": -57.892232513427736, "median": 28.96119499206543, "p90": 128.6902618408203, "max": 198.67181396484375, "pos_frac": 0.65625, "sample": [28.52676010131836, 93.15245819091797, 16.63665771484375, -78.20173645019531, 109.7407455444336, 105.04399108886719, 40.802001953125, -58.34228515625, 51.20573425292969, 133.76104736328125, 12.371173858642578, -60.620994567871094, 63.013179779052734, 64.79330444335938, 117.84341430664062, -2.6115379333496094, 19.17193603515625, -34.29884338378906, 36.590232849121094, 6.350767135620117, -8.171249389648438, 72.69317626953125, 132.73898315429688, -18.69225311279297, 17.179790496826172, 70.82014465332031, 132.1092071533203, -87.96273803710938, 93.75733947753906, 80.36439514160156, -13.295707702636719, 33.188568115234375, -51.246002197265625, 21.127201080322266, 7.393241882324219, 198.67181396484375, 169.77992248535156, -30.068519592285156, 129.02447509765625, 11.367935180664062, -43.77229309082031, 29.3956298828125, 64.117431640625, -93.28560638427734, -5.681121826171875, 68.72557067871094, -1.5819625854492188, 137.09788513183594, -2.097003936767578, 88.19004821777344, 2.0331554412841797, 127.91043090820312, 41.281349182128906, 61.66209411621094, -76.48204040527344, -27.303688049316406, 62.07154846191406, -76.52714538574219, 40.52928161621094, -4.564971923828125, 81.49763488769531, -56.84210968017578, -22.420909881591797, 38.27684020996094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000318.npy"} +{"epoch": 0.48072562358276644, "step": 319, "batch_size": 64, "mean": 45.84477615356445, "std": 60.0948371887207, "min": -67.7557373046875, "p10": -27.439994812011715, "median": 42.076045989990234, "p90": 125.40345840454101, "max": 199.36639404296875, "pos_frac": 0.75, "sample": [62.82807159423828, 137.21090698242188, 21.69244384765625, 123.60025024414062, 20.228605270385742, 118.115966796875, 2.732208251953125, 38.69013977050781, 31.397018432617188, 46.42756652832031, 109.53346252441406, 106.72083282470703, -4.6840057373046875, 0.10391998291015625, 19.391151428222656, 61.423614501953125, 12.98858642578125, 158.9724578857422, 8.086898803710938, 65.02178192138672, 7.634494781494141, -24.919479370117188, 38.7723388671875, 60.90336227416992, 174.6040802001953, -8.177558898925781, 125.4199447631836, 71.87352752685547, 123.16830444335938, 125.72637939453125, -33.42677307128906, -44.07704162597656, 56.73114013671875, 199.36639404296875, -9.70498275756836, 63.13208770751953, -24.978363037109375, 84.36441802978516, 71.0407943725586, -46.61518478393555, 125.364990234375, 42.4415283203125, -13.811927795410156, -1.9063911437988281, 9.232475280761719, 17.948312759399414, -66.82054138183594, -10.580818176269531, -37.19105529785156, 91.61640930175781, -12.493499755859375, 45.715362548828125, 34.47636413574219, -28.494979858398438, 41.71056365966797, 96.85191345214844, 60.1658935546875, 83.40422058105469, 73.6457748413086, 21.666589736938477, 74.66212463378906, -67.7557373046875, 135.92489624023438, 66.97355651855469], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000319.npy"} +{"epoch": 0.48223733938019653, "step": 320, "batch_size": 64, "mean": 35.11654281616211, "std": 61.37388610839844, "min": -126.48258972167969, "p10": -25.887144660949705, "median": 16.56216049194336, "p90": 111.62650985717774, "max": 237.9410400390625, "pos_frac": 0.6875, "sample": [83.4600830078125, -40.440677642822266, 1.419830322265625, 52.64495086669922, 17.018470764160156, 32.10772705078125, 120.336181640625, 3.4373741149902344, 70.9376449584961, -3.6863784790039062, -36.92909240722656, 109.54444885253906, -0.4456005096435547, -1.808938980102539, -51.44800567626953, 102.00479125976562, 66.21947479248047, 9.192222595214844, -15.370895385742188, 87.20474243164062, -36.64825439453125, -1.5563163757324219, -126.48258972167969, 3.736268997192383, 12.712417602539062, 237.9410400390625, 149.64651489257812, 93.9464340209961, 103.89622497558594, -21.629867553710938, 30.989418029785156, -17.82486343383789, 11.859748840332031, 25.007904052734375, -0.9096794128417969, 112.5188217163086, 10.434349060058594, -22.718955993652344, -8.00692367553711, -8.003253936767578, 39.91630935668945, 139.84190368652344, 9.885208129882812, 53.35113525390625, 16.105850219726562, 49.9307861328125, 131.2428741455078, 46.20934295654297, 1.341339111328125, -27.24493980407715, 2.9231033325195312, -61.68675994873047, 142.23629760742188, -15.853202819824219, 0.3201866149902344, 66.2890625, 19.409759521484375, 85.14315795898438, 98.056640625, 54.71739959716797, 66.86234283447266, -7.778205871582031, 90.62324523925781, 91.30908203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000320.npy"} +{"epoch": 0.4837490551776266, "step": 321, "batch_size": 64, "mean": 37.189849853515625, "std": 58.26282501220703, "min": -99.22706604003906, "p10": -41.099889373779284, "median": 33.136085510253906, "p90": 120.63108673095705, "max": 136.7195281982422, "pos_frac": 0.78125, "sample": [84.14752197265625, 80.96431732177734, 2.5373077392578125, 85.1669692993164, 80.03884887695312, -19.93872833251953, 136.7195281982422, 64.20343780517578, 117.26516723632812, 36.911521911621094, 135.0430908203125, 22.594196319580078, 41.34858322143555, 78.6064453125, -96.58949279785156, 7.381092071533203, 15.352622985839844, 57.74700927734375, 36.158538818359375, 111.20958709716797, 25.427352905273438, 22.9771728515625, -69.11162567138672, -8.324066162109375, 45.060874938964844, -72.179931640625, -66.51897430419922, -73.6526107788086, 57.154457092285156, 29.497909545898438, 31.801422119140625, 54.261417388916016, 92.23934936523438, 58.28266525268555, 12.738578796386719, 67.22848510742188, 55.856292724609375, -3.096071243286133, 22.76284408569336, 106.34728240966797, 3.0846710205078125, -0.9317359924316406, 21.761493682861328, 85.96843719482422, 12.432754516601562, -99.22706604003906, 110.66482543945312, 131.90771484375, 122.07362365722656, 58.230716705322266, 10.658035278320312, 8.718194961547852, 29.506004333496094, 123.80513000488281, 126.27468872070312, -10.728553771972656, 25.13524627685547, 34.47074890136719, 136.52745056152344, -46.00945281982422, 19.158912658691406, -4.316535949707031, 45.00885009765625, -29.644241333007812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000321.npy"} +{"epoch": 0.4852607709750567, "step": 322, "batch_size": 64, "mean": 49.24391174316406, "std": 53.71333694458008, "min": -92.46636962890625, "p10": -15.381970405578612, "median": 37.97625541687012, "p90": 124.33892822265625, "max": 135.6407012939453, "pos_frac": 0.859375, "sample": [-14.345624923706055, 68.55829620361328, 129.33285522460938, 17.90118408203125, 99.30192565917969, 15.672401428222656, 131.9278564453125, 85.54175567626953, 112.58049011230469, 36.344451904296875, 49.256080627441406, 52.13829040527344, 124.93562316894531, 135.6407012939453, 81.57611083984375, 5.8323516845703125, 33.04722595214844, 33.85960388183594, 5.740795135498047, 24.191802978515625, 72.63803100585938, 0.24106597900390625, -60.98693084716797, 121.78199768066406, 113.16839599609375, 18.456192016601562, 24.369842529296875, 38.038978576660156, 1.1323471069335938, -10.267814636230469, -26.7457275390625, 88.31364440917969, 34.41270446777344, 115.33342742919922, 114.05897521972656, 58.08775329589844, 18.183677673339844, 130.25222778320312, 12.570114135742188, -17.875396728515625, 61.45953369140625, 54.99469757080078, 2.4923744201660156, 120.82428741455078, 24.819740295410156, 122.94664001464844, 128.3295135498047, 90.33926391601562, -32.19468688964844, -92.46636962890625, 37.91353225708008, 19.978286743164062, 19.950565338134766, 42.83976745605469, 110.344482421875, 23.71142578125, 55.41284942626953, 29.110366821289062, 66.9981689453125, -38.6920280456543, 135.31851196289062, -15.826118469238281, 82.18045043945312, 26.627321243286133], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000322.npy"} +{"epoch": 0.48677248677248675, "step": 323, "batch_size": 64, "mean": 34.64881896972656, "std": 66.80699157714844, "min": -122.08167266845703, "p10": -38.02350158691405, "median": 15.815597534179688, "p90": 133.4409378051758, "max": 183.72784423828125, "pos_frac": 0.71875, "sample": [11.260169982910156, -71.03656005859375, 64.33442687988281, 35.64453125, -15.028724670410156, 121.46458435058594, 29.967056274414062, 11.29959487915039, 6.176338195800781, 135.4706268310547, 32.92579650878906, -26.32978630065918, 128.64227294921875, 19.06810760498047, 103.12615203857422, -24.78274154663086, -44.06999206542969, 91.31524658203125, 84.1332015991211, 9.622772216796875, 56.30726623535156, 102.9427490234375, 17.322357177734375, 14.959548950195312, 150.333740234375, -10.483299255371094, -41.946563720703125, 57.37208557128906, 0.2077960968017578, -28.86968994140625, 183.72784423828125, -28.340301513671875, 10.268836975097656, -48.0206184387207, 133.7905731201172, 17.74681854248047, -53.751953125, 119.68798828125, 82.58126831054688, 0.6872196197509766, 16.56786346435547, 54.58867645263672, -9.58258056640625, 4.309104919433594, 147.4643096923828, 161.5256805419922, 132.6251220703125, -113.22987365722656, 158.1270751953125, 3.6653518676757812, -122.08167266845703, -3.5960159301757812, 94.09429168701172, 15.063331604003906, -2.33758544921875, 75.01062774658203, 79.0322265625, 67.89352416992188, 3.4813690185546875, -8.092899322509766, 25.133373260498047, 2.3435516357421875, 6.9742584228515625, -11.181381225585938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000323.npy"} +{"epoch": 0.48828420256991684, "step": 324, "batch_size": 64, "mean": 42.810333251953125, "std": 54.005149841308594, "min": -110.8078842163086, "p10": -15.373353004455566, "median": 32.97072982788086, "p90": 112.88522644042969, "max": 168.96768188476562, "pos_frac": 0.859375, "sample": [72.36221313476562, 39.073089599609375, 32.91548156738281, 11.149024963378906, -55.0858039855957, 135.5922088623047, 43.26592254638672, 53.85658264160156, -28.310562133789062, -6.000236511230469, 10.362998962402344, 111.50601196289062, 64.78695678710938, 49.03975296020508, 79.62966918945312, 16.1610107421875, 116.23709869384766, -25.59648895263672, 70.77918243408203, 8.537200927734375, 56.54150390625, 17.6881103515625, 5.343273162841797, 72.86481475830078, 31.4952392578125, 12.996118545532227, -22.15747833251953, 15.280067443847656, 168.96768188476562, 17.143970489501953, 19.20361328125, -110.8078842163086, 52.00904846191406, 113.476318359375, 27.726272583007812, 46.60771560668945, 24.96283721923828, -15.096410751342773, 68.86763000488281, 75.19982147216797, 35.89537048339844, -37.07855224609375, 159.72119140625, 14.576362609863281, 145.38690185546875, 19.177654266357422, 4.4129486083984375, 110.52943420410156, 53.87588882446289, 111.47396087646484, 144.8646697998047, 2.546710968017578, 5.0551605224609375, 85.35931396484375, 92.73094177246094, 1.9445343017578125, 33.025978088378906, 0.8868255615234375, -15.492042541503906, 51.98698043823242, 108.59646606445312, 105.7923583984375, 24.0091552734375, 2.0094127655029297], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000324.npy"} +{"epoch": 0.4897959183673469, "step": 325, "batch_size": 64, "mean": 42.71232986450195, "std": 66.55587005615234, "min": -170.6421661376953, "p10": -28.588523864746094, "median": 41.81354331970215, "p90": 117.03997650146485, "max": 215.1746826171875, "pos_frac": 0.75, "sample": [37.71585464477539, 110.34269714355469, 2.214588165283203, 95.25218200683594, -20.56157684326172, 57.85600280761719, 82.09341430664062, 53.371681213378906, 54.88041687011719, 63.342796325683594, 69.27742004394531, 97.83850860595703, -0.6773548126220703, -27.980392456054688, 57.830047607421875, -11.320056915283203, 114.8463134765625, 92.48359680175781, 89.24401092529297, -81.64309692382812, 151.64999389648438, -28.849151611328125, 109.20840454101562, 1.4860591888427734, -0.7668304443359375, 164.81585693359375, 14.65097427368164, 100.33123779296875, -49.61190414428711, 49.28150177001953, -67.80679321289062, 41.90888595581055, 81.30667877197266, 41.71820068359375, -65.78887176513672, 73.28671264648438, -46.03470993041992, 98.40251159667969, 43.17267608642578, 215.1746826171875, 48.83192443847656, 17.786794662475586, 21.182373046875, 176.70584106445312, -170.6421661376953, 19.84178924560547, 31.694488525390625, 20.19001007080078, 117.98011779785156, 65.76861572265625, 139.26980590820312, -7.230506896972656, 37.495758056640625, -13.464553833007812, 13.739387512207031, -10.64385986328125, 34.393699645996094, 50.2541618347168, 162.50697326660156, 41.358306884765625, 20.802200317382812, 43.60346221923828, 22.235977172851562, -14.0145263671875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000325.npy"} +{"epoch": 0.491307634164777, "step": 326, "batch_size": 64, "mean": 19.520490646362305, "std": 59.92258834838867, "min": -104.13430786132812, "p10": -68.41730766296386, "median": 16.927675247192383, "p90": 95.26742324829102, "max": 145.36656188964844, "pos_frac": 0.59375, "sample": [-23.751075744628906, -9.226299285888672, 15.331974029541016, 18.538753509521484, 38.02561950683594, -104.13430786132812, 145.36656188964844, 103.050048828125, -3.6541748046875, 69.95415496826172, -29.437652587890625, 35.35988998413086, 24.367412567138672, 1.5211181640625, 49.4996452331543, 91.14653778076172, 7.983652114868164, 58.64396667480469, -8.906875610351562, 47.76737976074219, 103.37223052978516, -5.0630645751953125, 18.52337646484375, 69.3037109375, -47.52739715576172, -15.528594970703125, -91.08441162109375, -12.438812255859375, 0.97491455078125, -6.363563537597656, 137.29928588867188, -100.17183685302734, 47.354026794433594, -11.022907257080078, 57.051673889160156, 28.381820678710938, 5.436378479003906, -21.987762451171875, -42.75437927246094, -33.751922607421875, 95.79680633544922, 120.7892074584961, -72.01554870605469, -7.652191162109375, 94.03219604492188, 27.073387145996094, 31.610111236572266, -72.87763214111328, 85.13629913330078, 128.4379119873047, -3.7617454528808594, -11.112024307250977, -86.58763122558594, 82.16988372802734, -14.1231689453125, 13.015533447265625, -77.86048889160156, 76.12826538085938, 57.26180648803711, 31.09649658203125, 84.22761535644531, -60.02141189575195, 33.052886962890625, 88.04582214355469], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000326.npy"} +{"epoch": 0.4928193499622071, "step": 327, "batch_size": 64, "mean": 34.24985885620117, "std": 65.29631805419922, "min": -126.68238830566406, "p10": -47.71833915710449, "median": 30.544631958007812, "p90": 123.2050018310547, "max": 180.389892578125, "pos_frac": 0.71875, "sample": [41.75597381591797, -49.02106475830078, -30.08124542236328, 146.92352294921875, 31.536758422851562, 59.916656494140625, -87.50513458251953, 63.61097717285156, -71.65202331542969, 66.42095947265625, 135.56094360351562, 22.622180938720703, -78.25077056884766, 112.3463134765625, 38.380714416503906, 120.4888916015625, 99.19400024414062, 10.646125793457031, 39.01719665527344, -39.89873123168945, -0.6073894500732422, 13.576313018798828, 60.518653869628906, 147.96340942382812, 124.36904907226562, 5.2064361572265625, 45.36260986328125, 62.525970458984375, 83.53771209716797, 6.4390411376953125, 22.668792724609375, 8.437503814697266, -57.23338317871094, 103.080322265625, 95.41940307617188, 2.6073226928710938, 33.07923889160156, 29.552505493164062, -9.875732421875, 1.7158546447753906, 143.64027404785156, 19.235305786132812, -126.68238830566406, 5.46728515625, 90.59003448486328, 180.389892578125, -25.367950439453125, 88.79159545898438, 136.577880859375, 39.39794158935547, 102.48839569091797, -7.646936416625977, 21.029556274414062, 8.099163055419922, -44.678646087646484, -22.250452041625977, 97.98172760009766, 75.54752349853516, 38.875030517578125, -5.392223358154297, -6.723274230957031, -82.50879669189453, 69.64387512207031, -14.869682312011719], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000327.npy"} +{"epoch": 0.4943310657596372, "step": 328, "batch_size": 64, "mean": 42.193260192871094, "std": 55.13753128051758, "min": -82.19010162353516, "p10": -13.99642810821533, "median": 27.53561782836914, "p90": 118.78080673217774, "max": 164.41259765625, "pos_frac": 0.765625, "sample": [109.60728454589844, 5.94389533996582, 8.934694290161133, 29.129287719726562, 103.48782348632812, 9.422307968139648, -14.970897674560547, 89.80113983154297, 54.564430236816406, 22.675811767578125, 21.53404998779297, 130.64938354492188, 121.42539978027344, 24.804988861083984, 49.4208984375, -44.05134582519531, 134.05636596679688, 19.905759811401367, 48.04570007324219, -7.702899932861328, 29.568252563476562, 0.90521240234375, 6.311063766479492, 43.6084098815918, -19.234603881835938, -9.725257873535156, 163.27496337890625, 25.94194793701172, -55.665435791015625, 39.370826721191406, -82.19010162353516, 98.53558349609375, 83.76161193847656, 8.684478759765625, 113.71298217773438, -18.553817749023438, 23.649429321289062, -2.4554443359375, 164.41259765625, 13.1566162109375, 110.84764099121094, 118.84019470214844, -5.749687194824219, -11.722665786743164, 3.2046661376953125, 95.82781219482422, -3.850667953491211, 13.093002319335938, 2.4582672119140625, 30.826160430908203, 66.7648696899414, -25.792037963867188, 52.188690185546875, 33.872406005859375, 10.70159912109375, 67.27676391601562, 84.28362274169922, -1.2425289154052734, 118.6422348022461, 49.24701690673828, 98.20172119140625, -0.0923309326171875, 137.22792053222656, 111.56072235107422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000328.npy"} +{"epoch": 0.4958427815570673, "step": 329, "batch_size": 64, "mean": 42.49573516845703, "std": 61.471458435058594, "min": -73.68582153320312, "p10": -30.884706497192376, "median": 29.101985931396484, "p90": 134.47635574340822, "max": 170.98651123046875, "pos_frac": 0.75, "sample": [9.339654922485352, 12.075580596923828, 48.51325225830078, 29.89971160888672, -34.67997741699219, 36.62078857421875, 170.98651123046875, -17.115310668945312, 113.61590576171875, 17.122802734375, 89.9503173828125, 49.13557434082031, -11.265920639038086, 87.04716491699219, 0.40748023986816406, 9.913200378417969, 32.198822021484375, 127.94717407226562, -33.875762939453125, 33.42017364501953, 0.6677093505859375, 30.013826370239258, 144.7066650390625, 74.14830017089844, -62.344093322753906, 138.14022827148438, 149.86643981933594, 91.7578353881836, 28.30426025390625, 23.432167053222656, 127.98287200927734, 101.40803527832031, -36.306495666503906, 126.89089965820312, 5.709661483764648, 8.881301879882812, 137.25927734375, -0.1665973663330078, 114.4102554321289, 78.03237915039062, 153.6181640625, 113.09178161621094, 7.268260955810547, -44.362884521484375, 0.1590576171875, 125.21306610107422, 1.6516456604003906, 23.684547424316406, 20.203826904296875, 31.25394058227539, -9.83700180053711, 65.8583984375, -1.1276702880859375, -23.905574798583984, 141.15850830078125, 99.00613403320312, -22.840089797973633, 77.3501205444336, -12.7509765625, -73.68582153320312, 31.483596801757812, 8.202926635742188, -0.26259803771972656, -44.756500244140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000329.npy"} +{"epoch": 0.4973544973544973, "step": 330, "batch_size": 64, "mean": 43.419342041015625, "std": 71.19536590576172, "min": -141.939697265625, "p10": -47.29979705810547, "median": 35.43434524536133, "p90": 129.07528076171874, "max": 167.80799865722656, "pos_frac": 0.734375, "sample": [6.100547790527344, -29.08221435546875, -13.447027206420898, -112.32636260986328, 33.90839385986328, -141.939697265625, 105.57334899902344, 15.359283447265625, -23.576576232910156, 120.3494644165039, 117.966796875, 48.983001708984375, -87.06754302978516, -1.9589462280273438, 29.38888931274414, 135.98287963867188, 146.22738647460938, -65.77808380126953, 167.80799865722656, 128.9193572998047, 75.14241027832031, -1.2101173400878906, 98.69943237304688, 1.788503646850586, 125.60244750976562, 129.14210510253906, 5.2150115966796875, 10.702278137207031, -44.56184387207031, 13.224205017089844, 50.2413330078125, 96.9399185180664, -7.2011871337890625, 61.56644821166992, -64.42910766601562, 123.87886810302734, 95.78199768066406, 121.05538940429688, 100.43186950683594, 20.450023651123047, 7.80242919921875, 63.778167724609375, 43.00013732910156, 83.10537719726562, 114.8435287475586, 116.27226257324219, 2.821941375732422, 41.4181022644043, -0.799102783203125, 12.552017211914062, -6.16864013671875, 33.718292236328125, 135.92599487304688, 110.40525817871094, -21.494644165039062, 21.918212890625, 36.960296630859375, -48.47320556640625, 152.562744140625, -78.99269104003906, 93.2820816040039, 116.61129760742188, 11.640419006347656, 142.2967529296875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000330.npy"} +{"epoch": 0.4988662131519274, "step": 331, "batch_size": 64, "mean": 56.48115921020508, "std": 68.10791778564453, "min": -142.877197265625, "p10": -16.631608581542963, "median": 53.216758728027344, "p90": 138.8811248779297, "max": 221.1815643310547, "pos_frac": 0.84375, "sample": [146.5503387451172, 13.981178283691406, 28.275653839111328, 96.92898559570312, 103.25199890136719, 138.79244995117188, 97.24504089355469, 89.82546997070312, 77.447509765625, -9.705703735351562, 4.458538055419922, 166.11363220214844, 137.32545471191406, 138.91912841796875, 102.13453674316406, 11.099922180175781, 154.57620239257812, 42.01029968261719, 33.70697021484375, 142.79335021972656, 81.3887939453125, 6.593410491943359, 13.620635986328125, 20.492462158203125, -19.599853515625, 126.88493347167969, 89.13167572021484, 221.1815643310547, 17.913681030273438, 67.36471557617188, 62.70802307128906, 49.14850997924805, 134.66673278808594, 89.11505126953125, 3.7498931884765625, 0.46556854248046875, 53.370208740234375, -83.56797790527344, -74.65087890625, 84.20958709716797, -40.9957275390625, 149.5822296142578, 48.06813049316406, -0.275177001953125, 29.19211769104004, -142.877197265625, 53.06330871582031, 1.252044677734375, -28.235694885253906, 26.74625587463379, 24.56281280517578, 101.62709045410156, 110.74488830566406, 32.72996520996094, 46.20695495605469, 6.667350769042969, -0.9374608993530273, 120.92496490478516, 72.52337646484375, -79.06462097167969, 131.84420776367188, 72.8648681640625, 92.50180053710938, 126.16018676757812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000331.npy"} +{"epoch": 0.5003779289493575, "step": 332, "batch_size": 64, "mean": 46.33306884765625, "std": 60.922752380371094, "min": -75.0548324584961, "p10": -6.4986648559570295, "median": 24.365734100341797, "p90": 136.96165161132814, "max": 179.7081298828125, "pos_frac": 0.8125, "sample": [-32.656436920166016, 2.2223892211914062, 3.1645889282226562, 0.9981689453125, 16.870485305786133, 100.91197967529297, 23.082870483398438, 29.41606330871582, 23.784683227539062, 41.8781852722168, -2.6668167114257812, 179.7081298828125, 132.4519805908203, 76.72933959960938, 124.91995239257812, 22.81433868408203, 23.414260864257812, 0.3600959777832031, 90.65438842773438, 34.679473876953125, 79.41268157958984, 13.028671264648438, -70.87271118164062, 136.1659698486328, 88.55140686035156, 104.46129608154297, -75.0548324584961, 16.82964324951172, 8.123275756835938, -0.41718292236328125, 24.88465118408203, 137.3026580810547, 28.826873779296875, -4.4850006103515625, -7.361663818359375, 42.18211364746094, 1.677560806274414, 163.778564453125, -61.89793395996094, 3.380037307739258, 80.48068237304688, 110.35316467285156, 91.30462646484375, -4.060075759887695, 22.76067352294922, 0.5514755249023438, 77.54795837402344, 108.68829345703125, 110.42857360839844, 50.11625671386719, 159.1674346923828, 9.117485046386719, 60.8599739074707, -3.7271347045898438, 14.445869445800781, -19.989395141601562, 142.77999877929688, 7.351795196533203, 25.72967529296875, 137.94015502929688, 173.60018920898438, 93.62504577636719, -28.857250213623047, 23.846817016601562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000332.npy"} +{"epoch": 0.5018896447467877, "step": 333, "batch_size": 64, "mean": 51.451988220214844, "std": 59.72532272338867, "min": -88.33504486083984, "p10": -11.71493854522705, "median": 42.58345413208008, "p90": 141.38120422363284, "max": 185.69436645507812, "pos_frac": 0.8125, "sample": [15.039234161376953, -12.226644515991211, 19.369735717773438, 89.22564697265625, 22.761367797851562, 0.02600860595703125, 39.4613151550293, 81.60443115234375, 6.085559844970703, -2.35638427734375, 64.32848358154297, 70.91236877441406, 71.28742218017578, 105.83040618896484, 120.79046630859375, 28.981552124023438, 40.100433349609375, 144.58045959472656, 165.09814453125, 150.29876708984375, -4.8847808837890625, 45.783470153808594, 46.82384490966797, 33.26496887207031, 54.75407409667969, -49.89757537841797, -27.483707427978516, 52.761436462402344, 9.542167663574219, 46.51799774169922, 136.38058471679688, 137.19122314453125, -14.275955200195312, 57.16602325439453, 88.21734619140625, 38.99668502807617, 171.63296508789062, 4.802818298339844, 12.50937271118164, 30.845687866210938, -1.7487049102783203, 39.36677551269531, -88.33504486083984, 7.783224105834961, 50.947181701660156, -52.416015625, 185.69436645507812, 17.12018585205078, -10.520957946777344, 45.06647491455078, 12.776351928710938, -3.02166748046875, 83.98419189453125, 143.17691040039062, 10.805421829223633, -13.052879333496094, 85.02777862548828, 15.107124328613281, 129.97000122070312, 61.168006896972656, 162.67880249023438, 78.01122283935547, 123.94719696044922, 117.5438003540039], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000333.npy"} +{"epoch": 0.5034013605442177, "step": 334, "batch_size": 64, "mean": 36.76668930053711, "std": 68.86322784423828, "min": -118.65348052978516, "p10": -37.425795745849605, "median": 23.161453247070312, "p90": 133.60936889648437, "max": 194.95559692382812, "pos_frac": 0.6875, "sample": [-55.22020721435547, -118.65348052978516, 56.13135528564453, 91.9336166381836, 56.931671142578125, -16.772247314453125, -92.74906921386719, 110.6078872680664, 16.95354461669922, -111.94632720947266, -0.900238037109375, 194.95559692382812, -11.799785614013672, 64.86311340332031, 4.503456115722656, 86.65164947509766, -10.9703369140625, -20.348024368286133, 48.1661376953125, 85.20916748046875, 87.32682800292969, 154.07717895507812, 31.02947235107422, 65.5036849975586, 73.2833251953125, -54.980655670166016, 23.8729248046875, 1.003549575805664, 112.46855163574219, 7.750522613525391, -3.7328052520751953, 0.5405502319335938, 144.01358032226562, -83.5152587890625, 84.85497283935547, 136.37442016601562, 51.409912109375, 10.51177978515625, 42.53587341308594, -5.812705993652344, 9.386550903320312, -23.465103149414062, -6.8245849609375, -8.79400634765625, 133.64968872070312, -1.3814926147460938, 0.8798294067382812, 10.976016998291016, -34.697418212890625, 114.37608337402344, 105.54251861572266, 56.99738311767578, -33.52716064453125, 78.63748931884766, -38.59510040283203, 22.449981689453125, 47.36781311035156, 146.32791137695312, 2.374420166015625, 15.284952163696289, 112.62615966796875, 80.4383773803711, 173.45938110351562, 133.51528930664062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000334.npy"} +{"epoch": 0.5049130763416477, "step": 335, "batch_size": 64, "mean": 41.21553039550781, "std": 68.2203140258789, "min": -99.630615234375, "p10": -37.08243103027343, "median": 25.744760513305664, "p90": 144.29544067382812, "max": 176.30569458007812, "pos_frac": 0.75, "sample": [75.07667541503906, 62.529075622558594, -37.641937255859375, 176.30569458007812, 21.469390869140625, 116.17977905273438, 37.86906433105469, 2.1029529571533203, 168.50973510742188, 86.55561065673828, 153.4000244140625, 132.05267333984375, 30.415634155273438, 57.77601623535156, 152.21963500976562, 136.91334533691406, 9.123008728027344, 64.57950592041016, 17.46564483642578, 145.4579315185547, -40.156002044677734, 0.0681915283203125, 41.76270294189453, 151.35699462890625, -55.31842041015625, 16.979217529296875, 90.71298217773438, -26.33538055419922, -35.77691650390625, 67.3040542602539, 114.06053161621094, 9.222190856933594, 7.492454528808594, 59.042259216308594, 113.86264038085938, -31.851268768310547, 143.72378540039062, -11.526569366455078, 21.562782287597656, 144.54043579101562, 7.9724884033203125, -6.27635383605957, 22.4649658203125, 30.195228576660156, 58.95841979980469, 98.87279510498047, -12.680763244628906, -94.95458984375, 26.491825103759766, 1.996683120727539, 24.997695922851562, -35.61894607543945, -7.523582458496094, -99.630615234375, -91.6854248046875, -53.32195281982422, 129.19728088378906, 84.57810974121094, 2.7746734619140625, 75.982177734375, -10.128913879394531, 6.681877136230469, 15.337982177734375, 74.0267333984375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000335.npy"} +{"epoch": 0.5064247921390779, "step": 336, "batch_size": 64, "mean": 42.551612854003906, "std": 70.7847671508789, "min": -94.9492416381836, "p10": -43.87224426269531, "median": 28.031761169433594, "p90": 144.20301513671876, "max": 230.39027404785156, "pos_frac": 0.765625, "sample": [-52.841522216796875, 2.20062255859375, 139.36248779296875, 36.32020568847656, 212.05245971679688, 138.81591796875, 68.68951416015625, -1.8865280151367188, 146.27752685546875, 1.5980205535888672, 3.397188186645508, -6.846155166625977, 150.86146545410156, -4.967864990234375, 135.0846405029297, 20.256389617919922, 6.498771667480469, 78.2919921875, 167.67184448242188, -76.49317932128906, -39.71234130859375, 55.837646484375, 166.26553344726562, 44.689735412597656, 4.6966552734375, 102.427490234375, 35.39540481567383, -94.9492416381836, -30.955352783203125, -51.10181427001953, 159.5680389404297, -59.36511993408203, 41.562644958496094, 28.559722900390625, 7.991840362548828, 9.126935958862305, 0.9947052001953125, -11.075111389160156, 48.04778289794922, 118.81065368652344, 14.467300415039062, -16.24083709716797, 54.09043884277344, 11.953990936279297, 124.54930114746094, 33.01214599609375, 45.626556396484375, 7.1788330078125, 24.76923942565918, 115.68305969238281, 10.672332763671875, 0.097412109375, 68.1737060546875, 127.57997131347656, 230.39027404785156, 51.217857360839844, -45.655059814453125, 13.021575927734375, 81.17858123779297, -22.448989868164062, 32.2271728515625, 85.10888671875, 27.503799438476562, -52.01399230957031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000336.npy"} +{"epoch": 0.5079365079365079, "step": 337, "batch_size": 64, "mean": 33.22272491455078, "std": 62.960208892822266, "min": -120.07857513427734, "p10": -34.93184738159179, "median": 27.341251373291016, "p90": 116.42899627685547, "max": 185.19793701171875, "pos_frac": 0.71875, "sample": [8.007743835449219, -79.3261489868164, -120.07857513427734, -21.796714782714844, 31.903228759765625, 107.29867553710938, -11.792848587036133, 112.50291442871094, 34.478057861328125, 4.340553283691406, 129.79901123046875, 17.25615692138672, 45.90148162841797, -102.95030975341797, -43.12432861328125, -17.84276580810547, 33.65357971191406, 126.16390991210938, 20.29859161376953, -16.659194946289062, 6.206474304199219, 0.0052433013916015625, -22.135414123535156, -65.56509399414062, 97.56815338134766, 81.2587890625, -11.546218872070312, 41.49304962158203, 49.80029296875, 152.81373596191406, 25.96947479248047, 3.4622116088867188, 126.16360473632812, -8.039260864257812, 101.90106201171875, 59.04937744140625, 116.94796752929688, -11.174484252929688, 2.8183822631835938, 72.78816223144531, 130.287353515625, 6.2055511474609375, 115.21806335449219, 28.713027954101562, 61.92814636230469, -24.054519653320312, 62.061920166015625, 25.607559204101562, 51.55517578125, 23.267669677734375, 79.01905822753906, 185.19793701171875, -1.8830490112304688, -19.3291015625, 31.202041625976562, 90.59266662597656, 8.977792739868164, -39.59355926513672, 85.63113403320312, 68.96207427978516, -88.70573425292969, 20.785476684570312, 107.69670104980469, 39.092403411865234], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000337.npy"} +{"epoch": 0.509448223733938, "step": 338, "batch_size": 64, "mean": 34.49760818481445, "std": 65.88002014160156, "min": -139.17752075195312, "p10": -33.62076034545898, "median": 19.954204559326172, "p90": 125.89161529541016, "max": 157.16470336914062, "pos_frac": 0.71875, "sample": [-55.63720703125, 22.823856353759766, 127.10888671875, 120.60006713867188, 123.05131530761719, 101.06011199951172, -84.3926773071289, 105.16097259521484, 23.533554077148438, 135.7299346923828, 155.77920532226562, 16.114784240722656, -0.8444595336914062, 34.63609313964844, 5.211273193359375, -83.07904052734375, 9.01751708984375, -95.3865966796875, -0.027191162109375, 2.3963241577148438, -26.165428161621094, 119.21084594726562, 17.084552764892578, -3.197603225708008, 9.545890808105469, 74.10818481445312, -139.17752075195312, 91.02547454833984, 75.58694458007812, 64.8864974975586, -3.7751235961914062, 82.35824584960938, 13.287006378173828, 33.42586898803711, 56.130409240722656, 69.84928894042969, 9.740028381347656, 16.881561279296875, 157.16470336914062, 12.006484985351562, 16.485084533691406, 120.42758178710938, -25.814590454101562, 95.41877746582031, 5.094203948974609, 23.937347412109375, -34.103858947753906, -32.4935302734375, 29.212158203125, -23.373828887939453, 25.045860290527344, 147.17823791503906, 7.266376495361328, 4.11273193359375, 55.435184478759766, 69.91828918457031, -1.7239837646484375, 135.51834106445312, 109.20287322998047, -64.16629028320312, -22.239442825317383, 37.82622528076172, 141.82626342773438, -4.976070404052734], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000338.npy"} +{"epoch": 0.5109599395313681, "step": 339, "batch_size": 64, "mean": 40.781593322753906, "std": 61.73299026489258, "min": -110.45777893066406, "p10": -30.931806182861315, "median": 36.023475646972656, "p90": 130.0973182678223, "max": 167.80984497070312, "pos_frac": 0.765625, "sample": [51.70209503173828, 37.41454315185547, 12.300003051757812, -19.772987365722656, -13.225028991699219, 133.2892608642578, 4.9312591552734375, 37.31690979003906, 12.424076080322266, -67.7345199584961, 52.153778076171875, -15.71826171875, 9.45352554321289, 33.961727142333984, 47.20884323120117, 9.515861511230469, -76.8105239868164, 108.06564331054688, 111.63619995117188, 6.72099494934082, 122.64945220947266, 32.335777282714844, 70.2182846069336, 71.66568756103516, 24.815162658691406, 136.65277099609375, 1.8156280517578125, 29.34457778930664, -44.51068878173828, 61.34730911254883, 55.38859176635742, 85.24496459960938, 150.53622436523438, 150.87283325195312, 72.97733306884766, 5.669384002685547, 88.36991882324219, -35.71415710449219, 89.77529907226562, 61.58697509765625, 148.61215209960938, 39.06101989746094, -16.03700065612793, -11.520408630371094, 34.73004150390625, -0.6758880615234375, 34.270904541015625, 77.29141235351562, -83.63109588623047, -41.291778564453125, 11.298273086547852, 6.185573577880859, 98.86091613769531, 116.14906311035156, -110.45777893066406, 167.80984497070312, -7.06268310546875, 46.660369873046875, 6.1237335205078125, 99.3625717163086, 83.11170959472656, 48.41592025756836, -0.1831188201904297, 157.06361389160156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000339.npy"} +{"epoch": 0.5124716553287982, "step": 340, "batch_size": 64, "mean": 41.218807220458984, "std": 74.30816650390625, "min": -139.19955444335938, "p10": -42.79327697753905, "median": 22.483112335205078, "p90": 146.99323425292968, "max": 164.55844116210938, "pos_frac": 0.625, "sample": [59.34538269042969, 138.68490600585938, 18.711627960205078, 65.81188201904297, -3.3444976806640625, 156.26588439941406, 1.148305892944336, -2.390146255493164, -31.792266845703125, 159.50390625, -0.08400726318359375, 80.56040954589844, 51.19374084472656, 114.23115539550781, 155.32391357421875, 102.3936767578125, 16.252931594848633, -65.35102844238281, 62.93963623046875, 82.70074462890625, -22.138216018676758, -12.939844131469727, -64.24493408203125, 83.58722686767578, -13.11474609375, 160.50111389160156, -11.04827880859375, 131.06732177734375, -22.22344207763672, 145.39920043945312, -98.22515869140625, 123.1759033203125, 8.336334228515625, 33.63836669921875, 149.32359313964844, 53.04897689819336, 127.7064208984375, -0.2513561248779297, -12.056777954101562, 142.1028594970703, 97.04783630371094, -26.270156860351562, -1.9290924072265625, 147.6763916015625, 55.89561080932617, -7.762598037719727, -75.71330261230469, -71.48150634765625, 3.8244781494140625, 136.03326416015625, -5.0607757568359375, 50.699832916259766, 76.33368682861328, -15.077600479125977, -139.19955444335938, -47.50799560546875, 143.3652801513672, 14.383781433105469, 59.164459228515625, 164.55844116210938, 26.254596710205078, 5.265739440917969, -21.012481689453125, 4.764701843261719], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000340.npy"} +{"epoch": 0.5139833711262283, "step": 341, "batch_size": 64, "mean": 46.7509765625, "std": 70.32353210449219, "min": -111.98063659667969, "p10": -36.22440795898437, "median": 32.32845497131348, "p90": 145.6838821411133, "max": 164.64376831054688, "pos_frac": 0.75, "sample": [-66.51638793945312, 71.56905364990234, 135.44906616210938, 60.858062744140625, 115.24942779541016, 71.78530883789062, 122.9603500366211, 164.64376831054688, 147.55126953125, -33.033905029296875, 131.6940460205078, 27.554641723632812, -93.9704360961914, -6.089450836181641, 25.137540817260742, 3.904582977294922, 122.34516143798828, 4.628547668457031, 114.55622863769531, 150.61764526367188, 109.51066589355469, 144.80517578125, 146.0604705810547, 70.4278793334961, -89.22216796875, 136.1004180908203, 97.30113220214844, 10.022022247314453, -12.010780334472656, -16.277435302734375, 32.86821365356445, 14.004196166992188, -21.036346435546875, 2.7201919555664062, 23.594345092773438, 133.58270263671875, 48.51265335083008, 16.328107833862305, 69.46331024169922, -52.23127746582031, -31.135108947753906, -48.59771728515625, 54.67510223388672, 147.867431640625, 6.5578155517578125, 149.55819702148438, 31.7886962890625, 77.27510070800781, 94.96158599853516, 155.19668579101562, 62.124847412109375, 10.568756103515625, 101.66737365722656, -37.591766357421875, 5.684814453125, 100.62689208984375, 74.98090362548828, 29.49706268310547, -1.9179706573486328, -22.50579833984375, -19.262596130371094, 11.58624267578125, 15.018461227416992, -111.98063659667969], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000341.npy"} +{"epoch": 0.5154950869236583, "step": 342, "batch_size": 64, "mean": 48.285316467285156, "std": 68.95088195800781, "min": -102.50482940673828, "p10": -30.734461975097645, "median": 30.8187255859375, "p90": 146.90867614746094, "max": 213.3849639892578, "pos_frac": 0.734375, "sample": [30.671791076660156, 25.145172119140625, -1.8093032836914062, -9.008529663085938, 4.498620986938477, 135.38421630859375, 23.824665069580078, 116.827880859375, -45.34071350097656, 10.236480712890625, -4.403581619262695, 49.47412109375, -2.4890193939208984, 142.14923095703125, 4.108421325683594, -43.935546875, 0.7642421722412109, -102.50482940673828, -2.4879817962646484, -20.78447723388672, 23.622478485107422, 140.78956604003906, 107.04780578613281, 145.4154510498047, -34.998741149902344, 55.03778076171875, 36.43865966796875, 70.24916076660156, 114.07575988769531, 49.33242416381836, 44.457096099853516, 49.61062240600586, 30.954376220703125, 117.46986389160156, 40.40586853027344, -12.494237899780273, 113.17930603027344, 12.611373901367188, -41.245849609375, 140.72679138183594, 20.815933227539062, 152.044921875, 82.89788818359375, 76.85325622558594, -46.808929443359375, 157.72999572753906, 0.7939376831054688, -4.830585479736328, 213.3849639892578, 168.8298797607422, 99.20088958740234, -72.75679779052734, 21.19164276123047, 147.5486297607422, -14.944698333740234, 149.8570098876953, 67.32991027832031, -4.421440124511719, 4.918006896972656, 59.55179977416992, 63.308937072753906, 30.683074951171875, 13.34893798828125, 190.7266845703125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000342.npy"} +{"epoch": 0.5170068027210885, "step": 343, "batch_size": 64, "mean": 32.68980407714844, "std": 63.00702667236328, "min": -130.55462646484375, "p10": -15.113537597656249, "median": 20.61648941040039, "p90": 106.83208770751956, "max": 228.8349609375, "pos_frac": 0.75, "sample": [62.75396728515625, 10.374549865722656, -8.879280090332031, 7.0076141357421875, -6.8638763427734375, 69.70243072509766, -13.262664794921875, -0.8619289398193359, -4.426788330078125, -7.305824279785156, -121.12413787841797, 17.558685302734375, 47.97462463378906, 56.820350646972656, 228.8349609375, -6.170192718505859, 132.56674194335938, 169.5384979248047, 109.7059097290039, 91.77284240722656, 34.256622314453125, 5.630289077758789, 74.5882568359375, 99.58594512939453, 9.127758026123047, 54.62592697143555, 16.427093505859375, -41.37443542480469, 41.89739227294922, -4.375814437866211, -82.67932891845703, 41.559593200683594, 97.56402587890625, 21.219676971435547, 29.148040771484375, 4.1085357666015625, 80.09061431884766, 110.4189453125, -116.97514343261719, 143.95912170410156, -15.906768798828125, 48.128662109375, 32.596824645996094, 142.813232421875, 47.22174072265625, 15.879791259765625, 60.0401611328125, 20.013301849365234, 15.0465087890625, 100.12650299072266, 93.16313934326172, 8.177040100097656, 7.684013366699219, 65.7696304321289, 44.881019592285156, 24.2115478515625, 1.557586669921875, 15.9615478515625, 50.59698486328125, 16.27509307861328, -130.55462646484375, -3.3352508544921875, -29.130176544189453, 6.41059684753418], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000343.npy"} +{"epoch": 0.5185185185185185, "step": 344, "batch_size": 64, "mean": 49.046180725097656, "std": 67.06901550292969, "min": -93.7380599975586, "p10": -30.70462474822998, "median": 39.694040298461914, "p90": 131.48955535888672, "max": 242.06491088867188, "pos_frac": 0.75, "sample": [-60.76411437988281, 123.9876937866211, 25.078895568847656, 38.07960891723633, 141.49493408203125, -2.4188785552978516, 9.312625885009766, 26.14609146118164, 21.222640991210938, 61.647979736328125, 26.193099975585938, 11.30035400390625, 18.46455192565918, 95.71549987792969, 77.875, 53.29244613647461, 76.30918884277344, 242.06491088867188, -9.829902648925781, 78.16854858398438, -31.218629837036133, -29.505279541015625, -37.905677795410156, 162.86032104492188, 3.564220428466797, -15.886360168457031, -49.11009216308594, 2.5356063842773438, 164.3928985595703, 82.72691345214844, -38.26715087890625, 151.902587890625, -8.427467346191406, 99.96580505371094, 51.91851806640625, 138.33139038085938, 131.44036865234375, 16.093551635742188, 84.981201171875, -86.15351104736328, -2.1719322204589844, 9.102764129638672, -16.951332092285156, 4.031415939331055, -13.084175109863281, -1.051004409790039, 131.51063537597656, 127.10740661621094, 59.700714111328125, 74.7503662109375, 89.7474594116211, 41.3084716796875, 95.16287994384766, 14.131624221801758, 130.47314453125, 15.957963943481445, 82.41693115234375, 96.8061752319336, 17.829818725585938, 108.58809661865234, -93.7380599975586, 94.49267578125, 110.12234497070312, 115.13084411621094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000344.npy"} +{"epoch": 0.5200302343159486, "step": 345, "batch_size": 64, "mean": 43.28343200683594, "std": 66.59827423095703, "min": -104.20065307617188, "p10": -28.172695159912106, "median": 33.44426727294922, "p90": 128.6061935424805, "max": 190.7712860107422, "pos_frac": 0.765625, "sample": [49.620025634765625, 15.939945220947266, 162.90435791015625, -88.45633697509766, 11.716106414794922, 7.90911865234375, 2.1503448486328125, -45.90986633300781, 32.666770935058594, -4.777900695800781, 124.72172546386719, 113.62774658203125, 97.78804779052734, 93.9207992553711, -55.7109260559082, 105.56072235107422, -73.19181060791016, 47.679588317871094, 40.04266357421875, 103.18922424316406, 190.7712860107422, 7.340887069702148, 113.20381164550781, 60.57478332519531, 102.26451110839844, -7.8861083984375, 8.3341064453125, 38.04003143310547, 0.711181640625, 34.221763610839844, 73.10657501220703, 162.47311401367188, 111.48457336425781, 53.81523895263672, 49.87989807128906, -98.7935791015625, 147.876708984375, 168.5594482421875, 77.79145812988281, -17.04665756225586, 130.27096557617188, 26.50084686279297, -30.260543823242188, 123.35975646972656, 45.45344543457031, -21.453899383544922, 32.175941467285156, -23.301048278808594, 20.160186767578125, 28.287010192871094, 26.008407592773438, 17.93596649169922, -12.060340881347656, 29.954437255859375, -5.925567626953125, 90.30662536621094, 0.6302242279052734, -104.20065307617188, -22.39641571044922, 23.659400939941406, 68.72064971923828, 71.21647644042969, 95.23223876953125, 141.75216674804688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000345.npy"} +{"epoch": 0.5215419501133787, "step": 346, "batch_size": 64, "mean": 51.671791076660156, "std": 70.61689758300781, "min": -145.36322021484375, "p10": -32.468910598754874, "median": 38.96010780334473, "p90": 142.0842468261719, "max": 181.91024780273438, "pos_frac": 0.765625, "sample": [102.84561920166016, 122.0108642578125, 93.28555297851562, 123.50662994384766, 92.76516723632812, 58.55216979980469, 24.786758422851562, 69.43482208251953, 129.86587524414062, 155.23135375976562, 143.12582397460938, 5.4631195068359375, 96.8922119140625, 129.04049682617188, -36.881412506103516, 148.51673889160156, -94.04591369628906, 36.59415054321289, -22.173072814941406, 41.77473068237305, 74.91227722167969, 82.18173217773438, 66.45201110839844, 41.32606506347656, 131.73545837402344, 181.91024780273438, -145.36322021484375, 32.075862884521484, 11.84218978881836, -82.74172973632812, 9.886932373046875, -48.924949645996094, 132.4562530517578, -2.7956581115722656, 32.57252883911133, 35.266212463378906, 8.097206115722656, -11.110893249511719, 114.8909912109375, 129.87615966796875, 160.93560791015625, 107.6373291015625, -10.308128356933594, 158.3497772216797, 21.502471923828125, 28.59490203857422, 94.71897888183594, 52.68916320800781, -50.33978271484375, 76.48249816894531, 20.188140869140625, 18.213134765625, 24.782926559448242, -2.554859161376953, -52.663414001464844, 14.709526062011719, 26.38842010498047, 112.43138122558594, -14.945106506347656, 165.14212036132812, -11.581775665283203, -2.2214603424072266, 14.051528930664062, 139.65390014648438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000346.npy"} +{"epoch": 0.5230536659108088, "step": 347, "batch_size": 64, "mean": 39.41404342651367, "std": 63.5050048828125, "min": -89.09062194824219, "p10": -35.80510940551758, "median": 26.89834213256836, "p90": 137.2056777954102, "max": 171.5556640625, "pos_frac": 0.6875, "sample": [43.53169250488281, -2.4107017517089844, 34.068565368652344, 76.26414489746094, -84.17378234863281, 25.32129669189453, 90.94699096679688, 55.48548126220703, 92.36952209472656, 127.24732971191406, 1.0261383056640625, 122.75875854492188, 21.4052734375, -70.21764373779297, -42.781158447265625, 170.05557250976562, 23.219619750976562, 37.3796272277832, -11.537445068359375, 12.227729797363281, 28.475387573242188, 4.688028335571289, 73.1839599609375, 0.578460693359375, -38.56083679199219, 19.637943267822266, 82.42906951904297, 119.13541412353516, 146.10635375976562, -37.695098876953125, 30.73377227783203, -18.54218101501465, -31.39513397216797, 115.34859466552734, -7.917638778686523, 64.15005493164062, -5.8070526123046875, 94.41978454589844, 15.27947998046875, 45.023765563964844, 42.78080368041992, 16.410255432128906, -14.455352783203125, 94.10444641113281, 4.946979522705078, 153.4534149169922, -39.79083251953125, -10.463630676269531, 171.5556640625, 157.98785400390625, 147.93821716308594, 116.11265563964844, -1.061431884765625, 39.11622619628906, -89.09062194824219, 54.974853515625, 46.24413299560547, 4.142932891845703, -2.188518524169922, -1.2183399200439453, -16.84244155883789, -1.6610794067382812, 141.47354125976562, 86.56986236572266], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000347.npy"} +{"epoch": 0.5245653817082389, "step": 348, "batch_size": 64, "mean": 47.37086486816406, "std": 73.0594711303711, "min": -114.03347778320312, "p10": -32.77149505615234, "median": 30.316761016845703, "p90": 155.71249084472657, "max": 222.31976318359375, "pos_frac": 0.703125, "sample": [127.17387390136719, 144.28445434570312, 13.6378173828125, 2.2184524536132812, 159.1124267578125, 56.92710876464844, -31.15948486328125, -14.964447021484375, -114.03347778320312, 4.401832580566406, 173.31588745117188, -42.19563293457031, 30.386764526367188, 55.83357620239258, 108.02215576171875, 130.91897583007812, 30.24675750732422, 169.28375244140625, 36.88643264770508, 169.57012939453125, 14.03091049194336, 118.87149047851562, 133.0227813720703, 12.379066467285156, 10.465911865234375, 138.82081604003906, -5.913909912109375, 134.21290588378906, -34.878395080566406, -24.755172729492188, 79.187744140625, -0.6870498657226562, 4.207239151000977, 222.31976318359375, 46.03886413574219, -75.48210144042969, 52.18899917602539, -55.84917068481445, -17.28331756591797, 76.88488006591797, 157.55404663085938, 148.96839904785156, 44.805877685546875, -0.26333045959472656, 49.479736328125, -15.270393371582031, -34.6124267578125, -33.46235656738281, 3.5106582641601562, 69.28729248046875, -16.892040252685547, 164.15411376953125, -14.519815444946289, 63.48326873779297, 85.69947814941406, 6.614799499511719, 67.75035095214844, 23.8338623046875, -24.017425537109375, 9.861486434936523, -11.075912475585938, 84.52188110351562, 151.41552734375, 13.258678436279297], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000348.npy"} +{"epoch": 0.5260770975056689, "step": 349, "batch_size": 64, "mean": 46.96872329711914, "std": 68.36551666259766, "min": -99.50178527832031, "p10": -20.71122817993164, "median": 34.348609924316406, "p90": 144.72497100830077, "max": 182.00050354003906, "pos_frac": 0.6875, "sample": [-55.05574417114258, 38.45208740234375, 144.7349090576172, 35.73656463623047, 45.790382385253906, -1.9620094299316406, 73.34484100341797, 148.82374572753906, 56.06278991699219, 16.594985961914062, -3.0375308990478516, 27.219266891479492, 125.32139587402344, 18.400009155273438, 32.960655212402344, 96.29750061035156, 56.78718566894531, -55.96161651611328, -99.50178527832031, 142.57334899902344, 40.47276306152344, 121.56761169433594, -23.205673217773438, 3.2004852294921875, 121.54280090332031, 5.4396820068359375, 5.277732849121094, 58.39316177368164, -11.348403930664062, 131.6824951171875, 109.9831314086914, 122.886962890625, 4.7505645751953125, 21.126218795776367, -3.7694854736328125, 142.29217529296875, 21.560670852661133, 174.86305236816406, -83.42220306396484, 51.91807174682617, 172.1697998046875, 2.3895950317382812, 7.1611480712890625, 51.1700439453125, 66.76220703125, 153.7041015625, 144.7017822265625, -3.4232139587402344, -20.09893798828125, -3.025754928588867, 77.43803405761719, -15.552932739257812, -5.5533447265625, -3.4350204467773438, 44.98499298095703, 174.20840454101562, -24.27911376953125, -20.702987670898438, -20.714759826660156, 122.82524108886719, -0.3440113067626953, -8.333320617675781, 73.15320587158203, 182.00050354003906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000349.npy"} +{"epoch": 0.527588813303099, "step": 350, "batch_size": 64, "mean": 60.128379821777344, "std": 66.33708953857422, "min": -79.91622924804688, "p10": -16.9440071105957, "median": 64.61466979980469, "p90": 152.37058715820314, "max": 193.16224670410156, "pos_frac": 0.78125, "sample": [127.4872817993164, -18.15570068359375, 73.804443359375, -8.104080200195312, 90.74332427978516, 16.149187088012695, 154.45077514648438, 85.89134216308594, 80.84858703613281, 133.24295043945312, 12.59417724609375, -43.40614318847656, 68.67013549804688, 97.57440185546875, 51.23102569580078, 74.36808776855469, 122.3141098022461, 14.547657012939453, -10.231258392333984, -7.132795333862305, 75.05072021484375, 80.53305053710938, -75.6980972290039, 101.10810852050781, 62.86376190185547, 2.4845962524414062, -79.91622924804688, 193.16224670410156, -10.832780838012695, 32.32913589477539, 126.3500747680664, -42.329498291015625, 131.39263916015625, 9.293746948242188, 115.15052795410156, 157.95053100585938, 68.18978118896484, 135.74801635742188, 159.391845703125, 191.3690185546875, 50.29523468017578, 166.462646484375, 147.51681518554688, -14.116722106933594, 43.39936447143555, -1.83154296875, 10.246955871582031, 12.635961532592773, -32.226139068603516, 66.3655776977539, 79.93817138671875, 52.585208892822266, 1.8812198638916016, 53.27531433105469, 42.015037536621094, -51.938018798828125, 71.2911376953125, 51.731231689453125, -7.3124237060546875, 56.313629150390625, 154.47952270507812, 111.6075439453125, 92.99988555908203, 140.12208557128906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000350.npy"} +{"epoch": 0.5291005291005291, "step": 351, "batch_size": 64, "mean": 45.15464782714844, "std": 74.24632263183594, "min": -150.6239013671875, "p10": -43.19097900390624, "median": 35.467830657958984, "p90": 136.6725006103516, "max": 151.49627685546875, "pos_frac": 0.75, "sample": [-3.928384780883789, 107.29277801513672, 144.33636474609375, 114.8393783569336, -1.6083641052246094, 121.88059997558594, -13.29501724243164, 33.264801025390625, 150.33169555664062, 29.105758666992188, 20.158447265625, 139.47625732421875, 19.428434371948242, -14.284774780273438, 24.154476165771484, -16.42975616455078, 13.036941528320312, 8.965171813964844, 105.66797637939453, 91.71089172363281, 104.32787322998047, -88.59241485595703, 146.56674194335938, 12.613784790039062, 130.13040161132812, 151.49627685546875, 75.99862670898438, 110.90235900878906, -150.6239013671875, 44.129150390625, 123.66361999511719, -69.1917724609375, 92.34368896484375, -1.214202880859375, 109.46147155761719, -47.16613006591797, -51.12090301513672, 126.00448608398438, 37.670860290527344, 26.270511627197266, 87.64496612548828, 150.2706298828125, 25.868194580078125, -33.801124572753906, 79.57470703125, 26.475601196289062, 70.05299377441406, 64.65455627441406, 5.3570098876953125, 95.86174774169922, -33.915626525878906, 1.8290519714355469, 104.27316284179688, 90.9839096069336, 146.12782287597656, 32.39239501953125, 11.426666259765625, 97.37733459472656, -150.3870391845703, 14.721555709838867, -141.7255401611328, 97.61793518066406, 91.99531555175781, -2.5531005859375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000351.npy"} +{"epoch": 0.5306122448979592, "step": 352, "batch_size": 64, "mean": 48.034217834472656, "std": 68.9246826171875, "min": -106.74618530273438, "p10": -19.252674293518066, "median": 32.93823051452637, "p90": 140.90152282714843, "max": 249.49716186523438, "pos_frac": 0.71875, "sample": [130.1855926513672, 176.8634033203125, 130.97413635253906, 8.699569702148438, 140.32083129882812, -102.91189575195312, -8.260082244873047, -0.5510711669921875, 31.310558319091797, 65.75283813476562, 66.14185333251953, 110.59231567382812, -65.84164428710938, -2.153789520263672, 64.25775146484375, 25.2938232421875, -21.02484130859375, -5.2432098388671875, -53.541770935058594, 19.2608642578125, 92.72219848632812, 65.91456604003906, 21.946456909179688, 150.64117431640625, 143.36795043945312, 75.82351684570312, 29.95574951171875, -106.74618530273438, 37.716426849365234, -15.18350601196289, 22.93758773803711, -0.5691127777099609, 12.96417236328125, 76.04107666015625, 43.63529968261719, 85.52203369140625, 24.556081771850586, 139.76510620117188, 153.5000457763672, 43.207176208496094, 141.150390625, -12.659721374511719, 249.49716186523438, 14.139314651489258, 84.14183807373047, 133.19683837890625, -19.919288635253906, 21.165191650390625, -17.697240829467773, 48.84920883178711, -2.4699554443359375, 74.30111694335938, 39.468170166015625, 122.29456329345703, 131.79901123046875, 2.4680023193359375, -27.867835998535156, 148.4449462890625, -12.14200210571289, -1.9450225830078125, 0.9474639892578125, 92.68002319335938, 34.56590270996094, 21.938753128051758], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000352.npy"} +{"epoch": 0.5321239606953893, "step": 353, "batch_size": 64, "mean": 48.601470947265625, "std": 67.32315063476562, "min": -156.17796325683594, "p10": -12.282382965087889, "median": 29.160648345947266, "p90": 138.23888702392577, "max": 162.17843627929688, "pos_frac": 0.71875, "sample": [83.40906524658203, 160.3958740234375, -45.32821273803711, 48.42597579956055, -81.29898071289062, 25.537364959716797, 86.98551177978516, -12.825462341308594, 155.44471740722656, 25.638336181640625, -0.7561988830566406, 32.682960510253906, 85.99380493164062, -11.01519775390625, 138.3575897216797, 14.352052688598633, 40.43663024902344, 117.6185073852539, 112.23612976074219, 137.9619140625, 122.90553283691406, 155.9439697265625, 2.2672901153564453, 85.29720306396484, -13.49957275390625, -4.521205902099609, 152.61996459960938, 24.587181091308594, 125.0085678100586, 76.28399658203125, 79.2298583984375, -2.946613311767578, 75.65794372558594, -0.12215042114257812, -156.17796325683594, 133.2890625, -54.48809814453125, -33.14432144165039, 132.90773010253906, 131.5408935546875, 73.65438842773438, 141.3333740234375, 162.17843627929688, 2.1092910766601562, -8.56622314453125, 25.408145904541016, 109.47248840332031, 17.224679946899414, -3.470752716064453, 16.039459228515625, 38.55110168457031, 20.850112915039062, -5.8662567138671875, 36.18748474121094, -0.3236198425292969, 19.764236450195312, 7.947456359863281, -0.9374542236328125, -6.43817138671875, 9.791900634765625, 117.6121826171875, 1.9199981689453125, 135.22854614257812, 53.931785583496094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000353.npy"} +{"epoch": 0.5336356764928194, "step": 354, "batch_size": 64, "mean": 54.04368591308594, "std": 71.4162826538086, "min": -101.82670593261719, "p10": -48.314458847045884, "median": 50.363616943359375, "p90": 148.01138153076172, "max": 178.521240234375, "pos_frac": 0.765625, "sample": [167.41415405273438, 46.12320327758789, -30.022865295410156, 110.71124267578125, -58.221229553222656, 49.578330993652344, 22.364273071289062, 105.64806365966797, 132.68295288085938, 6.583362579345703, 117.51333618164062, 148.9406280517578, 90.01361846923828, 52.583351135253906, 21.07665252685547, 1.1582298278808594, 133.39859008789062, -34.6695671081543, 129.54986572265625, 178.521240234375, 71.92056274414062, 140.12469482421875, 64.99421691894531, 62.35844421386719, -79.18273162841797, -1.967824935913086, -101.82670593261719, 120.01991271972656, 40.830604553222656, 48.89411163330078, 39.67352294921875, 106.54832458496094, 147.9517059326172, 51.192840576171875, 48.9984130859375, 27.99378204345703, 72.13058471679688, -60.95611572265625, 148.03695678710938, 14.54107666015625, 96.00714874267578, 138.32595825195312, -54.162269592285156, -72.10232543945312, 160.45260620117188, -63.80845642089844, 160.4073944091797, 125.67474365234375, 10.291379928588867, -9.531486511230469, 33.76616668701172, 51.148902893066406, 111.56867980957031, 150.04928588867188, 52.609737396240234, 22.893840789794922, -11.449272155761719, 7.962406158447266, -16.60846710205078, 98.23548889160156, 37.95014953613281, 130.70362854003906, -32.27128601074219, -22.541683197021484], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000354.npy"} +{"epoch": 0.5351473922902494, "step": 355, "batch_size": 64, "mean": 55.343788146972656, "std": 76.34100341796875, "min": -123.06583404541016, "p10": -48.41522903442383, "median": 58.68581771850586, "p90": 149.27842712402344, "max": 189.2913818359375, "pos_frac": 0.734375, "sample": [89.60966491699219, 164.36187744140625, -48.482330322265625, 7.0669097900390625, 157.15875244140625, 69.11764526367188, 35.735984802246094, -16.34690284729004, -48.25865936279297, 68.81307220458984, 71.89073181152344, 13.931060791015625, 80.99931335449219, -55.85040283203125, 131.88177490234375, 114.3726806640625, -3.786273956298828, 63.46109390258789, -76.254150390625, 112.07906341552734, -53.59367370605469, 63.221981048583984, 30.631439208984375, 143.84982299804688, 135.6817169189453, 36.98541259765625, 86.7318344116211, 23.71434783935547, 123.56898498535156, 189.2913818359375, -52.748680114746094, 32.32530975341797, -6.328792572021484, 102.17596435546875, 13.1397705078125, -115.59722137451172, 80.29109191894531, -10.211761474609375, 54.149654388427734, 143.4062957763672, -7.367332458496094, 18.01287841796875, 133.40530395507812, -2.1034393310546875, 0.2237873077392578, 175.43865966796875, 148.566650390625, 10.857990264892578, 149.2954559326172, -123.06583404541016, 143.7039794921875, 141.8977813720703, 154.8547821044922, -3.0255393981933594, 149.2386932373047, -18.84684181213379, -6.450675964355469, 10.813274383544922, 164.25277709960938, 6.007057189941406, 119.05681610107422, 16.432050704956055, 83.89383697509766, 124.72457122802734], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000355.npy"} +{"epoch": 0.5366591080876795, "step": 356, "batch_size": 64, "mean": 44.74551010131836, "std": 82.811279296875, "min": -155.526123046875, "p10": -57.8351104736328, "median": 34.12021827697754, "p90": 150.40841369628907, "max": 192.5756378173828, "pos_frac": 0.71875, "sample": [146.85614013671875, 157.53111267089844, 55.79937744140625, -84.90641784667969, 126.6531753540039, 16.753936767578125, 2.2912445068359375, 192.5756378173828, 80.66806030273438, 2.659648895263672, -106.11735534667969, -138.26275634765625, 78.76023864746094, -90.82880401611328, 145.8438720703125, 162.06039428710938, 12.388160705566406, 19.872692108154297, 136.22225952148438, -1.1769390106201172, 151.12277221679688, -155.526123046875, 152.51144409179688, 32.490966796875, 9.541252136230469, 155.0367889404297, -49.26224899291992, -38.92195129394531, 52.45548629760742, 32.65386962890625, 66.57218170166016, 2.9623794555664062, -10.368471145629883, 3.249134063720703, -60.713157653808594, 116.90196228027344, 126.1111068725586, -51.119667053222656, 63.3857421875, 120.47402954101562, 1.6536674499511719, 4.933502197265625, 146.05441284179688, -19.066177368164062, 43.41722106933594, 89.95362854003906, 98.43022155761719, 8.14404296875, -49.15819549560547, 72.644287109375, -1.6375923156738281, 93.34667205810547, 145.43185424804688, 148.7415771484375, -5.7318115234375, 104.92777252197266, 33.51828384399414, -22.90686798095703, 155.81829833984375, -11.382003784179688, -83.17523193359375, 148.36117553710938, 34.72215270996094, 91.47036743164062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000356.npy"} +{"epoch": 0.5381708238851096, "step": 357, "batch_size": 64, "mean": 38.04316711425781, "std": 70.36360931396484, "min": -141.17701721191406, "p10": -41.215333175659175, "median": 35.045127868652344, "p90": 135.28802337646485, "max": 173.1215362548828, "pos_frac": 0.75, "sample": [131.22654724121094, -2.3679332733154297, 126.0068588256836, -21.46783447265625, -135.462890625, 144.713134765625, 33.937744140625, 61.37361526489258, 29.167373657226562, 33.274749755859375, -13.13995361328125, 41.474815368652344, -42.165122985839844, 15.780826568603516, 153.7605743408203, 75.29647827148438, 133.46136474609375, 75.47514343261719, 81.08233642578125, 6.496212005615234, 84.24871063232422, 36.897369384765625, 53.92782211303711, 6.085908889770508, 23.53905487060547, 55.31267547607422, -5.264020919799805, 9.969635009765625, -58.8392333984375, 61.88132858276367, -66.03880310058594, 4.246465682983398, -28.858829498291016, 83.06597137451172, 64.9782485961914, 151.07522583007812, 136.0708770751953, 47.77125549316406, 106.50270080566406, 147.80770874023438, -21.438682556152344, 58.21781921386719, 13.433563232421875, 3.7736434936523438, 137.61065673828125, 40.634376525878906, 2.021392822265625, -16.64899444580078, -38.9991569519043, 36.15251159667969, 38.32661056518555, 173.1215362548828, 91.13170623779297, 23.94498062133789, 100.13118743896484, 27.600738525390625, 2.157480239868164, 3.1644058227539062, 127.07732391357422, -99.30105590820312, -96.63185119628906, -141.17701721191406, 129.15213012695312, -0.9966259002685547], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000357.npy"} +{"epoch": 0.5396825396825397, "step": 358, "batch_size": 64, "mean": 53.22576904296875, "std": 73.90312194824219, "min": -108.48838806152344, "p10": -32.573615264892574, "median": 33.73353958129883, "p90": 154.44116668701173, "max": 229.23663330078125, "pos_frac": 0.796875, "sample": [108.49752044677734, 69.97364807128906, 86.90487670898438, 155.20416259765625, -33.553749084472656, 160.50779724121094, 141.67535400390625, -36.11931610107422, -9.445804595947266, 17.473373413085938, -11.312358856201172, 100.77778625488281, 30.48987579345703, 98.95187377929688, 138.03176879882812, 40.89573669433594, -57.680450439453125, 4.6329498291015625, 103.33868408203125, 22.90658950805664, 19.620330810546875, 30.234127044677734, -19.65570831298828, 117.22147369384766, 134.85256958007812, 11.356758117675781, 13.634124755859375, 29.959457397460938, -30.286636352539062, 10.98892593383789, -68.41094207763672, 34.360801696777344, -81.4189453125, 5.285566329956055, -30.03931427001953, 52.99263000488281, 95.52891540527344, 42.11589050292969, 17.25843048095703, 0.09354972839355469, 156.39190673828125, 170.40106201171875, 229.23663330078125, 8.242565155029297, 189.71231079101562, 152.6608428955078, 100.04192352294922, -26.22634506225586, 33.10627746582031, 69.5, 0.4320716857910156, -52.20207214355469, -108.48838806152344, 138.805908203125, 3.81903076171875, 133.45948791503906, 26.81528091430664, 78.05277252197266, 19.2349853515625, 93.26473999023438, 108.10523223876953, 126.47533416748047, 52.280548095703125, 185.4846954345703], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000358.npy"} +{"epoch": 0.5411942554799698, "step": 359, "batch_size": 64, "mean": 27.08429718017578, "std": 67.56941223144531, "min": -110.96987915039062, "p10": -55.5496223449707, "median": 27.302234649658203, "p90": 125.20428543090821, "max": 186.96983337402344, "pos_frac": 0.671875, "sample": [-45.455810546875, 70.83277893066406, -22.762481689453125, 11.568405151367188, 51.354469299316406, 42.79022979736328, -27.133846282958984, 20.05115509033203, -52.182373046875, -79.6207275390625, 186.96983337402344, 57.141571044921875, 7.503387451171875, 30.408447265625, -4.778373718261719, 66.25384521484375, 137.77178955078125, -43.491432189941406, 0.8497848510742188, -94.76777648925781, 19.753658294677734, -17.001224517822266, 31.530609130859375, -57.86579895019531, 19.952392578125, 131.24517822265625, 60.32177734375, 28.457645416259766, 43.878387451171875, -92.20600891113281, 165.78668212890625, 159.59967041015625, -49.965667724609375, 121.18057250976562, 41.559112548828125, 26.563156127929688, 2.6904678344726562, 83.50691986083984, 35.84710693359375, 28.04131317138672, -56.99272918701172, 95.48941040039062, 126.9287338256836, 69.4638900756836, 15.881156921386719, 78.67221069335938, -41.31476593017578, -102.87124633789062, -40.235076904296875, 66.61447143554688, 30.262928009033203, -5.460353851318359, -110.96987915039062, -8.235483169555664, 82.56427764892578, -1.0246353149414062, 90.10768127441406, 12.439268112182617, 39.4525146484375, 113.94584655761719, 29.65627670288086, 148.91680908203125, 4.723056793212891, -0.798248291015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000359.npy"} +{"epoch": 0.5427059712773998, "step": 360, "batch_size": 64, "mean": 46.08378601074219, "std": 67.29199981689453, "min": -103.27854919433594, "p10": -32.85621643066405, "median": 32.12338447570801, "p90": 135.6813507080078, "max": 189.94384765625, "pos_frac": 0.734375, "sample": [4.555877685546875, 148.56881713867188, 13.26611328125, 26.817764282226562, 41.31719207763672, 87.91431427001953, -5.062038421630859, 34.46992874145508, 23.819828033447266, 132.30984497070312, -1.2014179229736328, -55.024627685546875, -5.5171966552734375, -65.89915466308594, 122.28993225097656, -43.90760803222656, 189.94384765625, -40.03818130493164, 1.8540153503417969, 126.80036926269531, 32.27919387817383, -3.3616294860839844, -41.12298583984375, 20.843521118164062, 4.94427490234375, 0.8180084228515625, 118.64646911621094, 8.230552673339844, 93.42667388916016, -1.1738739013671875, 44.157936096191406, 15.574958801269531, 86.83999633789062, -39.389190673828125, 31.967575073242188, 127.90496063232422, -17.61260986328125, 75.22643280029297, 137.12628173828125, 11.852294921875, 185.1983642578125, -6.7713775634765625, 114.70056915283203, -12.422918319702148, 188.36810302734375, 34.68456268310547, 141.65835571289062, 15.725875854492188, 37.71995162963867, 122.68218994140625, 113.17584991455078, 68.314453125, 156.4248504638672, -10.422449111938477, -8.559392929077148, 57.01371765136719, 0.04922676086425781, -103.27854919433594, 43.794349670410156, 112.53843688964844, 36.1219482421875, 5.191444396972656, 90.15860748291016, 122.83964538574219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000360.npy"} +{"epoch": 0.54421768707483, "step": 361, "batch_size": 64, "mean": 53.72078323364258, "std": 67.26924133300781, "min": -97.33767700195312, "p10": -20.744250106811524, "median": 49.11079788208008, "p90": 141.52383117675782, "max": 180.53790283203125, "pos_frac": 0.765625, "sample": [61.82402801513672, 89.39020538330078, 13.358654022216797, -11.307029724121094, 146.03204345703125, 62.211814880371094, -46.549625396728516, -97.33767700195312, 46.22047805786133, 45.46223831176758, 100.89602661132812, -50.73127365112305, -2.5097579956054688, 139.3050537109375, 100.77015686035156, 92.82804107666016, -20.846515655517578, 9.51877212524414, 51.74259948730469, 2.5129241943359375, 112.47607421875, 67.5885238647461, 15.603630065917969, 148.12060546875, 124.56571197509766, 129.3551788330078, 103.61296081542969, -93.79313659667969, 141.0306396484375, 106.97994995117188, 38.485965728759766, -2.1051788330078125, 115.19044494628906, 180.53790283203125, 127.54963684082031, 76.65548706054688, 141.73519897460938, 86.70972442626953, -58.42298889160156, -8.372413635253906, -1.8015460968017578, 6.156055450439453, 149.98878479003906, 139.0258331298828, 15.833660125732422, 148.7106170654297, 129.62396240234375, 15.365776062011719, -46.05481719970703, -18.6458740234375, 84.60479736328125, 23.32745361328125, 77.24807739257812, 18.623363494873047, 163.0220947265625, 18.196218490600586, 113.74319458007812, 6.232719421386719, 2.3212432861328125, 47.32969665527344, 50.89189910888672, 31.568693161010742, -2.9712677001953125, -20.505630493164062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000361.npy"} +{"epoch": 0.54572940287226, "step": 362, "batch_size": 64, "mean": 57.43996810913086, "std": 83.78388977050781, "min": -140.2513427734375, "p10": -30.69611892700195, "median": 45.22222900390625, "p90": 147.3018508911133, "max": 377.21417236328125, "pos_frac": 0.765625, "sample": [-28.406394958496094, 4.768720626831055, -2.9429473876953125, 1.7051525115966797, 0.8451461791992188, -140.2513427734375, 36.669654846191406, 75.67816162109375, 377.21417236328125, 120.28132629394531, 24.145469665527344, -9.324642181396484, 30.07598114013672, -3.689239501953125, -2.683135986328125, -4.599033355712891, 71.62785339355469, 74.40518188476562, 88.84573364257812, 162.70370483398438, -3.886594772338867, 36.547760009765625, 26.34956169128418, 81.68490600585938, 128.17213439941406, 7.058349609375, 116.98236846923828, 10.408660888671875, 4.086635589599609, 96.59092712402344, 225.5791015625, 5.601957321166992, -18.100120544433594, 142.74574279785156, 30.12812042236328, 167.90350341796875, 123.53678894042969, 18.307952880859375, 66.61263275146484, -31.67742919921875, 2.4733848571777344, 133.14212036132812, 144.71484375, 148.4105682373047, 31.575790405273438, 58.9625244140625, 106.8584213256836, 175.89979553222656, 110.67098999023438, 117.6917724609375, -37.564659118652344, 33.659881591796875, 138.98538208007812, -86.91712188720703, 53.774803161621094, 77.83589935302734, 142.48419189453125, -80.83551025390625, -52.90062713623047, 97.74241638183594, 178.0438232421875, -76.1778564453125, 72.7740478515625, 73.15045166015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000362.npy"} +{"epoch": 0.54724111866969, "step": 363, "batch_size": 64, "mean": 55.66880798339844, "std": 72.6978988647461, "min": -133.38763427734375, "p10": -13.811557197570801, "median": 40.03212928771973, "p90": 157.87615814208985, "max": 258.9974060058594, "pos_frac": 0.84375, "sample": [90.75395202636719, -97.16740417480469, 155.49151611328125, 57.96434783935547, 62.909881591796875, 39.303489685058594, 9.48245620727539, 169.7593231201172, 21.173324584960938, -38.5466194152832, -7.7754669189453125, 67.02017211914062, 258.9974060058594, 193.42526245117188, 10.524024963378906, 170.85964965820312, 40.402950286865234, 74.25397491455078, 26.65087890625, 135.1663360595703, 22.26205062866211, 90.628173828125, 14.142274856567383, 167.8970489501953, 146.27317810058594, 30.10643196105957, 5.35479736328125, 25.570289611816406, -13.790046691894531, 23.064735412597656, -13.820775985717773, -133.38763427734375, 69.71894073486328, -88.15971374511719, 80.4052734375, 72.64425659179688, 38.96771240234375, 104.32434844970703, 39.66130828857422, -2.5212631225585938, 14.278202056884766, 10.604606628417969, 37.96165466308594, 154.8042449951172, 9.368940353393555, 170.36788940429688, 102.87641906738281, 42.074981689453125, 144.03091430664062, 10.612380981445312, 127.09001922607422, 2.6101722717285156, 120.10757446289062, 75.33744812011719, -43.81294250488281, 64.81240844726562, 158.8981475830078, -22.072277069091797, 92.55940246582031, 31.871143341064453, 0.4617137908935547, 64.70339965820312, 56.37605285644531, 16.890398025512695], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000363.npy"} +{"epoch": 0.5487528344671202, "step": 364, "batch_size": 64, "mean": 60.426368713378906, "std": 86.24189758300781, "min": -145.85400390625, "p10": -30.04920196533203, "median": 55.96076202392578, "p90": 173.98097229003906, "max": 255.7533721923828, "pos_frac": 0.765625, "sample": [181.8035888671875, -5.4836883544921875, 18.197479248046875, 164.84884643554688, 177.821044921875, 13.352989196777344, 69.22418975830078, 110.29838562011719, -19.45873260498047, 183.833740234375, 203.17503356933594, 99.21520233154297, -9.107990264892578, -60.625694274902344, 109.3787841796875, 150.1005401611328, 45.87073516845703, -17.33646011352539, 255.7533721923828, 1.7232666015625, 165.44049072265625, 45.887413024902344, 101.29901123046875, 145.97947692871094, -107.69529724121094, -46.29924774169922, 170.89700317382812, 0.03149604797363281, 1.284921646118164, 102.79852294921875, 147.04962158203125, 66.03411102294922, -8.995471954345703, 72.16492462158203, 28.032669067382812, 1.6583709716796875, 117.60386657714844, 175.30267333984375, -29.285072326660156, 23.81255531311035, 101.43949127197266, 74.6091537475586, -30.376686096191406, -73.01408386230469, 210.26559448242188, 11.162052154541016, 4.302032470703125, 138.30224609375, 7.279449462890625, 125.09996032714844, 4.7310791015625, 123.4366226196289, -94.94589233398438, 68.52779388427734, -145.85400390625, 11.831130981445312, 85.5918197631836, 119.69992065429688, -0.8388233184814453, 12.28173828125, 0.4710426330566406, -23.147438049316406, 150.71697998046875, 140.12960815429688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000364.npy"} +{"epoch": 0.5502645502645502, "step": 365, "batch_size": 64, "mean": 56.61901092529297, "std": 65.39251708984375, "min": -88.48480224609375, "p10": -7.25778770446777, "median": 52.307743072509766, "p90": 138.67686004638674, "max": 277.08673095703125, "pos_frac": 0.84375, "sample": [38.65155792236328, 18.999780654907227, 90.8612060546875, 0.885284423828125, 45.90681457519531, 2.0598716735839844, 134.29104614257812, 114.55793762207031, 116.47383117675781, 90.92996215820312, 119.97908020019531, 53.616172790527344, -88.48480224609375, 1.9606590270996094, 24.122940063476562, 128.93797302246094, -2.8826065063476562, 2.699840545654297, -8.811592102050781, 0.13321685791015625, 70.47219848632812, 96.7396011352539, 116.69495391845703, 3.5657215118408203, -1.3682270050048828, -70.02525329589844, 56.564292907714844, 156.45738220214844, 36.54340362548828, 91.09114074707031, 5.5735015869140625, 10.636674880981445, 140.69473266601562, 43.66415023803711, 127.11933898925781, 76.81782531738281, 139.07498168945312, -3.632244110107422, 55.43056106567383, 66.40726470947266, 150.3000946044922, 65.8216552734375, 50.99931335449219, -22.1129150390625, 99.06367492675781, 137.74790954589844, 5.95942497253418, -18.307729721069336, 277.08673095703125, 44.051849365234375, 82.0726089477539, 2.473997116088867, 130.40945434570312, 6.909515380859375, 0.046169281005859375, 58.6138916015625, 6.9239959716796875, -37.566951751708984, 68.81217956542969, 4.245384216308594, 155.95875549316406, 147.42514038085938, -9.94256591796875, 113.21498107910156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000365.npy"} +{"epoch": 0.5517762660619804, "step": 366, "batch_size": 64, "mean": 48.10562515258789, "std": 80.54195404052734, "min": -130.17758178710938, "p10": -62.62295379638671, "median": 47.94317817687988, "p90": 146.92462768554688, "max": 211.2564239501953, "pos_frac": 0.71875, "sample": [3.441478729248047, 159.15646362304688, 99.72440338134766, 51.09955978393555, -10.406570434570312, 134.94371032714844, -71.81912231445312, -18.687795639038086, -21.283538818359375, -10.089454650878906, -53.01325988769531, 106.45818328857422, 16.038841247558594, 79.85043334960938, 87.18167114257812, 43.62774658203125, -66.74139404296875, 69.0643310546875, 2.8378429412841797, 95.3896255493164, 78.52066040039062, 50.57404327392578, 52.267547607421875, -8.912960052490234, 26.407270431518555, 107.88884735107422, 47.24942398071289, 148.173828125, -130.17758178710938, -18.57712745666504, 183.78964233398438, 4.413368225097656, -3.486879348754883, 211.2564239501953, -76.79401397705078, 2.8605709075927734, -47.29753112792969, -82.36227416992188, 18.18850326538086, 42.56346130371094, 4.728923797607422, -29.17660903930664, 6.282224655151367, 48.636932373046875, -70.24661254882812, 13.666572570800781, 11.533391952514648, 205.49156188964844, 172.73974609375, 54.15782165527344, 51.802215576171875, 140.36109924316406, 122.28645324707031, -108.24478149414062, 143.63314819335938, -25.456754684448242, 142.24462890625, 130.2882843017578, 163.69869995117188, 120.47511291503906, 141.38307189941406, 87.18926239013672, 144.00982666015625, 103.95745849609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000366.npy"} +{"epoch": 0.5532879818594104, "step": 367, "batch_size": 64, "mean": 45.722740173339844, "std": 68.87721252441406, "min": -148.966064453125, "p10": -36.66516265869141, "median": 35.816246032714844, "p90": 136.2424072265625, "max": 161.97857666015625, "pos_frac": 0.796875, "sample": [3.619304656982422, 161.97857666015625, 66.2640151977539, -11.600982666015625, 71.91195678710938, -2.4122314453125, 132.98025512695312, 134.22332763671875, 71.16868591308594, 3.9339256286621094, 24.292861938476562, 8.0233154296875, 9.624092102050781, 25.087493896484375, 142.21231079101562, 13.999706268310547, 71.13215637207031, -5.951408386230469, -36.72633361816406, 123.15967559814453, 15.098220825195312, 62.38124084472656, -12.895421981811523, -40.734405517578125, 91.1842041015625, -147.9629364013672, -54.19158935546875, 108.24779510498047, 13.647563934326172, 29.539825439453125, 120.35238647460938, 115.22209167480469, 92.25019836425781, 84.3197021484375, 98.80455780029297, 5.941108703613281, 34.075927734375, -62.14747619628906, 12.415815353393555, 139.7790985107422, 32.1241455078125, -148.966064453125, 11.774103164672852, 158.28639221191406, 103.85201263427734, -36.522430419921875, 72.10044860839844, 19.629344940185547, 103.48780822753906, 21.315196990966797, 35.90367126464844, 50.682861328125, -88.01725006103516, 122.92296600341797, 71.17636108398438, 141.42318725585938, 35.72882080078125, -18.60854148864746, 93.6246337890625, 142.1785430908203, 21.921417236328125, 66.70046997070312, 64.18107604980469, 137.10772705078125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000367.npy"} +{"epoch": 0.5547996976568406, "step": 368, "batch_size": 64, "mean": 42.043800354003906, "std": 70.29700469970703, "min": -145.95094299316406, "p10": -44.376702880859376, "median": 34.29493713378906, "p90": 135.83025360107425, "max": 166.0392608642578, "pos_frac": 0.734375, "sample": [-145.95094299316406, 102.595458984375, 6.111839294433594, 14.203073501586914, 76.45220947265625, 103.66138458251953, 130.97145080566406, 45.024085998535156, -21.39545440673828, -20.2244873046875, 146.7576446533203, 6.893512725830078, 29.512359619140625, 35.05628967285156, 154.36514282226562, 115.58761596679688, -26.852386474609375, -51.66352844238281, -59.751800537109375, 115.69855499267578, 33.53358459472656, 28.10365104675293, 62.95130157470703, -36.79175567626953, 147.36227416992188, 23.87480926513672, -40.81037902832031, 139.75523376464844, 166.0392608642578, 50.95498275756836, -19.801206588745117, 155.87203979492188, 71.8666000366211, 1.6266136169433594, 13.189334869384766, 102.32536315917969, 32.32273864746094, 91.74839782714844, 16.67516326904297, 92.42140197753906, 45.83042907714844, -3.069234848022461, 110.00912475585938, 22.4769287109375, -43.86541748046875, -20.631996154785156, 33.28361129760742, -17.834503173828125, 137.91259765625, -51.71080017089844, 64.67066955566406, 126.94387817382812, 116.0618896484375, 117.22539520263672, 8.564912796020508, 80.73744201660156, 47.64545440673828, -44.5958251953125, -101.27617645263672, 71.44999694824219, 98.75460815429688, 30.480073928833008, -100.3304443359375, 71.79925537109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000368.npy"} +{"epoch": 0.5563114134542706, "step": 369, "batch_size": 64, "mean": 38.35271453857422, "std": 70.02681732177734, "min": -126.61248779296875, "p10": -32.612778854370106, "median": 29.35350799560547, "p90": 140.21044311523437, "max": 217.6778564453125, "pos_frac": 0.734375, "sample": [30.113853454589844, -81.2216567993164, 47.52391815185547, 77.3621826171875, -89.73123168945312, 64.96762084960938, 39.38564682006836, -0.8904800415039062, 147.7602996826172, 26.75014877319336, 19.941680908203125, 113.74380493164062, 117.40266418457031, 100.27953338623047, 147.62387084960938, 4.42987060546875, 62.073585510253906, 55.74250793457031, 19.55876922607422, 27.147640228271484, 11.907440185546875, -126.61248779296875, 41.47877502441406, -76.86297607421875, 41.83636474609375, 81.66795349121094, -25.106868743896484, 69.8865966796875, 55.65401840209961, -24.97200584411621, 111.57379150390625, -10.017364501953125, 38.18883514404297, 143.70999145507812, 76.6817398071289, 137.6907501220703, 163.1776123046875, 2.5012359619140625, 17.133636474609375, -83.92537689208984, -17.267669677734375, 28.593162536621094, -13.701091766357422, 67.95543670654297, -4.049694061279297, 36.400184631347656, 217.6778564453125, 5.4051971435546875, 140.973388671875, -18.286842346191406, -11.529579162597656, 26.032821655273438, 1.0405387878417969, 138.43023681640625, 1.8581314086914062, -12.217988967895508, 3.4085330963134766, 161.99844360351562, 18.76160430908203, 44.949432373046875, -35.82959747314453, 51.97479248046875, -88.9515380859375, 135.39224243164062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000369.npy"} +{"epoch": 0.5578231292517006, "step": 370, "batch_size": 64, "mean": 55.01481628417969, "std": 80.53404235839844, "min": -176.93946838378906, "p10": -34.110466003417955, "median": 45.84370803833008, "p90": 160.66396789550782, "max": 197.02972412109375, "pos_frac": 0.75, "sample": [60.731201171875, 162.33441162109375, 108.0088882446289, 39.74980926513672, 197.02972412109375, 5.934112548828125, 170.9571533203125, -4.159637451171875, 156.2528076171875, 15.836688995361328, 15.692535400390625, 51.027862548828125, 1.6941909790039062, 140.34762573242188, 183.97093200683594, 100.67434692382812, 78.57041931152344, -81.23859405517578, -21.909866333007812, 81.509765625, 67.6973876953125, 87.25331115722656, 75.93656921386719, 72.6964111328125, 155.5754852294922, 78.20526123046875, 81.89308166503906, 26.60776138305664, -2.638153076171875, -4.9175262451171875, -2.0868682861328125, -4.324607849121094, -13.086784362792969, -80.70175170898438, 12.494293212890625, 69.0224380493164, 179.7515869140625, 38.517242431640625, 150.5524444580078, 134.8739471435547, 176.41845703125, -176.93946838378906, 39.50117492675781, 89.05488586425781, 16.81435203552246, 163.06121826171875, 101.23194885253906, 116.41001892089844, 132.3409881591797, 156.76626586914062, -154.23968505859375, 9.61895751953125, 147.05767822265625, -3.8719043731689453, -39.33929443359375, 26.66839599609375, 29.848388671875, -0.9854278564453125, -64.08260345458984, 2.9771251678466797, 34.47998809814453, 130.87564086914062, -39.71419906616211, 40.65955352783203], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000370.npy"} +{"epoch": 0.5593348450491308, "step": 371, "batch_size": 64, "mean": 49.89393615722656, "std": 71.07530975341797, "min": -75.18950653076172, "p10": -48.97417411804199, "median": 48.0980224609375, "p90": 147.18679809570315, "max": 195.23037719726562, "pos_frac": 0.734375, "sample": [138.6936798095703, -75.18950653076172, 172.30758666992188, 65.25215911865234, 81.55332946777344, 9.06243896484375, 114.03749084472656, 16.50663185119629, -9.247581481933594, 11.973752975463867, -7.66094970703125, 101.76778411865234, -60.18596267700195, 165.63194274902344, 4.721385955810547, 192.3341064453125, -2.344545364379883, 99.98535919189453, 17.028366088867188, 150.8267059326172, 53.46549987792969, -73.42924499511719, -5.570863723754883, 9.172279357910156, 41.16389465332031, 119.78874206542969, 107.00057983398438, 195.23037719726562, 109.34898376464844, 75.77899169921875, 131.052001953125, 157.88619995117188, -51.81035614013672, 4.317474365234375, 81.29823303222656, 34.834625244140625, -12.919143676757812, -63.391258239746094, -24.330245971679688, 160.0243682861328, -57.42976379394531, 29.066333770751953, 8.288564682006836, 66.35655212402344, 61.07691955566406, -30.035560607910156, 86.26838684082031, 82.72281646728516, -50.576148986816406, 42.73054504394531, 103.07508087158203, -18.086830139160156, 5.934329986572266, 92.30897521972656, 115.78884887695312, 1.759521484375, 99.40108489990234, 29.931617736816406, 91.76206970214844, 69.64398956298828, 130.95123291015625, 85.58428192138672, -44.039894104003906, -45.23623275756836], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000371.npy"} +{"epoch": 0.5608465608465608, "step": 372, "batch_size": 64, "mean": 29.362394332885742, "std": 84.52034759521484, "min": -147.4298095703125, "p10": -79.68051071166991, "median": 18.93576717376709, "p90": 153.42777099609378, "max": 184.77157592773438, "pos_frac": 0.671875, "sample": [-34.64643859863281, 22.986087799072266, 131.750244140625, 87.2086181640625, 79.29364013671875, 66.82630157470703, 161.4140167236328, -38.913124084472656, 127.64739227294922, 126.22772979736328, 176.61663818359375, -6.8550872802734375, 96.92448425292969, 184.77157592773438, 57.05137634277344, 87.46707153320312, 105.0718994140625, -138.92013549804688, 10.822288513183594, 24.216697692871094, 10.310382843017578, -4.550260543823242, 22.114837646484375, 146.85018920898438, 5.848194122314453, -18.681983947753906, -96.69660949707031, -4.3307037353515625, 163.6120147705078, -73.1412582397461, 82.31629180908203, 35.1552734375, -33.068721771240234, -5.275539398193359, -82.48304748535156, 17.43390464782715, -147.4298095703125, 12.861312866210938, 119.76114654541016, 25.077184677124023, 176.76797485351562, 64.71559143066406, 125.70980834960938, 42.08453369140625, -53.33338928222656, 59.46998596191406, -142.79232788085938, 2.4126205444335938, 2.4324893951416016, 20.43762969970703, 4.6320343017578125, -137.84133911132812, 89.3565673828125, 4.121437072753906, -25.8631534576416, -43.70661926269531, -114.58766174316406, 61.22570037841797, 156.24673461914062, 157.52098083496094, -65.47802734375, -27.199432373046875, 3.1792373657226562, 17.037818908691406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000372.npy"} +{"epoch": 0.562358276643991, "step": 373, "batch_size": 64, "mean": 39.78559494018555, "std": 84.01707458496094, "min": -146.3348388671875, "p10": -78.5537971496582, "median": 35.96095657348633, "p90": 148.34815368652343, "max": 198.8687286376953, "pos_frac": 0.65625, "sample": [-116.04158020019531, 135.64259338378906, 124.50553894042969, 149.02407836914062, 130.02618408203125, -108.1935806274414, -24.44031524658203, 120.92153930664062, 93.2169418334961, 39.22926330566406, 105.53567504882812, -118.48479461669922, 28.737075805664062, -40.98518371582031, -84.21556091308594, -23.561908721923828, 42.93756103515625, 78.8405532836914, -146.3348388671875, -42.49693298339844, 63.37239456176758, -13.016731262207031, 80.00785064697266, -76.33527374267578, 139.42636108398438, 141.38925170898438, -19.096328735351562, -0.6445159912109375, 82.9353256225586, 101.99405670166016, 157.82489013671875, -0.3429107666015625, 29.71194076538086, 146.77099609375, -74.37865447998047, -0.9193000793457031, 14.749267578125, 100.91574096679688, -0.8731613159179688, 134.57046508789062, 96.23930358886719, -53.381744384765625, -88.82563781738281, -31.27908706665039, 30.520126342773438, 110.90568542480469, -79.50459289550781, 151.7015838623047, 20.51110076904297, 51.090484619140625, -23.054489135742188, 161.4892120361328, 4.255367279052734, 191.63534545898438, 33.015281677246094, 40.17525863647461, 59.24345016479492, 74.09162902832031, 25.11377716064453, 198.8687286376953, 38.90663146972656, 3.807506561279297, 23.724143981933594, 155.10507202148438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000373.npy"} +{"epoch": 0.563869992441421, "step": 374, "batch_size": 64, "mean": 65.10909271240234, "std": 76.45340728759766, "min": -140.3079376220703, "p10": -7.364636230468749, "median": 57.98932456970215, "p90": 162.7034912109375, "max": 257.2420349121094, "pos_frac": 0.84375, "sample": [257.2420349121094, 138.8468780517578, 118.06507873535156, -7.757942199707031, 35.5300178527832, 123.08885955810547, 164.9349822998047, 160.8919677734375, 163.4798583984375, 66.23214721679688, 76.98860168457031, 14.467269897460938, 98.36116027832031, 197.89602661132812, 75.02095794677734, 35.1485595703125, 135.65692138671875, 5.9617767333984375, 21.069992065429688, 60.081520080566406, 15.250007629394531, 119.42001342773438, 36.8281364440918, -101.59893798828125, 87.54081726074219, 81.0406723022461, 52.984676361083984, 146.2230224609375, -6.446922302246094, 102.36398315429688, 56.34983825683594, 82.0252685546875, 1.6566085815429688, 12.359611511230469, 77.594482421875, 59.62881088256836, 15.6346435546875, -140.3079376220703, 181.74099731445312, 87.54728698730469, 40.630550384521484, -98.40675354003906, 28.244909286499023, 197.92530822753906, 184.8165283203125, 41.74895477294922, -89.261474609375, -1.1065673828125, 48.71186828613281, 53.58118438720703, 124.54473876953125, 113.53282928466797, 147.32530212402344, 50.625335693359375, 15.992557525634766, 2.8992977142333984, 53.95641326904297, 93.24295043945312, 125.55364990234375, 142.22340393066406, -47.457374572753906, -15.440841674804688, 46.692657470703125, -2.6355133056640625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000374.npy"} +{"epoch": 0.5653817082388511, "step": 375, "batch_size": 64, "mean": 46.15903091430664, "std": 78.95697784423828, "min": -150.6210479736328, "p10": -62.58892135620116, "median": 40.28340148925781, "p90": 144.13934783935548, "max": 222.03854370117188, "pos_frac": 0.703125, "sample": [-66.16230010986328, -70.23404693603516, 55.776466369628906, 98.33547973632812, 96.16927337646484, 17.70778465270996, 175.66937255859375, -4.001224517822266, 20.176605224609375, 86.01800537109375, -23.22437286376953, 123.78248596191406, -32.21209716796875, 144.91209411621094, 6.686092376708984, -5.1250762939453125, 34.39079284667969, -75.4437255859375, 95.52115631103516, -5.640041351318359, 46.17601013183594, 155.36886596679688, 150.08407592773438, -85.63009643554688, 112.11327362060547, 142.33627319335938, 3.5308456420898438, -54.25103759765625, 50.50335693359375, 134.23170471191406, 10.979331970214844, 0.1673564910888672, 9.160150527954102, -49.837791442871094, 52.82403564453125, 74.27091979980469, 81.28726959228516, 32.05226135253906, 163.82911682128906, 88.67487335205078, 136.76492309570312, 52.29442596435547, 121.07499694824219, -150.6210479736328, -21.678878784179688, 29.080810546875, 170.95468139648438, 5.151214599609375, 222.03854370117188, 85.17524719238281, 138.1360321044922, 91.5782470703125, -3.2980575561523438, 122.04544067382812, -25.088611602783203, 22.91240692138672, 94.22869110107422, -90.21212768554688, -28.655906677246094, 140.04959106445312, -10.735984802246094, 113.93286895751953, 18.00598907470703, -69.92874145507812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000375.npy"} +{"epoch": 0.5668934240362812, "step": 376, "batch_size": 64, "mean": 59.58985900878906, "std": 86.45333862304688, "min": -123.83079528808594, "p10": -50.91130180358886, "median": 52.9393196105957, "p90": 163.71029663085938, "max": 285.9309997558594, "pos_frac": 0.703125, "sample": [44.496826171875, -3.390411376953125, -0.3741016387939453, 36.804046630859375, 5.601112365722656, -17.053905487060547, -3.6592941284179688, 122.98396301269531, -9.31146240234375, 47.280548095703125, 86.65390014648438, 95.54971313476562, -123.83079528808594, -2.4505844116210938, -82.16358947753906, 8.806098937988281, 175.862060546875, 59.35673522949219, 1.8710670471191406, 285.9309997558594, 59.12705993652344, 177.07373046875, 7.1773681640625, 137.93606567382812, 199.42384338378906, -6.186248779296875, 131.55953979492188, 140.65847778320312, 132.601806640625, 99.2928695678711, 128.93260192871094, 53.774559020996094, 153.5194091796875, 52.10408020019531, 71.34180450439453, 164.18637084960938, 215.91690063476562, -47.97895431518555, 161.29632568359375, -64.94477844238281, 56.82427215576172, -70.16588592529297, 149.67752075195312, 115.14894104003906, 100.5582504272461, 204.50027465820312, -52.16802215576172, 110.50398254394531, -30.00250244140625, 134.3602752685547, -74.05132293701172, 16.33642578125, 21.75640869140625, 31.109149932861328, 162.59945678710938, -4.817102432250977, 115.06437683105469, -11.724849700927734, 151.6204376220703, 84.05026245117188, -26.239593505859375, 13.503904342651367, 0.7698001861572266, -81.23916625976562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000376.npy"} +{"epoch": 0.5684051398337112, "step": 377, "batch_size": 64, "mean": 41.28596878051758, "std": 72.21913146972656, "min": -133.27577209472656, "p10": -45.0967315673828, "median": 34.7324161529541, "p90": 136.93267669677735, "max": 189.91152954101562, "pos_frac": 0.671875, "sample": [102.55882263183594, -30.478431701660156, 110.5652084350586, 110.77003479003906, 67.68138122558594, -1.7339706420898438, -99.8166275024414, -77.35671997070312, 54.12555694580078, 27.593727111816406, 152.80859375, 6.460624694824219, 111.95885467529297, -2.1363525390625, 127.66866302490234, 117.69922637939453, -86.8256607055664, 77.27616119384766, -62.16759490966797, -6.355621337890625, 153.2942352294922, -5.493133544921875, 73.58740234375, 31.55377197265625, 91.44303894042969, -125.90342712402344, 23.245445251464844, 189.91152954101562, 31.855220794677734, -13.405195236206055, 122.9696044921875, -10.214513778686523, 107.21139526367188, 1.3357810974121094, -5.936859130859375, -51.361717224121094, 52.091888427734375, 37.60961151123047, 145.7682647705078, 29.487930297851562, -3.4117507934570312, 82.91991424560547, 8.910768508911133, 76.36321258544922, 55.74873352050781, 159.577392578125, 50.70521926879883, -8.595142364501953, -14.897201538085938, 43.743865966796875, 133.07958984375, 25.3848876953125, -15.900934219360352, 152.47158813476562, 3.6143646240234375, -16.72930335998535, 138.58399963378906, 82.48259735107422, -133.27577209472656, 13.289039611816406, 79.95002746582031, -11.429328918457031, 80.29637145996094, 80.07377624511719], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000377.npy"} +{"epoch": 0.5699168556311414, "step": 378, "batch_size": 64, "mean": 39.404930114746094, "std": 70.80685424804688, "min": -136.4167022705078, "p10": -19.95389537811279, "median": 19.374088287353516, "p90": 137.91530914306642, "max": 195.7667236328125, "pos_frac": 0.71875, "sample": [106.98956298828125, 65.34778594970703, 4.325628280639648, 18.29755401611328, 83.88208770751953, 126.49610137939453, -52.40119934082031, 9.40036392211914, 56.44218444824219, 130.34866333007812, -136.4167022705078, 3.806356430053711, 195.7667236328125, -4.037708282470703, 141.1581573486328, 87.2426986694336, 52.39317321777344, 6.336116790771484, 150.693359375, -6.259243011474609, 70.05616760253906, 9.586196899414062, 8.03774642944336, 48.75109100341797, 145.41990661621094, 11.021720886230469, 51.410118103027344, 43.37713623046875, -75.18684387207031, 12.396015167236328, 87.220458984375, 31.371376037597656, -67.41787719726562, -6.072202682495117, 111.17050170898438, 20.45062255859375, -21.2664794921875, 10.270164489746094, 114.54882049560547, -6.29771614074707, 183.16957092285156, 79.05448913574219, -0.048187255859375, 128.1142578125, 28.5179443359375, 113.94024658203125, -4.009258270263672, 151.0348663330078, 64.64443969726562, 9.349287033081055, 7.286281585693359, -10.276779174804688, 8.19528579711914, -103.23881530761719, -14.170398712158203, 84.59101867675781, -16.891199111938477, 100.73452758789062, 1.194082260131836, 47.864646911621094, -12.23183822631836, -119.31025695800781, -8.156007766723633, 163.89865112304688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000378.npy"} +{"epoch": 0.5714285714285714, "step": 379, "batch_size": 64, "mean": 54.581939697265625, "std": 75.9372787475586, "min": -102.73468780517578, "p10": -28.849578475952146, "median": 40.515451431274414, "p90": 153.2279769897461, "max": 235.74932861328125, "pos_frac": 0.8125, "sample": [75.71226501464844, -2.127166748046875, 136.2812042236328, -2.9761886596679688, 26.01873779296875, 72.21963500976562, 45.24433135986328, -102.73468780517578, 49.43326187133789, 11.610359191894531, 19.773056030273438, 41.028289794921875, -73.59190368652344, 101.37681579589844, 9.100013732910156, 235.74932861328125, 24.31787109375, -29.880962371826172, 124.7104721069336, 152.18380737304688, 232.16400146484375, 112.09844970703125, 153.6443634033203, 107.45777130126953, 69.95260620117188, -79.60040283203125, 92.6786117553711, -70.22076416015625, 44.816993713378906, -44.98272705078125, 214.196533203125, 45.41925811767578, 5.373600006103516, 40.00261306762695, -87.44345092773438, 152.25640869140625, 142.57907104492188, 18.941978454589844, 24.561996459960938, -14.148876190185547, -26.443016052246094, 12.742927551269531, 59.88066864013672, 161.11618041992188, 146.4459228515625, 14.33243179321289, 160.5745391845703, 192.76956176757812, 3.335681915283203, 12.504165649414062, 105.41413879394531, 14.459808349609375, 27.3411865234375, 59.72930908203125, 106.89530181884766, 1.7962722778320312, 33.30876159667969, 73.05529022216797, 35.187931060791016, 6.305696487426758, 89.26848602294922, 37.36863708496094, 95.2935791015625, -2.635711669921875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000379.npy"} +{"epoch": 0.5729402872260015, "step": 380, "batch_size": 64, "mean": 63.36537170410156, "std": 78.2848129272461, "min": -147.40042114257812, "p10": -29.24803066253662, "median": 64.26558303833008, "p90": 154.15269775390624, "max": 204.59494018554688, "pos_frac": 0.796875, "sample": [34.59969711303711, 137.9331512451172, 62.053314208984375, 40.69990539550781, -43.13047790527344, -88.6811294555664, 148.3554229736328, 183.68267822265625, -7.957881927490234, 128.29061889648438, 106.53445434570312, 26.048503875732422, -3.1196250915527344, 69.31704711914062, -4.420711517333984, -41.250091552734375, 0.3200340270996094, 58.89434814453125, 129.78302001953125, 151.49693298339844, 89.19851684570312, 60.990501403808594, -12.091743469238281, -147.40042114257812, 142.67123413085938, 5.871421813964844, 115.02452850341797, 66.47785186767578, -27.84092903137207, 30.04512596130371, 114.75112915039062, 161.56887817382812, 70.43343353271484, 36.13765335083008, 204.59494018554688, 10.73013687133789, 153.51913452148438, 113.00780487060547, 29.848617553710938, 7.781715393066406, 137.54946899414062, -122.91244506835938, 147.67037963867188, 157.406982421875, 51.534873962402344, 111.83270263671875, -20.477088928222656, 93.86920166015625, -29.85107421875, 121.28489685058594, 19.905555725097656, 5.213781356811523, -63.91473388671875, 182.3865966796875, 144.9381866455078, 132.76193237304688, 8.872613906860352, 181.26959228515625, 114.6530532836914, 154.42422485351562, 72.08300018310547, 90.56924438476562, 23.01271629333496, 26.531524658203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000380.npy"} +{"epoch": 0.5744520030234316, "step": 381, "batch_size": 64, "mean": 25.174501419067383, "std": 79.18864440917969, "min": -189.71800231933594, "p10": -56.58800354003906, "median": 11.879356384277344, "p90": 145.3991256713867, "max": 254.90692138671875, "pos_frac": 0.640625, "sample": [20.92889404296875, 11.396804809570312, -0.4535064697265625, -83.08895874023438, -189.71800231933594, 9.616405487060547, 3.3701858520507812, 22.204185485839844, 166.31991577148438, 75.72798156738281, 4.747001647949219, -5.626209259033203, 9.152626037597656, 30.970584869384766, 1.855642318725586, 254.90692138671875, 91.46588134765625, -0.6903953552246094, 52.75559997558594, -4.560356140136719, 22.976545333862305, -56.090721130371094, 10.094549179077148, 175.9116973876953, -85.91271209716797, 82.1383285522461, -48.373565673828125, -56.801124572753906, 91.551513671875, -3.6968746185302734, 59.56096649169922, 124.39790344238281, 16.633682250976562, 20.962921142578125, -4.134059906005859, 154.18089294433594, 21.172504425048828, -24.258831024169922, -110.23902893066406, 12.361907958984375, 144.02346801757812, -29.622604370117188, 7.695533752441406, 14.032011032104492, 39.521392822265625, 163.96527099609375, 90.13230895996094, 68.8934097290039, -3.182706832885742, 13.593490600585938, 6.524566650390625, 104.72767639160156, 145.9886932373047, -23.010665893554688, 27.180583953857422, -8.35833740234375, 101.60395812988281, -170.76455688476562, -59.618019104003906, 36.92802429199219, -1.937774658203125, -43.09258270263672, -38.48480987548828, 150.71202087402344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000381.npy"} +{"epoch": 0.5759637188208617, "step": 382, "batch_size": 64, "mean": 43.21149826049805, "std": 65.82597351074219, "min": -135.65391540527344, "p10": -27.14516792297363, "median": 35.28655242919922, "p90": 133.49981079101565, "max": 199.28677368164062, "pos_frac": 0.734375, "sample": [-24.60693359375, -6.922445297241211, 191.41049194335938, 47.004974365234375, 160.98155212402344, -21.658950805664062, 85.95982360839844, 23.796707153320312, 129.1441650390625, 71.88017272949219, 56.72361755371094, -19.478561401367188, -17.351806640625, 38.856048583984375, 127.80532836914062, 33.152801513671875, -34.36268615722656, 6.6707763671875, -135.65391540527344, 110.55210876464844, -1.9123058319091797, 38.30760192871094, 23.179916381835938, 4.419364929199219, -28.490280151367188, 6.133270263671875, 72.62299346923828, 43.14772033691406, -68.22956085205078, 162.82794189453125, 63.22553253173828, 25.937274932861328, -56.525630950927734, -47.000892639160156, 150.63504028320312, -3.8664016723632812, -28.232982635498047, 4.7194671630859375, 37.42030334472656, 135.36651611328125, 61.312103271484375, 199.28677368164062, 3.4341583251953125, 32.76847839355469, 25.30951690673828, 84.79082489013672, -16.363086700439453, -2.0821380615234375, 27.59906005859375, 61.11078643798828, 74.6495361328125, 98.58732604980469, -20.017261505126953, 45.29804611206055, 111.31875610351562, 1.8094139099121094, 67.0902099609375, 27.105297088623047, 128.38937377929688, 159.37741088867188, 91.35353088378906, 77.80357360839844, 54.09431838989258, 13.921806335449219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000382.npy"} +{"epoch": 0.5774754346182918, "step": 383, "batch_size": 64, "mean": 45.22222137451172, "std": 83.16886901855469, "min": -150.53793334960938, "p10": -61.98408126831053, "median": 31.335659980773926, "p90": 156.4988739013672, "max": 212.95907592773438, "pos_frac": 0.703125, "sample": [-2.575704574584961, 130.12522888183594, 102.44033813476562, 18.824310302734375, 28.12792205810547, -42.07835388183594, 100.31260681152344, 49.47386932373047, 8.786506652832031, -70.70368194580078, 4.480762481689453, -70.78887939453125, 62.779537200927734, 67.25216674804688, 100.25028228759766, 48.56982421875, 135.86935424804688, -66.85918426513672, 170.94920349121094, 122.419189453125, 46.55656433105469, -16.2518310546875, 164.01380920410156, -49.69989013671875, 147.7154998779297, 17.637115478515625, 37.413604736328125, -20.150253295898438, 29.51902198791504, 212.95907592773438, 127.66907501220703, -46.1998291015625, -32.528831481933594, 187.75152587890625, -13.681888580322266, 84.56285095214844, 117.68985748291016, -150.53793334960938, 10.767913818359375, 46.351043701171875, -91.49642181396484, 22.742782592773438, 33.15229797363281, 20.223405838012695, 157.78558349609375, -69.97586059570312, 27.62396240234375, 51.06141662597656, -50.60884094238281, 207.969970703125, 22.241689682006836, 174.45367431640625, 93.92322540283203, 16.37530517578125, -8.653373718261719, 150.88641357421875, 119.28573608398438, 28.289031982421875, -16.11676788330078, -107.78715515136719, 143.67205810546875, -47.87396240234375, 153.49655151367188, 64.33946228027344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000383.npy"} +{"epoch": 0.5789871504157218, "step": 384, "batch_size": 64, "mean": 47.909156799316406, "std": 67.44278717041016, "min": -170.97140502929688, "p10": -28.597258377075185, "median": 49.895423889160156, "p90": 147.8977920532227, "max": 176.37686157226562, "pos_frac": 0.828125, "sample": [-44.494659423828125, 139.75308227539062, 49.545562744140625, 95.44064331054688, 11.709125518798828, 70.3089828491211, 92.8711929321289, 51.82306671142578, 155.34619140625, -19.221660614013672, 41.716522216796875, 81.93232727050781, 50.24528503417969, 8.966865539550781, -11.040870666503906, 21.372604370117188, 10.559501647949219, 176.37686157226562, 8.67987060546875, 151.3883819580078, -2.8735580444335938, 66.32318115234375, 18.408729553222656, -32.61537170410156, -70.627197265625, 74.98863983154297, 175.94082641601562, 68.16805267333984, -96.97140502929688, 98.85615539550781, 158.64410400390625, 108.74639892578125, 4.449474334716797, 56.81993103027344, 68.10704040527344, 8.32611083984375, 164.65847778320312, 26.51131820678711, -170.97140502929688, 127.8639907836914, 46.436676025390625, 74.16256713867188, 96.24376678466797, -43.12427520751953, 165.01312255859375, 68.90411376953125, 55.7064094543457, 9.70121955871582, 15.553287506103516, 101.51546478271484, 73.04306030273438, 10.07757568359375, 48.51513671875, 47.3707275390625, 16.509849548339844, 1.6860694885253906, -72.9867172241211, 55.0489501953125, 3.276214599609375, -0.6379432678222656, 99.23580932617188, 101.98172760009766, 64.537353515625, 32.383583068847656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000384.npy"} +{"epoch": 0.5804988662131519, "step": 385, "batch_size": 64, "mean": 60.028526306152344, "std": 70.40230560302734, "min": -62.691856384277344, "p10": -31.77743148803711, "median": 59.580257415771484, "p90": 158.5369384765625, "max": 195.06065368652344, "pos_frac": 0.75, "sample": [-56.16277313232422, -0.16888809204101562, 144.8145751953125, 100.767333984375, 52.57469177246094, 18.2891845703125, 59.27978515625, 93.55293273925781, 19.435287475585938, 42.0933837890625, -52.3520622253418, 80.84487915039062, 68.20156860351562, 140.53321838378906, 59.88072967529297, 122.13712310791016, 152.93905639648438, 113.827392578125, 3.8879928588867188, 57.715213775634766, -14.394561767578125, -29.191024780273438, -0.72412109375, 158.87908935546875, 157.73858642578125, 188.36500549316406, 36.013309478759766, 68.77662658691406, 28.64873504638672, 91.85446166992188, 86.67912292480469, -62.691856384277344, 73.13456726074219, -6.97015380859375, 65.67276000976562, 168.30392456054688, 125.78045654296875, 90.74203491210938, 77.92153930664062, 96.30780029296875, -24.949939727783203, -32.62065887451172, 110.05667114257812, 51.52699279785156, 10.949897766113281, 195.06065368652344, 180.0561065673828, -45.04481506347656, 2.661876678466797, -2.8080291748046875, -30.412139892578125, 41.325897216796875, -32.36255645751953, -15.912612915039062, 119.02218627929688, 89.67339324951172, 10.287322998046875, 145.22955322265625, -36.907798767089844, 179.67515563964844, 3.9034385681152344, 8.338798522949219, 161.9739227294922, 130.16567993164062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000385.npy"} +{"epoch": 0.582010582010582, "step": 386, "batch_size": 64, "mean": 39.41490173339844, "std": 69.47517395019531, "min": -153.38063049316406, "p10": -40.23428611755371, "median": 41.595970153808594, "p90": 123.80642089843752, "max": 179.1214141845703, "pos_frac": 0.734375, "sample": [125.95401000976562, -70.3085708618164, -5.383892059326172, 63.526336669921875, 74.41069030761719, -3.72998046875, 0.73193359375, 71.86445617675781, 66.90495300292969, 76.34971618652344, 17.83313751220703, 45.04393005371094, -110.56498718261719, 14.049415588378906, 28.108291625976562, 128.66552734375, 112.03182983398438, 108.87687683105469, 112.68863677978516, 97.26226806640625, 13.682989120483398, 80.48865509033203, 62.81218719482422, -42.529605865478516, -57.662071228027344, 116.12779235839844, 107.82969665527344, -33.09776306152344, 75.13557434082031, 68.48094940185547, 29.067054748535156, 108.5543212890625, -9.790153503417969, 45.3399658203125, -25.159175872802734, -30.46661376953125, 41.785560607910156, 28.173370361328125, 59.26337814331055, 153.98098754882812, 24.338348388671875, -34.8785400390625, 70.2460708618164, 99.44802856445312, 130.9124755859375, -33.08952713012695, -60.3077392578125, 35.68238067626953, 1.1816158294677734, 179.1214141845703, 5.147666931152344, -23.883132934570312, -117.85795593261719, 128.2253875732422, 178.79647827148438, 41.40637969970703, 36.55427551269531, 60.456634521484375, 69.71733093261719, 118.79537963867188, 24.181198120117188, -22.52877426147461, 17.937156677246094, -153.38063049316406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000386.npy"} +{"epoch": 0.5835222978080121, "step": 387, "batch_size": 64, "mean": 56.096248626708984, "std": 67.67647552490234, "min": -94.25682067871094, "p10": -24.9718204498291, "median": 41.59041976928711, "p90": 153.6830307006836, "max": 246.43666076660156, "pos_frac": 0.8125, "sample": [66.27885437011719, 9.368919372558594, 119.6075210571289, -28.172555923461914, 1.803741455078125, 177.1278839111328, 47.41334533691406, -24.127857208251953, 42.36888122558594, 246.43666076660156, 24.124757766723633, -4.115930557250977, 35.55909729003906, 40.81195831298828, 154.22315979003906, 6.110206604003906, 27.905136108398438, 127.00978088378906, 134.24656677246094, 37.64654541015625, 128.38748168945312, 158.3341064453125, 103.263916015625, -27.163814544677734, 4.956031799316406, 101.8421630859375, -4.121879577636719, 15.187952041625977, 136.43646240234375, 49.571319580078125, -2.094127655029297, -47.669952392578125, 40.109153747558594, 152.4227294921875, -37.713226318359375, 116.47266387939453, 63.87797927856445, 27.551790237426758, 19.859683990478516, 14.963821411132812, 0.5663356781005859, 52.355926513671875, 90.52205657958984, -94.25682067871094, -33.66426086425781, 45.64218521118164, 109.67475891113281, 176.64578247070312, 45.197914123535156, 140.3490447998047, -11.819332122802734, 40.39338684082031, 22.92120361328125, 58.57073974609375, 46.543701171875, 39.858516693115234, -25.333518981933594, 25.16602897644043, 70.1082763671875, 156.7639923095703, 205.92269897460938, 52.6995849609375, 30.246000289916992, 88.98473358154297], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000387.npy"} +{"epoch": 0.5850340136054422, "step": 388, "batch_size": 64, "mean": 37.09463119506836, "std": 80.85790252685547, "min": -129.52056884765625, "p10": -53.92568206787108, "median": 22.931095123291016, "p90": 139.8927764892578, "max": 258.28173828125, "pos_frac": 0.703125, "sample": [130.7224884033203, 75.789306640625, 90.72781372070312, 182.92845153808594, 38.77501678466797, 138.14576721191406, 33.96394348144531, 35.34382629394531, 21.54338836669922, -22.739112854003906, 31.94756317138672, 132.50283813476562, -16.209884643554688, 89.37555694580078, -6.936676025390625, 258.28173828125, 1.3724021911621094, 215.09120178222656, 18.823867797851562, 103.666015625, 115.79910278320312, 2.087554931640625, 140.9535675048828, 24.318801879882812, 141.61375427246094, -129.52056884765625, 68.32821655273438, 61.236663818359375, 13.024919509887695, 6.467058181762695, -5.624364852905273, -12.66187858581543, -7.18804931640625, 137.31655883789062, -21.16152000427246, 26.32562255859375, 27.928890228271484, -34.180084228515625, 47.372642517089844, -82.1802978515625, 49.614158630371094, 127.99807739257812, -121.76939392089844, 135.4382781982422, 136.29173278808594, 9.45074462890625, 12.585075378417969, 3.207477569580078, 18.467300415039062, 140.64149475097656, -5.308692932128906, 152.45091247558594, -43.69660949707031, 2.5301361083984375, -113.60298919677734, -58.3095703125, -42.39601135253906, 62.367767333984375, -17.024959564208984, 0.07776641845703125, 29.69073486328125, -87.95716094970703, -97.0565185546875, 6.994668960571289], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000388.npy"} +{"epoch": 0.5865457294028723, "step": 389, "batch_size": 64, "mean": 54.608154296875, "std": 75.38180541992188, "min": -142.78533935546875, "p10": -28.844689178466798, "median": 48.899295806884766, "p90": 154.12705078125, "max": 216.35043334960938, "pos_frac": 0.671875, "sample": [-43.05555725097656, -15.285764694213867, 82.59368896484375, 74.49942016601562, 98.28359985351562, 39.94099426269531, 101.25819396972656, 128.87936401367188, 193.4754638671875, 90.5972900390625, -27.94793701171875, -31.600143432617188, 85.533935546875, 102.22561645507812, 33.9559326171875, 86.64270782470703, 78.60467529296875, 142.9537353515625, 63.715576171875, 14.35549545288086, 136.6594696044922, 141.703369140625, -1.5200061798095703, 36.7745361328125, 109.40090942382812, -8.709236145019531, 134.60256958007812, -20.839698791503906, 36.04118347167969, 71.55401611328125, -32.08772277832031, 120.4252700805664, -13.905532836914062, 151.125732421875, 160.231689453125, 33.2701416015625, 173.70176696777344, 79.29044342041016, 27.252124786376953, -142.78533935546875, 182.392578125, -5.823627471923828, 7.56678581237793, -18.679927825927734, 57.85759735107422, -6.829010009765625, 137.40333557128906, -32.934871673583984, -81.27653503417969, 16.5655517578125, -14.659278869628906, 7.165035247802734, -22.57965087890625, -4.3350982666015625, -29.22901153564453, 172.6516876220703, 155.413330078125, 112.30926513671875, 62.98406982421875, 216.35043334960938, -10.506967544555664, 116.91575622558594, 4.738641738891602, -20.35007095336914], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000389.npy"} +{"epoch": 0.5880574452003023, "step": 390, "batch_size": 64, "mean": 45.414710998535156, "std": 67.74742126464844, "min": -131.75274658203125, "p10": -32.834086608886714, "median": 36.432701110839844, "p90": 135.91701354980472, "max": 187.14218139648438, "pos_frac": 0.765625, "sample": [-34.04139709472656, 66.61661529541016, 58.747718811035156, 23.7537841796875, 120.35926055908203, 33.467002868652344, 106.68440246582031, 105.31328582763672, -44.90336608886719, 39.89380645751953, 3.221700668334961, -30.01702880859375, 107.28114318847656, 23.302228927612305, -3.1269607543945312, 187.14218139648438, 126.67314910888672, -43.88965606689453, 84.01296997070312, -44.016990661621094, 92.26008605957031, 14.102760314941406, 12.4139404296875, 159.68096923828125, 145.3155517578125, 130.90774536132812, 20.520538330078125, -67.95671081542969, 4.222904205322266, 107.90026092529297, -28.725685119628906, 8.458708763122559, -19.32966423034668, 56.084373474121094, -12.94968032836914, -24.14385223388672, -131.75274658203125, 121.24234008789062, 144.26516723632812, 0.5355758666992188, 138.0638427734375, 12.311498641967773, -0.5826492309570312, 47.86271667480469, 1.2259483337402344, 75.64424133300781, 13.110679626464844, 25.98846435546875, 182.71383666992188, 39.398399353027344, 126.97164154052734, 88.01844787597656, 10.184371948242188, 46.68883514404297, 6.765537261962891, 94.74249267578125, 4.034189224243164, -66.93461608886719, 71.69621276855469, -18.500822067260742, 80.52790832519531, 65.66844940185547, 75.86286163330078, 165.5524139404297], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000390.npy"} +{"epoch": 0.5895691609977324, "step": 391, "batch_size": 64, "mean": 54.96485900878906, "std": 81.22235107421875, "min": -145.46377563476562, "p10": -40.09121475219726, "median": 57.46208572387695, "p90": 153.93846282958984, "max": 249.11277770996094, "pos_frac": 0.75, "sample": [27.041854858398438, -145.46377563476562, 155.17404174804688, 56.30021667480469, 54.405906677246094, 154.01702880859375, -3.7201271057128906, 149.37384033203125, 149.0746612548828, 240.483154296875, 54.555145263671875, -112.15647888183594, 110.28579711914062, -4.4078826904296875, 78.18574523925781, 180.59210205078125, -104.04534149169922, 36.89166259765625, -35.612335205078125, 27.60613250732422, -1.7836112976074219, 108.30235290527344, 90.9501953125, 58.62395477294922, 24.05945587158203, -37.06817626953125, -101.24951171875, -17.94469451904297, 69.54708862304688, -16.00249481201172, 249.11277770996094, 110.03736877441406, 75.59410095214844, -7.528228759765625, 61.795440673828125, 1.6501121520996094, 12.071290969848633, 73.0115966796875, 93.86717224121094, 124.54842376708984, 97.95777130126953, 82.53244018554688, -97.52061462402344, -44.50471496582031, 70.89667510986328, 38.05947494506836, 165.9168701171875, 31.882850646972656, 135.62612915039062, 128.12139892578125, 23.189849853515625, -12.032058715820312, 153.75514221191406, 120.22042846679688, 165.2991943359375, 106.94808959960938, 93.05631256103516, 50.74407196044922, -41.386802673339844, 11.718032836914062, 35.82365417480469, 61.90510940551758, 92.4661636352539, 6.8993988037109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000391.npy"} +{"epoch": 0.5910808767951625, "step": 392, "batch_size": 64, "mean": 57.89107894897461, "std": 85.45677947998047, "min": -155.45611572265625, "p10": -27.08631439208984, "median": 48.70254898071289, "p90": 171.37695465087893, "max": 298.9761962890625, "pos_frac": 0.796875, "sample": [-121.04228973388672, -1.3119430541992188, 32.86144256591797, 37.53559875488281, 31.033416748046875, -15.202888488769531, 149.43505859375, -29.399307250976562, 91.79122924804688, 138.97238159179688, 48.04008483886719, -155.45611572265625, 100.69346618652344, 150.52731323242188, 192.31790161132812, 50.44621276855469, 5.953155517578125, 127.80999755859375, 166.08131408691406, 22.1317138671875, 49.365013122558594, -2.2040252685546875, 58.69562530517578, -87.71954345703125, 101.1820068359375, 130.664794921875, 159.7650146484375, 57.280738830566406, 71.4085693359375, -84.02494812011719, 54.229736328125, 186.92213439941406, 101.911865234375, 11.950981140136719, -55.4984130859375, 60.981712341308594, 23.70738410949707, 82.01109313964844, 76.54731750488281, 130.52781677246094, 190.03582763671875, 181.23895263671875, -71.15357208251953, 161.56488037109375, 1.35198974609375, 2.5462722778320312, 6.278469085693359, 23.466796875, 173.64651489257812, 4.31402587890625, -4.5180511474609375, 298.9761962890625, 6.890201568603516, 43.80841064453125, -21.47564697265625, 7.111005783081055, 217.896240234375, -21.6893310546875, 23.653411865234375, 111.65093994140625, 7.56285285949707, 101.59221649169922, 23.152679443359375, 86.20516967773438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000392.npy"} +{"epoch": 0.5925925925925926, "step": 393, "batch_size": 64, "mean": 61.085289001464844, "std": 71.46766662597656, "min": -92.52708435058594, "p10": -15.365423774719238, "median": 52.74745178222656, "p90": 156.0672393798828, "max": 224.23565673828125, "pos_frac": 0.78125, "sample": [64.92240905761719, -6.859628677368164, 105.81973266601562, 156.8163604736328, 153.12437438964844, 103.34996795654297, 27.581134796142578, 66.07686614990234, 70.61750030517578, 43.683048248291016, -14.984655380249023, 1.6454238891601562, 176.8505859375, 122.23013305664062, 49.49254608154297, -35.75553894042969, 0.12822723388671875, 162.42213439941406, 7.427787780761719, -0.028926849365234375, -15.528610229492188, 6.294527053833008, 96.97030639648438, 174.22567749023438, 90.45649719238281, 145.1251983642578, -23.379175186157227, 129.00132751464844, 109.28411865234375, 124.46388244628906, 54.65997314453125, -57.07851791381836, 166.2202606201172, 154.3192901611328, 1.0644168853759766, 52.88883972167969, -74.53697204589844, 170.22900390625, -1.6100234985351562, -8.07496452331543, 74.24817657470703, 23.540908813476562, 122.14229583740234, -11.862003326416016, 44.63237762451172, 110.89974975585938, 132.31130981445312, 12.99468994140625, 36.239742279052734, 153.00558471679688, 145.93678283691406, 224.23565673828125, 71.70683288574219, -8.610710144042969, 19.69153594970703, 111.97948455810547, 17.847122192382812, 52.60606384277344, -92.52708435058594, -25.677627563476562, 15.565071105957031, 116.97579956054688, 0.8750762939453125, 11.147323608398438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000393.npy"} +{"epoch": 0.5941043083900227, "step": 394, "batch_size": 64, "mean": 49.6251220703125, "std": 63.1920051574707, "min": -123.76068115234375, "p10": -34.15351982116699, "median": 54.02333068847656, "p90": 129.18190841674812, "max": 198.76406860351562, "pos_frac": 0.796875, "sample": [25.711929321289062, 151.84385681152344, 112.77880859375, 16.956436157226562, 11.5926513671875, 39.34515380859375, -11.981155395507812, 43.40338134765625, 164.99444580078125, 53.59516143798828, 157.59054565429688, 89.31840515136719, 36.1827507019043, 35.25667190551758, -54.0279655456543, 48.676597595214844, -10.748401641845703, -20.44780158996582, -43.370025634765625, 24.519695281982422, 108.33943176269531, -29.82242202758789, 63.571285247802734, 66.41506958007812, 69.3681411743164, 170.03128051757812, 115.95819854736328, 91.31320190429688, 96.41193389892578, 2.9440994262695312, -86.86192321777344, 24.245223999023438, 138.99903869628906, 68.96318054199219, 41.68434143066406, 75.30548095703125, -1.098592758178711, 66.96986389160156, 61.7452392578125, 11.396343231201172, 87.70793151855469, -41.99592971801758, -36.00970458984375, 54.451499938964844, 72.80848693847656, 198.76406860351562, -123.76068115234375, 102.04991149902344, -1.1864089965820312, 56.5565185546875, -77.89454650878906, 94.54816436767578, 54.949058532714844, 78.48329162597656, 50.0472412109375, 63.99481964111328, 64.62388610839844, 104.27246856689453, 10.313987731933594, 39.234710693359375, 19.763870239257812, 134.84921264648438, 44.77899169921875, 97.58734893798828], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000394.npy"} +{"epoch": 0.5956160241874527, "step": 395, "batch_size": 64, "mean": 44.7777099609375, "std": 69.31011962890625, "min": -102.1764907836914, "p10": -23.615882492065428, "median": 26.238128662109375, "p90": 135.6009078979492, "max": 235.93032836914062, "pos_frac": 0.734375, "sample": [101.52155303955078, 132.43157958984375, 102.20310974121094, 5.638427734375, 115.48878479003906, 58.132415771484375, -2.8376216888427734, 78.52327728271484, 164.62338256835938, -17.249483108520508, 24.110855102539062, 64.45947265625, 151.27015686035156, 119.82079315185547, 20.49152374267578, 156.49278259277344, -4.2118377685546875, 78.67251586914062, 42.352996826171875, 9.24371337890625, -4.394828796386719, 19.80805206298828, 8.185104370117188, 54.41526412963867, 109.11630249023438, -102.1764907836914, 44.82398223876953, 132.77828979492188, 44.309383392333984, -6.120796203613281, 63.29991912841797, 235.93032836914062, 47.789093017578125, 39.549476623535156, -69.38371276855469, 25.155197143554688, -21.923595428466797, 14.552120208740234, 101.92777252197266, -24.341148376464844, -5.5104217529296875, 1.771615982055664, 136.4032440185547, 21.12087631225586, 14.995121002197266, 64.58061218261719, -1.5793075561523438, 172.46812438964844, -58.08363342285156, -9.703523635864258, 6.597942352294922, 217.6265106201172, -51.095611572265625, 5.455738067626953, 28.737472534179688, 133.72879028320312, -45.99174880981445, 27.321060180664062, 76.81629943847656, -63.30109405517578, 12.028350830078125, -15.539352416992188, 8.685907363891602, 73.76241302490234], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000395.npy"} +{"epoch": 0.5971277399848829, "step": 396, "batch_size": 64, "mean": 50.464759826660156, "std": 68.76835632324219, "min": -112.21709442138672, "p10": -29.578908538818357, "median": 37.54685592651367, "p90": 147.84925079345703, "max": 236.13478088378906, "pos_frac": 0.8125, "sample": [151.44583129882812, 236.13478088378906, 146.43576049804688, 144.59368896484375, 120.94474792480469, 95.9561538696289, 22.935192108154297, 139.99502563476562, 39.369300842285156, 30.548553466796875, 70.12398529052734, 10.448776245117188, 110.3494644165039, -31.07949447631836, 44.452232360839844, -1.6749725341796875, 53.0345458984375, 71.7406997680664, 1.0095176696777344, 59.71818542480469, 35.72441101074219, -32.61613464355469, 173.64035034179688, 45.38636016845703, 1.9860610961914062, 39.55213165283203, 85.09437561035156, -112.21709442138672, 120.27156066894531, 91.19853210449219, 10.723400115966797, -56.20957565307617, 1.3156089782714844, 136.74632263183594, 48.420562744140625, 35.184471130371094, 73.76646423339844, 25.898841857910156, 173.40103149414062, 184.35748291015625, -5.099742889404297, 23.2768611907959, 0.7688636779785156, 77.37051391601562, 7.136726379394531, 47.99897766113281, 11.929115295410156, 15.399848937988281, 71.39474487304688, -36.03813934326172, 12.195625305175781, -26.07754135131836, 17.96299934387207, 12.85934829711914, -3.1731605529785156, 142.63571166992188, 51.389488220214844, 151.1369171142578, 6.669284820556641, 23.484811782836914, -41.51676940917969, -68.7799072265625, -9.742118835449219, 148.4550323486328], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000396.npy"} +{"epoch": 0.5986394557823129, "step": 397, "batch_size": 64, "mean": 27.008699417114258, "std": 80.33943176269531, "min": -177.1779327392578, "p10": -62.778596496582026, "median": 27.4896879196167, "p90": 123.91083526611331, "max": 256.2907409667969, "pos_frac": 0.671875, "sample": [-1.0184650421142578, 20.078758239746094, -63.77131652832031, 45.73541259765625, -36.32373809814453, 50.52020263671875, 93.95512390136719, 34.39588165283203, 127.18428039550781, -9.751205444335938, 3.11346435546875, 56.47054672241211, 33.99126434326172, 82.50703430175781, 66.6955795288086, 78.34525299072266, -159.28018188476562, -84.579345703125, 45.150753021240234, -6.035469055175781, 90.64427185058594, -13.848648071289062, 56.184608459472656, 92.15985107421875, 9.776908874511719, -177.1779327392578, -60.462249755859375, 16.977676391601562, 155.1710205078125, 58.359130859375, 15.935462951660156, 20.98811149597168, 135.05929565429688, 48.439117431640625, 140.55897521972656, -20.601837158203125, 43.38137435913086, 115.19403076171875, 92.734619140625, 7.801530838012695, 12.408660888671875, 174.08438110351562, 115.73641967773438, 36.50868225097656, -163.148193359375, 53.46467590332031, 256.2907409667969, -59.4449462890625, -37.65538024902344, 2.0644073486328125, -0.21627426147460938, 48.6822509765625, -5.854011535644531, 11.988113403320312, 0.3688640594482422, -26.959983825683594, 35.872718811035156, 39.49632263183594, -24.721145629882812, 116.27279663085938, -140.63955688476562, -81.0238265991211, -2.6211299896240234, 162.94314575195312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000397.npy"} +{"epoch": 0.600151171579743, "step": 398, "batch_size": 64, "mean": 62.283084869384766, "std": 75.5166244506836, "min": -58.055809020996094, "p10": -16.3873737335205, "median": 50.06866455078125, "p90": 161.38458862304688, "max": 338.0654296875, "pos_frac": 0.78125, "sample": [129.81312561035156, 61.26054000854492, 101.47959899902344, 57.85523986816406, 160.6511993408203, 16.383609771728516, 161.6988983154297, 188.076416015625, -18.721603393554688, 162.00735473632812, 102.92485046386719, 22.735733032226562, -10.71295166015625, -8.86224365234375, 106.56932067871094, 8.903945922851562, 110.99571990966797, -8.854957580566406, 66.57315063476562, -57.46049880981445, 99.74507141113281, 2.775350570678711, 163.51629638671875, 210.2097625732422, 1.0753021240234375, 146.9150390625, 125.52617645263672, 100.15699005126953, 37.43614959716797, 39.535377502441406, -21.348583221435547, 43.668914794921875, 19.767242431640625, 107.54017639160156, 4.564277648925781, -8.72233772277832, 33.66145324707031, 137.64488220214844, 19.75086212158203, 57.980865478515625, -32.27571105957031, -23.689659118652344, 129.66921997070312, 56.468414306640625, 94.99765014648438, 116.0677719116211, 20.08070945739746, 6.209327697753906, -10.635517120361328, 60.015010833740234, 3.9628982543945312, 338.0654296875, 27.836708068847656, -3.5522842407226562, 71.22276306152344, -23.234458923339844, 191.95718383789062, -58.055809020996094, 63.46576690673828, 8.682489395141602, -10.940837860107422, 119.94092559814453, 156.8570556640625, 8.28660774230957], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000398.npy"} +{"epoch": 0.6016628873771731, "step": 399, "batch_size": 64, "mean": 69.84799194335938, "std": 85.83064270019531, "min": -83.62965393066406, "p10": -23.596253204345704, "median": 56.286542892456055, "p90": 170.48277130126954, "max": 389.69610595703125, "pos_frac": 0.78125, "sample": [91.38523864746094, 43.338279724121094, 110.45275115966797, 198.37017822265625, -23.650894165039062, 131.858154296875, 139.2843017578125, 34.64930725097656, -5.073688507080078, -11.258201599121094, -67.33882141113281, 81.57864379882812, 73.68214416503906, -53.6962776184082, 45.42616271972656, 56.40016174316406, 60.33949279785156, 105.36276245117188, 68.13949584960938, 214.69873046875, -47.147125244140625, -20.839004516601562, -83.62965393066406, 110.6624755859375, 253.62814331054688, 16.711227416992188, 21.304698944091797, 389.69610595703125, 15.013069152832031, 15.801322937011719, 19.48383331298828, 1.206197738647461, 54.75599670410156, 32.1526985168457, 31.422332763671875, -20.592811584472656, 57.92186737060547, 164.8011016845703, 54.234642028808594, 180.30067443847656, 43.07951354980469, 1.3306140899658203, 166.91871643066406, -23.28973388671875, 164.52850341796875, 98.14832305908203, 61.734153747558594, 56.17292404174805, -40.57904052734375, -23.46875762939453, 154.08872985839844, 164.6580047607422, 152.4339599609375, 109.30794525146484, 120.54319763183594, 151.10433959960938, 101.64230346679688, 181.3337860107422, 33.112884521484375, -26.584888458251953, 172.01022338867188, -10.265689849853516, 73.21395111083984, 48.261680603027344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000399.npy"} +{"epoch": 0.6031746031746031, "step": 400, "batch_size": 64, "mean": 39.76671600341797, "std": 71.26953125, "min": -130.561279296875, "p10": -36.39818649291992, "median": 26.892040252685547, "p90": 130.09062957763675, "max": 199.18370056152344, "pos_frac": 0.71875, "sample": [-9.34048843383789, 82.8164291381836, 27.511856079101562, -30.053512573242188, 104.88360595703125, 110.13984680175781, 26.39940643310547, 100.83979797363281, 70.86843872070312, 132.0418243408203, 38.26114273071289, -45.58684539794922, 37.008602142333984, 3.7253360748291016, 0.2765235900878906, -1.4066162109375, 27.384674072265625, 141.8042755126953, 109.13286590576172, 114.51512145996094, -6.9222412109375, 27.742481231689453, 85.97946166992188, 12.095041275024414, -102.94171142578125, 82.2842025756836, 14.254873275756836, 17.711090087890625, 17.24679946899414, -6.27275276184082, -81.49835205078125, -5.876066207885742, 101.34489440917969, 3.286285400390625, 161.3765411376953, -5.288471221923828, -60.29618835449219, 19.852367401123047, 125.537841796875, 94.35595703125, 169.34939575195312, 107.95893096923828, -130.561279296875, 94.85647583007812, 6.881843566894531, 31.62580108642578, 8.964141845703125, -29.750473022460938, -14.777137756347656, 199.18370056152344, 45.01339340209961, 119.1218490600586, -39.117332458496094, 43.94976043701172, -15.89771842956543, 167.03305053710938, 177.13583374023438, 50.97857666015625, 21.188743591308594, 22.09002685546875, -117.3452377319336, -11.443859100341797, 21.381980895996094, 82.05506896972656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000400.npy"} +{"epoch": 0.6046863189720333, "step": 401, "batch_size": 64, "mean": 60.22024917602539, "std": 72.79557800292969, "min": -59.4875373840332, "p10": -25.308366584777822, "median": 45.85165023803711, "p90": 168.04096984863284, "max": 213.34976196289062, "pos_frac": 0.78125, "sample": [-6.605049133300781, 118.02088928222656, 131.4637451171875, 63.2401123046875, -28.726131439208984, 1.9896011352539062, 22.857337951660156, 46.12531280517578, -30.516483306884766, 2.4680557250976562, 169.64776611328125, -4.2096405029296875, -59.4875373840332, -6.7285614013671875, 25.97905731201172, -31.862831115722656, 113.31768798828125, 211.89096069335938, 132.27828979492188, 153.65829467773438, 55.36095428466797, 67.72348022460938, 31.324508666992188, 29.08371353149414, -49.011749267578125, -49.105064392089844, 63.80747985839844, 78.1432113647461, 63.40718078613281, 49.952064514160156, 108.17376708984375, 33.94658660888672, 16.707483291625977, 152.66775512695312, -5.128318786621094, 164.29177856445312, 5.727384567260742, 112.15380096435547, 15.29753303527832, 169.79238891601562, 11.414764404296875, 160.6907501220703, 105.673828125, -17.333581924438477, 172.12570190429688, 9.46579360961914, -1.861419677734375, 207.13058471679688, 152.62857055664062, 95.28197479248047, 73.21001434326172, 3.2883129119873047, 14.98355484008789, 14.385971069335938, -50.46280288696289, 67.9637680053711, 71.02232360839844, 24.35309410095215, 155.62210083007812, 170.0772247314453, 45.57798767089844, -9.668018341064453, 26.05881118774414, 213.34976196289062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000401.npy"} +{"epoch": 0.6061980347694633, "step": 402, "batch_size": 64, "mean": 46.896968841552734, "std": 76.8852310180664, "min": -105.79878234863281, "p10": -49.53963775634765, "median": 34.69293975830078, "p90": 147.70838012695316, "max": 193.68751525878906, "pos_frac": 0.765625, "sample": [87.89152526855469, 160.968994140625, 107.26153564453125, 112.11821746826172, 109.07908630371094, 75.08463287353516, 193.68751525878906, 30.18756103515625, 32.75578308105469, 82.4292984008789, -17.791160583496094, 187.5196533203125, 39.578590393066406, -50.77935791015625, 52.50360107421875, 43.354679107666016, 5.740203857421875, 21.140283584594727, 17.425331115722656, 29.793548583984375, 113.9167251586914, 2.0593109130859375, 4.964179992675781, -94.51103210449219, 185.42172241210938, 6.923618316650391, 71.26983642578125, 139.45782470703125, 60.28029251098633, 21.42961883544922, 174.27207946777344, 134.05126953125, -11.660079956054688, 79.92536926269531, -8.490036010742188, 42.04431915283203, 140.67556762695312, 134.65383911132812, 18.141403198242188, 71.68834686279297, -53.47718811035156, -84.18397521972656, -105.40786743164062, 101.99553680419922, 33.84611511230469, 8.01679801940918, 35.539764404296875, -43.86680603027344, 12.869544982910156, 2.267627716064453, 120.58623504638672, 150.72244262695312, 116.73715209960938, 177.38414001464844, -44.11454772949219, -8.892675399780273, -18.37041473388672, -103.42674255371094, -105.79878234863281, 62.03047180175781, 29.093517303466797, 126.6414566040039, -46.64695739746094, 31.39739990234375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000402.npy"} +{"epoch": 0.6077097505668935, "step": 403, "batch_size": 64, "mean": 61.4372673034668, "std": 81.09626007080078, "min": -135.40512084960938, "p10": -30.511787414550778, "median": 39.93813705444336, "p90": 159.43758392333984, "max": 305.57171630859375, "pos_frac": 0.796875, "sample": [-6.354286193847656, 11.29888916015625, 218.81002807617188, 31.479843139648438, 153.94497680664062, 33.71647644042969, 198.99725341796875, 108.37599182128906, 18.615432739257812, 0.8830108642578125, 55.816810607910156, -43.47059631347656, 123.99345397949219, -31.791385650634766, 140.86094665527344, 89.20843505859375, 47.48773956298828, 12.893182754516602, 35.66825866699219, 10.280889511108398, -5.67341423034668, -37.87459945678711, 305.57171630859375, 158.71783447265625, -9.811767578125, 106.2845458984375, 156.95864868164062, 6.803140640258789, 159.7460479736328, 21.91590118408203, -1.0035896301269531, 60.72047424316406, 37.72425842285156, 22.16217803955078, 58.28601837158203, -27.526058197021484, 12.340436935424805, 162.05410766601562, 36.576202392578125, 104.41421508789062, 35.979583740234375, 0.7725238800048828, 155.31301879882812, 31.08126449584961, 116.02870178222656, -25.206756591796875, 109.69331359863281, 125.63036346435547, 82.69981384277344, 43.55810546875, 138.49172973632812, 164.35665893554688, -135.40512084960938, -33.52096176147461, 193.68521118164062, -105.2340087890625, 131.52090454101562, 58.315879821777344, 34.150753021240234, 149.15505981445312, -50.8006591796875, 14.499427795410156, 42.152015686035156, 115.9665756225586], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000403.npy"} +{"epoch": 0.6092214663643235, "step": 404, "batch_size": 64, "mean": 61.26074981689453, "std": 83.51371002197266, "min": -103.88150024414062, "p10": -40.11311874389648, "median": 55.974266052246094, "p90": 170.1452590942383, "max": 247.8746337890625, "pos_frac": 0.703125, "sample": [-15.92840576171875, 47.26094055175781, 97.49015045166016, 4.3848114013671875, 55.43328094482422, -6.159980773925781, 93.92369842529297, 16.182464599609375, -35.80962371826172, -41.95747375488281, 167.46224975585938, -33.50567626953125, -103.88150024414062, -81.87115478515625, -0.6132354736328125, 199.1240234375, -25.78527069091797, -3.0440597534179688, 160.38653564453125, 172.81893920898438, 100.9078369140625, 112.4141616821289, 118.451904296875, 186.82907104492188, -35.37309265136719, 133.67733764648438, -53.82398986816406, 189.84130859375, 116.7064208984375, 127.94331359863281, 12.664470672607422, 106.73043823242188, -11.317289352416992, 129.77548217773438, -19.509117126464844, 6.138862609863281, 27.369606018066406, 123.83956146240234, 87.88880157470703, -1.0537071228027344, 9.562416076660156, -0.406768798828125, 116.1376953125, 49.84814453125, 145.34652709960938, 24.156269073486328, 109.47372436523438, 161.00494384765625, 171.2951202392578, 56.51525115966797, 1.2309761047363281, 247.8746337890625, 240.1617431640625, 60.45188903808594, 129.2510223388672, 115.46471405029297, 163.59848022460938, -46.614990234375, -60.07255554199219, -54.31599426269531, 59.068695068359375, 57.717044830322266, 11.487335205078125, 26.439598083496094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000404.npy"} +{"epoch": 0.6107331821617535, "step": 405, "batch_size": 64, "mean": 48.31888198852539, "std": 72.29337310791016, "min": -111.48072052001953, "p10": -23.253609466552735, "median": 30.671204566955566, "p90": 156.17932739257813, "max": 199.912353515625, "pos_frac": 0.6875, "sample": [146.42434692382812, -15.582317352294922, -45.93911361694336, 170.9646453857422, 38.89476776123047, 12.988716125488281, 153.4357452392578, 3.2122344970703125, -4.518344879150391, -48.819480895996094, -11.474868774414062, 6.809236526489258, 7.334878921508789, -8.929901123046875, 59.324546813964844, 15.422889709472656, 199.912353515625, -2.1586055755615234, -5.466064453125, 78.49295043945312, 149.45684814453125, 141.40667724609375, 16.755722045898438, 89.91212463378906, -2.2998886108398438, 33.887081146240234, 116.62594604492188, 157.3551483154297, -29.757896423339844, 89.95597076416016, 23.242389678955078, -6.815143585205078, 123.33888244628906, 139.61734008789062, -23.18560791015625, 74.67337799072266, 20.300769805908203, -111.48072052001953, 51.66814422607422, 57.89556884765625, 31.798465728759766, -38.78385925292969, 42.42150115966797, 30.354555130004883, 3.2299270629882812, 15.293432235717773, 7.234931945800781, 45.466636657714844, 187.16888427734375, 128.82635498046875, -22.910076141357422, -16.745452880859375, 94.22296142578125, 30.98785400390625, 160.2303466796875, 167.23876953125, -8.293045043945312, 45.08530807495117, 111.56165313720703, -59.4451904296875, -13.807472229003906, 192.3017578125, 119.37144470214844, -23.282752990722656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000405.npy"} +{"epoch": 0.6122448979591837, "step": 406, "batch_size": 64, "mean": 62.92144775390625, "std": 81.50392150878906, "min": -146.66786193847656, "p10": -33.08088397979736, "median": 61.8923454284668, "p90": 164.16001586914064, "max": 219.43247985839844, "pos_frac": 0.75, "sample": [152.0439453125, 35.009300231933594, -29.661252975463867, -19.93817138671875, 102.78411865234375, 95.87932586669922, 128.1616668701172, 156.77691650390625, -34.54644012451172, 202.88572692871094, 109.13776397705078, 118.4135513305664, 0.3539009094238281, -14.417770385742188, 165.23403930664062, 219.43247985839844, 174.20285034179688, 28.050500869750977, 51.32167053222656, 161.65396118164062, 85.29727172851562, 31.89867401123047, 93.68687438964844, 82.8175277709961, 28.307579040527344, 111.37945556640625, -26.508190155029297, 111.54945373535156, -5.42943000793457, 42.96628952026367, -1.4768257141113281, -0.6471900939941406, -111.68405151367188, -14.48288345336914, 47.741668701171875, 156.03677368164062, 51.37853240966797, 167.01161193847656, -63.742008209228516, 178.94607543945312, 85.40249633789062, 28.899566650390625, 49.507789611816406, 195.51246643066406, 16.21435546875, 148.69180297851562, -71.03033447265625, 11.761598587036133, 114.18511199951172, 143.48822021484375, 22.977537155151367, -55.60630798339844, 143.8060760498047, -71.80885314941406, 14.993392944335938, -146.66786193847656, 77.57510375976562, 119.12152099609375, -16.997032165527344, 24.340621948242188, 145.88047790527344, 96.32797241210938, 72.40615844726562, 110.16545104980469], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000406.npy"} +{"epoch": 0.6137566137566137, "step": 407, "batch_size": 64, "mean": 49.62183380126953, "std": 83.4005126953125, "min": -175.99249267578125, "p10": -38.204650497436525, "median": 50.04437255859375, "p90": 160.4184539794922, "max": 232.86228942871094, "pos_frac": 0.71875, "sample": [1.0925979614257812, 2.430238723754883, -5.59356689453125, 72.06456756591797, -37.629371643066406, 136.10546875, 163.4323272705078, -29.175460815429688, -96.89935302734375, 103.2950439453125, 65.02337646484375, 54.868099212646484, 2.8536376953125, 6.48431396484375, -82.1470947265625, 12.293190002441406, 81.29962921142578, 120.04888153076172, 179.0706024169922, 152.93565368652344, 53.9820556640625, 7.629205703735352, 76.626708984375, 46.106689453125, 85.76742553710938, 69.71609497070312, 1.3188247680664062, -11.275192260742188, 111.28424072265625, 190.54840087890625, 90.88671875, 3.8486404418945312, 161.53335571289062, 157.8170166015625, 147.38589477539062, 5.3729248046875, -83.83401489257812, 147.19183349609375, -35.21000671386719, 29.179115295410156, -21.890792846679688, 108.60537719726562, 138.59674072265625, 56.45679473876953, 171.60679626464844, 232.86228942871094, 99.01966094970703, 8.9046630859375, 202.64999389648438, -0.8563041687011719, 30.627517700195312, -175.99249267578125, -91.67544555664062, -36.321197509765625, -41.673553466796875, 22.059795379638672, -18.577669143676758, 141.75823974609375, -38.45119857788086, -8.850746154785156, -3.9675369262695312, 81.45341491699219, 63.631874084472656, 98.09223937988281], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000407.npy"} +{"epoch": 0.6152683295540439, "step": 408, "batch_size": 64, "mean": 70.90786743164062, "std": 74.64531707763672, "min": -98.93890380859375, "p10": -17.722768402099607, "median": 69.6647720336914, "p90": 171.5203536987305, "max": 206.86619567871094, "pos_frac": 0.8125, "sample": [48.15680694580078, 155.66990661621094, 127.82061767578125, 93.546142578125, 2.1859092712402344, -50.43373107910156, -98.93890380859375, 4.770198822021484, 121.51551055908203, 70.8457260131836, 37.08940124511719, 186.905517578125, -0.9705562591552734, 96.67881774902344, 133.57362365722656, 197.32736206054688, 33.426570892333984, -22.685020446777344, 62.30628204345703, 28.777740478515625, 87.39680480957031, 8.607933044433594, -5.126413345336914, 128.67466735839844, 199.03659057617188, -63.292724609375, 51.97943878173828, 180.86044311523438, 110.82536315917969, 137.4287872314453, 166.4435272216797, -24.86606216430664, 98.94284057617188, 10.872526168823242, 24.626113891601562, 155.42759704589844, 44.21345901489258, -18.238882064819336, 206.86619567871094, 69.62565612792969, 47.89482879638672, 149.3625946044922, 161.24276733398438, 173.69613647460938, 124.33741760253906, 21.369482040405273, 129.2322998046875, -16.518503189086914, 45.4639892578125, 1.8770599365234375, 139.83740234375, 82.73350524902344, 182.3289794921875, -90.95128631591797, 123.83133697509766, 102.85948181152344, 38.70454788208008, -2.8507041931152344, 13.455001831054688, 44.70266342163086, 114.49198150634766, 69.70388793945312, -1.3440704345703125, 84.77071380615234], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000408.npy"} +{"epoch": 0.6167800453514739, "step": 409, "batch_size": 64, "mean": 35.28793716430664, "std": 71.05015563964844, "min": -129.77392578125, "p10": -37.27924919128417, "median": 18.649288177490234, "p90": 139.31838073730472, "max": 183.98434448242188, "pos_frac": 0.640625, "sample": [19.506912231445312, 6.701066970825195, -18.412796020507812, -23.15350341796875, 1.5351905822753906, -12.16135025024414, 32.68158721923828, -22.547969818115234, 31.97000503540039, -28.692298889160156, -29.065715789794922, 162.06829833984375, -8.650651931762695, 171.2193603515625, 80.92266845703125, 7.6854248046875, 38.15478515625, -3.30078125, 1.0647163391113281, 174.34725952148438, 125.96417999267578, -41.75668716430664, 110.52976989746094, 142.05178833007812, 17.791664123535156, -54.202728271484375, -14.429031372070312, 79.66459655761719, 47.13848876953125, -12.3475341796875, -39.12968444824219, 55.83573913574219, 105.74547576904297, -32.96156692504883, 112.33405303955078, -6.391347885131836, 132.9404296875, 109.23929595947266, 44.46478271484375, 26.824872970581055, -39.42081832885742, -12.029777526855469, 71.50184631347656, -67.50820922851562, 14.45794677734375, -15.915115356445312, 15.694412231445312, 44.84584426879883, -127.2669677734375, 167.07289123535156, 12.676380157470703, 124.91236114501953, -0.7452392578125, 172.98846435546875, -129.77392578125, 11.034706115722656, 51.201080322265625, 57.47284698486328, 70.3281021118164, 64.6138916015625, 183.98434448242188, -29.525861740112305, 73.80648803710938, 52.84360122680664], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000409.npy"} +{"epoch": 0.618291761148904, "step": 410, "batch_size": 64, "mean": 57.0670051574707, "std": 66.2297134399414, "min": -103.50502014160156, "p10": -23.95414810180664, "median": 55.45488357543945, "p90": 140.82535400390628, "max": 231.84852600097656, "pos_frac": 0.828125, "sample": [62.53258514404297, 67.43818664550781, 27.472042083740234, -3.597789764404297, 157.87600708007812, 38.04437255859375, 87.752197265625, 29.079792022705078, -42.9034423828125, -103.50502014160156, 70.32427215576172, 143.59400939941406, 5.341705322265625, -60.40192413330078, 130.9951171875, 88.31807708740234, 125.86660766601562, -41.822784423828125, 85.21114349365234, 164.67079162597656, 231.84852600097656, 49.67150115966797, 38.66656494140625, 80.94544219970703, 17.53704833984375, 98.72322082519531, 11.871810913085938, 89.596435546875, 40.612815856933594, -22.96393585205078, 106.5655517578125, -24.378524780273438, 19.616741180419922, 114.83895111083984, 26.509918212890625, 188.53067016601562, 134.3651580810547, 29.851245880126953, 44.76068115234375, 60.356048583984375, -13.869941711425781, -41.79498291015625, 75.99559783935547, 58.72776794433594, 108.26639556884766, 69.91835021972656, 130.48231506347656, -3.086273193359375, 15.604808807373047, 94.1605224609375, 32.45524597167969, 61.27069091796875, 202.046142578125, 73.91950988769531, 45.24671936035156, 61.643592834472656, 5.199695587158203, 33.45420837402344, 4.60626220703125, 106.9835205078125, 156.331298828125, 52.18199920654297, -65.48748779296875, 18.220558166503906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000410.npy"} +{"epoch": 0.6198034769463341, "step": 411, "batch_size": 64, "mean": 56.124996185302734, "std": 79.95755004882812, "min": -171.31591796875, "p10": -34.73931427001953, "median": 50.81592559814453, "p90": 157.18885498046876, "max": 292.2886657714844, "pos_frac": 0.71875, "sample": [-15.411842346191406, 143.04368591308594, 118.07408142089844, 140.09527587890625, 79.35103607177734, -12.716033935546875, 13.192916870117188, -171.31591796875, 88.25211334228516, 5.258277893066406, 78.60991668701172, 175.3682861328125, 93.39019012451172, 85.43365478515625, 123.97702026367188, 53.48723602294922, 92.30361938476562, -48.71251678466797, 74.28873443603516, 56.33665466308594, 7.531227111816406, 170.8767547607422, 167.08953857421875, 16.9030704498291, -35.1046142578125, 117.14714050292969, 3.9384841918945312, 26.315372467041016, -42.17337417602539, -51.86949157714844, 17.312225341796875, -19.712427139282227, -22.15941619873047, 50.95330810546875, 74.89675903320312, 39.350948333740234, -4.251947402954102, 146.40106201171875, 10.73309326171875, 292.2886657714844, 136.34033203125, 50.67854309082031, -23.899627685546875, 158.5098876953125, 152.41650390625, 162.70181274414062, -60.127288818359375, 41.15887451171875, -10.71817398071289, -45.83580017089844, 36.594757080078125, -33.88694763183594, 154.1064453125, 125.90521240234375, 53.930458068847656, 99.09809112548828, 90.89637756347656, 29.964807510375977, 212.49761962890625, 49.2740478515625, -22.234153747558594, -0.12176513671875, -5.2223968505859375, 101.19937133789062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000411.npy"} +{"epoch": 0.6213151927437641, "step": 412, "batch_size": 64, "mean": 51.794273376464844, "std": 68.16270446777344, "min": -73.79922485351562, "p10": -31.887067031860347, "median": 36.28158950805664, "p90": 145.77497863769534, "max": 193.49327087402344, "pos_frac": 0.796875, "sample": [-66.61463165283203, 139.98178100585938, 51.64214324951172, 168.708740234375, 33.62842559814453, 110.05303955078125, 51.35673522949219, 137.75559997558594, -60.794681549072266, 0.4187736511230469, 66.20347595214844, 2.7994461059570312, 64.97607421875, 157.10301208496094, 2.5181503295898438, -36.278907775878906, 124.63641357421875, -73.79922485351562, 34.28424835205078, 1.6168212890625, 157.3146514892578, 102.64543151855469, 18.733993530273438, 46.6693115234375, 70.66653442382812, -57.10790252685547, 18.9908447265625, 33.37104415893555, 33.298099517822266, 35.930633544921875, -3.0117549896240234, 190.04600524902344, 6.034677505493164, 193.49327087402344, -27.91448211669922, 21.0794677734375, 59.436279296875, -7.718730926513672, 123.897216796875, 0.07567596435546875, -16.410364151000977, 3.6174774169921875, 104.71467590332031, -42.78207015991211, 36.632545471191406, 147.51324462890625, 108.35737609863281, 114.69170379638672, 169.98309326171875, -33.589603424072266, 65.43999481201172, 91.90797424316406, 69.03627014160156, 16.89350128173828, 34.67861557006836, 131.2064208984375, -4.937021255493164, 67.30892181396484, -27.551090240478516, 60.8917236328125, 141.71902465820312, 0.9265270233154297, 135.13470458984375, 13.323974609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000412.npy"} +{"epoch": 0.6228269085411943, "step": 413, "batch_size": 64, "mean": 48.3399543762207, "std": 88.80541229248047, "min": -172.27162170410156, "p10": -64.5197036743164, "median": 50.68427085876465, "p90": 156.6155670166016, "max": 321.16180419921875, "pos_frac": 0.703125, "sample": [10.207271575927734, -66.94126892089844, 92.1692123413086, 68.47794342041016, -8.997001647949219, -16.125244140625, -0.6985931396484375, 170.7613067626953, -47.52372741699219, 189.23370361328125, -148.38604736328125, 140.24053955078125, 96.05545806884766, -34.52665710449219, -6.4816436767578125, 22.120635986328125, -67.44279479980469, 143.93399047851562, -0.874786376953125, 21.5379581451416, 188.0057830810547, 77.1002197265625, 49.9556884765625, 44.6597785949707, 103.62454223632812, 40.00971221923828, 321.16180419921875, 78.93505859375, 16.554725646972656, 28.35822296142578, 78.33956909179688, 111.35631561279297, 89.99449157714844, 53.18134307861328, 170.05116271972656, -79.09005737304688, 95.94523620605469, 24.450820922851562, 59.29120635986328, 25.720169067382812, -126.59517669677734, 139.09890747070312, 135.33291625976562, -72.7986831665039, 64.3682861328125, -51.79597473144531, -172.27162170410156, 65.72089385986328, 66.59101104736328, 11.022212982177734, -25.91278076171875, -58.869384765625, 184.66531372070312, -0.6651115417480469, 45.6522216796875, 115.11711120605469, 51.4128532409668, 146.99618530273438, 35.87913131713867, 70.30298614501953, -53.50325012207031, 119.92124938964844, 160.7381591796875, 109.00363159179688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000413.npy"} +{"epoch": 0.6243386243386243, "step": 414, "batch_size": 64, "mean": 56.28565216064453, "std": 74.25638580322266, "min": -125.30587768554688, "p10": -23.64987335205078, "median": 59.49437141418457, "p90": 161.7805145263672, "max": 187.02032470703125, "pos_frac": 0.765625, "sample": [126.83209991455078, -22.204360961914062, 100.431884765625, 104.95355224609375, 22.18634033203125, 58.93165588378906, -124.8192138671875, 102.29620361328125, 64.0340347290039, 22.772384643554688, 66.86077880859375, 132.85269165039062, 111.68608856201172, -45.6544189453125, 162.81814575195312, 70.36282348632812, -94.43359375, -49.970191955566406, 30.703887939453125, 85.46285247802734, 29.19620704650879, 60.74604797363281, 180.7691650390625, -20.322181701660156, 171.2925262451172, 49.081573486328125, 60.05708694458008, 16.031639099121094, 84.46987915039062, 106.91159057617188, 157.74497985839844, 29.1251220703125, 113.6324691772461, -14.805435180664062, 182.46043395996094, 71.46910858154297, 134.97711181640625, 39.544586181640625, 60.61541748046875, 129.89309692382812, 27.309951782226562, -18.590232849121094, 9.721267700195312, -2.447896957397461, 96.39666748046875, -24.269378662109375, 9.983695983886719, 81.88796997070312, -125.30587768554688, 47.97832489013672, 187.02032470703125, -7.170017242431641, -4.663845062255859, 23.93197250366211, 159.359375, 180.70465087890625, 32.39226531982422, 14.392791748046875, 101.3070068359375, 91.27632141113281, -45.92919921875, -0.6565074920654297, 13.039470672607422, 185.61856079101562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000414.npy"} +{"epoch": 0.6258503401360545, "step": 415, "batch_size": 64, "mean": 49.79706954956055, "std": 78.52700805664062, "min": -127.5387954711914, "p10": -36.390927124023435, "median": 39.97852325439453, "p90": 155.48007202148438, "max": 255.722412109375, "pos_frac": 0.71875, "sample": [-7.276449203491211, 106.45609283447266, 27.225549697875977, 82.73495483398438, 16.067516326904297, 17.74932098388672, 129.39749145507812, 172.19866943359375, -34.924957275390625, 102.5674819946289, 57.263465881347656, -37.006866455078125, 136.9947509765625, 152.59552001953125, -0.16584014892578125, 159.86444091796875, 184.628662109375, 78.67498779296875, 90.66162109375, -2.086977005004883, -6.299224853515625, 73.67488098144531, 84.15660858154297, -0.7071609497070312, 41.937774658203125, 156.71630859375, -111.7981185913086, 14.047569274902344, 63.67658996582031, 133.52230834960938, -39.49543762207031, 114.47016906738281, 54.040870666503906, -3.09674072265625, -125.45731353759766, 255.722412109375, 89.96111297607422, 101.05351257324219, 143.4141082763672, -34.9537353515625, 91.33145904541016, -120.21925354003906, -49.79286575317383, -127.5387954711914, 32.501792907714844, 67.2872543334961, -3.8193740844726562, 38.01927185058594, -0.9279708862304688, 6.537416458129883, 7.195051193237305, 49.44324493408203, 32.46888732910156, 22.57436752319336, 16.008216857910156, 73.54266357421875, -2.6569080352783203, 110.38042449951172, 106.78750610351562, 0.40517425537109375, 19.29694366455078, 36.50281524658203, 169.67913818359375, 173.79998779296875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000415.npy"} +{"epoch": 0.6273620559334845, "step": 416, "batch_size": 64, "mean": 41.74473190307617, "std": 83.42969512939453, "min": -137.58447265625, "p10": -46.53155059814453, "median": 35.19759750366211, "p90": 156.38221588134766, "max": 301.2815246582031, "pos_frac": 0.671875, "sample": [5.681663513183594, -132.70713806152344, -10.410419464111328, 77.62980651855469, 34.172630310058594, 158.2121124267578, -48.18989562988281, -33.902191162109375, 153.29571533203125, 173.10952758789062, 40.3780517578125, 170.32057189941406, 301.2815246582031, 22.74066925048828, -2.3974952697753906, 52.72576141357422, -1.253793716430664, 87.1589584350586, -137.58447265625, -24.934539794921875, 2.535520553588867, 105.17098999023438, 33.876220703125, 139.07211303710938, -1.1906814575195312, 97.57196044921875, 97.57293701171875, 168.8516845703125, 194.4461669921875, 70.33231353759766, 69.67417907714844, 98.19827270507812, -28.293746948242188, -51.382041931152344, 4.571718215942383, -5.333457946777344, -70.45870971679688, -110.44126892089844, 1.4823741912841797, 6.188831329345703, -28.297077178955078, 44.43860626220703, -17.9852294921875, 1.3099517822265625, 70.09492492675781, -27.632396697998047, 118.00171661376953, -110.57943725585938, -1.6848773956298828, 109.97767639160156, 36.222564697265625, 5.741724014282227, -42.662078857421875, 110.35282897949219, -17.54204559326172, 36.83440017700195, 12.205116271972656, 53.59034729003906, 73.28697967529297, 50.59552764892578, 149.60980224609375, 126.70809173583984, 157.7050018310547, 53.598289489746094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000416.npy"} +{"epoch": 0.6288737717309146, "step": 417, "batch_size": 64, "mean": 55.25751876831055, "std": 88.01911926269531, "min": -266.0259094238281, "p10": -38.99912948608398, "median": 60.10200881958008, "p90": 154.11024627685546, "max": 291.15435791015625, "pos_frac": 0.78125, "sample": [35.23371124267578, 4.934906005859375, -20.04485321044922, -162.00341796875, 160.38330078125, 124.94197845458984, -266.0259094238281, 157.46514892578125, 64.94682312011719, 92.00819396972656, 291.15435791015625, 60.15214538574219, 33.464805603027344, 62.36260223388672, 60.05187225341797, -74.20832824707031, 152.7834014892578, 95.91686248779297, 1.78436279296875, 66.0708236694336, 87.651611328125, 71.49612426757812, 73.42826843261719, 38.16279602050781, 83.78640747070312, -35.492950439453125, 154.67889404296875, 50.14961242675781, 18.510128021240234, 140.13021850585938, -40.50177764892578, 141.89456176757812, 162.4517364501953, -83.93705749511719, 133.29296875, -33.06916809082031, 36.98701477050781, -12.326873779296875, 143.77133178710938, 97.09575653076172, 157.80368041992188, 9.980247497558594, 147.13685607910156, 67.81957244873047, -69.81558227539062, 40.35237121582031, 6.751688003540039, 49.86870574951172, -0.6406097412109375, 66.58683776855469, 30.8631591796875, 133.92355346679688, 4.7473602294921875, -30.926116943359375, 90.62960052490234, -42.91075134277344, 77.15875244140625, 32.9500617980957, 59.17408752441406, -1.7286014556884766, 126.25369262695312, 43.45479965209961, 140.44017028808594, 227.07546997070312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000417.npy"} +{"epoch": 0.6303854875283447, "step": 418, "batch_size": 64, "mean": 43.91654586791992, "std": 84.68850708007812, "min": -177.08016967773438, "p10": -44.860681152343744, "median": 36.387454986572266, "p90": 145.21493530273438, "max": 330.34716796875, "pos_frac": 0.6875, "sample": [85.92704772949219, 112.17808532714844, 103.62751007080078, 53.1639404296875, 55.29103469848633, 146.02243041992188, 23.16595458984375, 99.42078399658203, 171.8396759033203, -41.04277801513672, 137.88565063476562, 165.68081665039062, -24.406021118164062, 123.58285522460938, 46.01990509033203, -86.63038635253906, 128.1541290283203, 8.220664978027344, 104.81465148925781, -15.770423889160156, 3.0647964477539062, 330.34716796875, 67.73767852783203, -7.604766845703125, 168.66445922851562, 32.971900939941406, -40.535675048828125, 7.474082946777344, 27.069698333740234, -33.866241455078125, -177.08016967773438, -114.36312866210938, 171.4146270751953, 48.41206359863281, 167.74327087402344, -20.493698120117188, 13.670417785644531, -14.817581176757812, 23.43077850341797, 4.8403472900390625, -56.55034637451172, -46.496925354003906, -90.17301940917969, -5.883813858032227, 89.34781646728516, -28.746803283691406, -11.978202819824219, 46.05809020996094, 24.29152488708496, -7.354026794433594, 30.952980041503906, 127.77532958984375, 139.94400024414062, 143.33078002929688, 18.04901885986328, 39.803009033203125, -86.14610290527344, 75.65345764160156, 85.40513610839844, 93.0100326538086, 84.27518463134766, -37.62788391113281, 74.186279296875, 54.30793762207031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000418.npy"} +{"epoch": 0.6318972033257747, "step": 419, "batch_size": 64, "mean": 63.9669189453125, "std": 83.33177947998047, "min": -112.86616516113281, "p10": -27.177497482299803, "median": 40.33797836303711, "p90": 172.63537139892577, "max": 255.48985290527344, "pos_frac": 0.84375, "sample": [-16.16732406616211, 247.68092346191406, 11.324165344238281, 15.167152404785156, -63.39201736450195, 13.220672607421875, 172.41864013671875, 29.572975158691406, 6.245277404785156, 29.638248443603516, -112.86616516113281, 146.59368896484375, 170.55287170410156, 101.36723327636719, -32.155242919921875, 36.03959655761719, 72.84457397460938, 41.068115234375, 185.61801147460938, 16.385772705078125, 56.662109375, 96.70087432861328, -28.63946533203125, 75.03460693359375, 10.860939025878906, 16.223724365234375, 204.68792724609375, -31.874404907226562, 225.2090606689453, 87.75511169433594, 23.754016876220703, -74.51409149169922, -23.766239166259766, 161.71115112304688, 255.48985290527344, 87.28128051757812, 125.04191589355469, 17.47443389892578, 4.0363311767578125, 59.363433837890625, 2.651296615600586, 172.72825622558594, 20.50372314453125, 17.324859619140625, 156.43203735351562, 12.971084594726562, 79.1895523071289, 40.79221725463867, 8.267398834228516, 169.5537109375, 155.66006469726562, 0.6779594421386719, 39.88373947143555, 31.22254180908203, 123.93498229980469, -6.718328475952148, 108.14192962646484, 109.98596954345703, 207.1544952392578, 7.7239990234375, 75.42630004882812, 63.3651123046875, -86.68627166748047, 164.0462188720703], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000419.npy"} +{"epoch": 0.6334089191232048, "step": 420, "batch_size": 64, "mean": 33.346622467041016, "std": 87.87489318847656, "min": -194.24868774414062, "p10": -61.69006233215332, "median": 12.880082130432129, "p90": 156.46748657226564, "max": 227.56585693359375, "pos_frac": 0.671875, "sample": [-12.824310302734375, -40.82089614868164, 121.6311264038086, 16.03582000732422, 119.05303192138672, -123.49349975585938, 23.366836547851562, 10.205883026123047, 4.483100891113281, -159.62350463867188, -20.423751831054688, 63.644569396972656, 6.63018798828125, 126.6621322631836, 3.3146820068359375, 149.36007690429688, 206.12158203125, 84.29466247558594, 176.5081787109375, 138.62173461914062, 15.475759506225586, -56.89817428588867, 1.8196277618408203, 52.21125030517578, 80.71221923828125, 153.02285766601562, -81.05086517333984, -87.73091888427734, 57.70912170410156, 9.71875, -75.8702392578125, 32.56242370605469, -39.325706481933594, 34.63675308227539, 2.462352752685547, -63.74372863769531, -31.16455841064453, -24.400001525878906, 157.94375610351562, 25.873123168945312, -14.787895202636719, -194.24868774414062, -45.008522033691406, -10.639816284179688, 139.0419921875, 71.0320053100586, 28.242427825927734, 175.1201171875, -0.4347381591796875, 71.66485595703125, 176.23568725585938, 44.843711853027344, 107.11878967285156, 1.8942241668701172, 10.284404754638672, 109.61559295654297, 227.56585693359375, 6.686439514160156, 5.120418548583984, 35.15733337402344, -3.2179489135742188, 205.27069091796875, -40.699859619140625, -28.384700775146484], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000420.npy"} +{"epoch": 0.6349206349206349, "step": 421, "batch_size": 64, "mean": 48.352195739746094, "std": 97.86457061767578, "min": -164.07785034179688, "p10": -93.70029144287106, "median": 43.79092025756836, "p90": 169.15997924804688, "max": 289.9578552246094, "pos_frac": 0.75, "sample": [-123.38888549804688, 170.24273681640625, 8.795921325683594, 146.48696899414062, 138.99664306640625, 21.931671142578125, 79.45303344726562, 16.64794921875, 2.1464767456054688, 289.9578552246094, 227.1110382080078, -61.47943115234375, 166.633544921875, 54.844093322753906, -21.842853546142578, 60.45595169067383, 28.995033264160156, -32.945098876953125, 164.61334228515625, 93.36373901367188, 111.77275085449219, 100.04405212402344, 1.325204849243164, 5.546882629394531, 63.93440246582031, 5.213970184326172, 106.51708221435547, -164.07785034179688, -144.89334106445312, -54.500980377197266, 14.061967849731445, 155.39891052246094, 134.209716796875, 12.824117660522461, 67.49727630615234, 174.56948852539062, 186.9327850341797, 125.17675018310547, 39.98877716064453, 3.287334442138672, 160.4872283935547, -2.275890350341797, 53.837005615234375, -140.2342529296875, -107.56459045410156, 100.05038452148438, -2.0289459228515625, 51.103965759277344, -107.50923156738281, 9.942733764648438, 206.40130615234375, 175.16549682617188, 2.7618484497070312, 47.59306335449219, 35.2176513671875, -152.39337158203125, 33.11444854736328, 79.678466796875, 95.37425231933594, -59.167022705078125, 153.4562530517578, 107.17940521240234, -20.715476989746094, -0.7834053039550781], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000421.npy"} +{"epoch": 0.636432350718065, "step": 422, "batch_size": 64, "mean": 62.0421142578125, "std": 77.05105590820312, "min": -94.61051940917969, "p10": -34.961351776123045, "median": 58.1832160949707, "p90": 150.8330856323242, "max": 242.26974487304688, "pos_frac": 0.796875, "sample": [150.27731323242188, 242.26974487304688, -72.2749252319336, -4.528064727783203, 151.07127380371094, -11.037574768066406, 149.1204376220703, -94.61051940917969, 87.3992919921875, 202.02719116210938, 16.257095336914062, 39.687347412109375, 14.343055725097656, 68.63735961914062, 174.5649871826172, 21.123790740966797, 142.0477752685547, 167.47132873535156, -35.69422912597656, 123.83271026611328, 83.52220153808594, -80.11172485351562, -4.838527679443359, 8.608745574951172, 99.45042419433594, 139.72787475585938, 124.58737182617188, 117.0777359008789, 214.13204956054688, 77.42697143554688, 72.42935180664062, 83.63479614257812, 40.7465705871582, -10.115571975708008, 42.75359344482422, 55.21416091918945, 99.76284790039062, 20.36467933654785, 150.27630615234375, 18.912841796875, -19.62950897216797, -63.055301666259766, 139.9058837890625, 94.0537109375, 24.69439697265625, -33.251304626464844, 4.60418701171875, 105.58454132080078, 7.0525665283203125, 61.15227127075195, 50.91019058227539, 214.19009399414062, 35.158729553222656, -49.58307647705078, 14.315685272216797, 77.10270690917969, 22.439306259155273, -61.996849060058594, 25.04954719543457, 82.13140106201172, 142.76589965820312, 86.61861419677734, 21.569198608398438, 103.36434936523438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000422.npy"} +{"epoch": 0.6379440665154951, "step": 423, "batch_size": 64, "mean": 64.58971405029297, "std": 80.24137878417969, "min": -100.26119232177734, "p10": -23.027609252929683, "median": 43.74664306640625, "p90": 182.4070297241211, "max": 234.2815399169922, "pos_frac": 0.78125, "sample": [40.698974609375, -7.368370056152344, 143.02346801757812, -57.960418701171875, 181.31858825683594, 2.6153011322021484, 47.93720626831055, -43.78638458251953, 162.99209594726562, 39.241554260253906, -24.996231079101562, 150.02658081054688, 0.423583984375, -29.50263214111328, 3.560699462890625, 14.090347290039062, 18.406387329101562, -3.1978607177734375, 165.0620574951172, -78.0351333618164, 85.45231628417969, 90.37989044189453, -35.64897155761719, -2.5235843658447266, 56.96024703979492, 210.89930725097656, 141.523681640625, 7.501239776611328, -100.26119232177734, 99.31269836425781, 219.88311767578125, 137.41720581054688, 102.12312316894531, 79.81782531738281, 93.08353424072266, 46.7943115234375, 39.4310302734375, 185.41358947753906, 190.3210906982422, 182.87350463867188, 20.54822540283203, 12.848316192626953, 19.695068359375, 103.30625915527344, 125.39136505126953, 137.26699829101562, 150.81280517578125, 49.63908004760742, -5.015522003173828, 70.44595336914062, 234.2815399169922, 97.77745056152344, -2.769369125366211, 35.662010192871094, 119.41808319091797, 186.72760009765625, 8.345855712890625, 3.1697540283203125, -18.434158325195312, 31.521621704101562, 176.390869140625, 2.737457275390625, 36.85515213012695, -18.184598922729492], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000423.npy"} +{"epoch": 0.6394557823129252, "step": 424, "batch_size": 64, "mean": 66.10272216796875, "std": 81.76143646240234, "min": -104.62763214111328, "p10": -38.87555847167968, "median": 52.20671844482422, "p90": 174.01031188964845, "max": 296.93585205078125, "pos_frac": 0.8125, "sample": [-13.722869873046875, 196.56649780273438, 52.34519958496094, 135.77536010742188, -41.26109313964844, 138.6317901611328, 296.93585205078125, 143.70858764648438, -94.14749908447266, -48.35975646972656, 21.182056427001953, 17.662294387817383, 47.535011291503906, -104.62763214111328, 132.33670043945312, 15.116493225097656, 143.93902587890625, -33.30931091308594, 58.99385070800781, 16.125694274902344, -21.19826316833496, 85.22074127197266, 113.81676483154297, 46.842369079589844, -47.38139724731445, 148.9276885986328, 205.5440673828125, 15.994186401367188, 187.7177734375, 34.660675048828125, 105.11344146728516, 97.17913055419922, 41.20421600341797, 48.87498474121094, 29.747711181640625, 63.65165710449219, 126.98895263671875, 195.80393981933594, 127.73053741455078, 114.52017974853516, 94.32376098632812, 29.056800842285156, 8.623157501220703, 174.14761352539062, 23.831398010253906, 178.0286407470703, 129.1760711669922, -0.7164020538330078, -66.59693145751953, 11.090993881225586, 158.9637451171875, 54.2869873046875, 153.88876342773438, 173.68994140625, 10.381965637207031, 29.88811492919922, 55.79734802246094, -72.984130859375, 56.101409912109375, 130.10260009765625, 8.432853698730469, 39.974266052246094, -3.3686981201171875, 52.0682373046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000424.npy"} +{"epoch": 0.6409674981103552, "step": 425, "batch_size": 64, "mean": 49.743309020996094, "std": 80.98249053955078, "min": -115.6705093383789, "p10": -52.700328445434565, "median": 36.59511947631836, "p90": 164.81334686279297, "max": 230.97869873046875, "pos_frac": 0.75, "sample": [129.59982299804688, 121.29708099365234, 30.47925567626953, -1.3479156494140625, 156.52828979492188, -30.219646453857422, 200.29098510742188, -6.649631500244141, 70.81551361083984, 79.11819458007812, 132.839599609375, -71.21138763427734, 52.39106369018555, -39.086822509765625, -61.48237228393555, 106.08320617675781, 54.791770935058594, 173.40733337402344, 19.02642822265625, 53.08694839477539, -107.83847045898438, 52.56294250488281, 0.4448814392089844, 59.944618225097656, 117.48399353027344, 7.877143859863281, 3.254659652709961, 189.6151580810547, 6.008796691894531, 174.07516479492188, 154.0276336669922, -39.23079299926758, 94.37979125976562, 2.5742721557617188, 78.9267578125, 38.54100799560547, 33.781005859375, 165.58255004882812, 28.66110610961914, 31.314434051513672, 169.21246337890625, -102.6226577758789, 60.700660705566406, 74.22525024414062, 34.64923095703125, -115.6705093383789, 43.04219055175781, 60.56570816040039, 19.77313232421875, -14.476272583007812, 163.01853942871094, -14.311504364013672, -62.176246643066406, 150.91537475585938, 7.343132019042969, 6.942745208740234, 127.31968688964844, 31.319015502929688, -9.490890502929688, 230.97869873046875, -45.88923263549805, 15.608230590820312, 146.4698944091797, -55.61936950683594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000425.npy"} +{"epoch": 0.6424792139077853, "step": 426, "batch_size": 64, "mean": 30.36445426940918, "std": 92.44384765625, "min": -221.5467987060547, "p10": -80.12700195312499, "median": 16.41712188720703, "p90": 139.1182846069336, "max": 268.0863037109375, "pos_frac": 0.65625, "sample": [8.207782745361328, -3.9555702209472656, 109.19983673095703, 140.68505859375, 15.464500427246094, 127.97158813476562, 20.488876342773438, 169.39662170410156, 26.78050994873047, 46.921966552734375, -28.963966369628906, -25.77752685546875, 15.167793273925781, -131.357421875, 102.48680114746094, 13.17474365234375, 84.23731231689453, 2.1116943359375, 61.200096130371094, -32.48175811767578, -160.8480987548828, -22.28759765625, 15.2525634765625, 61.43128967285156, -15.349983215332031, 14.173263549804688, 47.646942138671875, -221.5467987060547, 96.86875915527344, 17.36974334716797, 173.47320556640625, 86.13595581054688, 122.08647918701172, -25.362775802612305, -207.87501525878906, 51.873653411865234, -6.8392181396484375, 5.655553817749023, -2.6214752197265625, 268.0863037109375, 156.66368103027344, 214.0738067626953, -108.91587829589844, -88.51643371582031, 1.652374267578125, 194.7104949951172, -18.106124877929688, 3.099994659423828, -3.311420440673828, -84.85989379882812, 57.64604949951172, 123.56879425048828, -3.6270294189453125, 107.24354553222656, 57.89140319824219, -54.56163787841797, 18.120136260986328, 106.9912338256836, 33.83088684082031, -69.08358764648438, 84.7406005859375, 75.69380187988281, 135.4624786376953, -15.363811492919922], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000426.npy"} +{"epoch": 0.6439909297052154, "step": 427, "batch_size": 64, "mean": 52.24851989746094, "std": 89.96790313720703, "min": -143.33523559570312, "p10": -68.6083366394043, "median": 41.431884765625, "p90": 169.82100067138674, "max": 318.77569580078125, "pos_frac": 0.734375, "sample": [92.75332641601562, 30.33467674255371, -20.999645233154297, -78.86394500732422, -74.3486328125, 111.50001525878906, 167.20814514160156, 36.22098159790039, -3.6306304931640625, -67.9318618774414, 163.1195068359375, -21.502552032470703, -68.89825439453125, -71.61325073242188, 51.822654724121094, 172.16036987304688, 91.32776641845703, 52.70130920410156, -13.049125671386719, -31.113510131835938, -0.3004169464111328, 62.27095413208008, 137.49526977539062, 73.27732849121094, 29.503875732421875, 137.10194396972656, 107.98444366455078, 132.01083374023438, 14.301025390625, 34.54009246826172, 175.165283203125, 16.910736083984375, 121.69320678710938, 43.639793395996094, 29.15746307373047, 162.15670776367188, 12.777259826660156, -143.33523559570312, 188.03097534179688, 170.9407958984375, 3.1816482543945312, 26.091537475585938, 67.29779052734375, 23.647789001464844, -115.82315063476562, -56.280662536621094, 114.41111755371094, 90.08570861816406, 39.223976135253906, -96.30886840820312, 164.98321533203125, 229.97726440429688, 0.3370819091796875, 68.13115692138672, 70.62554168701172, 32.33686828613281, 77.05259704589844, 62.946346282958984, 5.1359100341796875, -22.59375, 70.65477752685547, -52.08702087402344, 318.77569580078125, 199.58319091796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000427.npy"} +{"epoch": 0.6455026455026455, "step": 428, "batch_size": 64, "mean": 58.34028625488281, "std": 90.7276382446289, "min": -145.42514038085938, "p10": -34.582976913452136, "median": 56.33720779418945, "p90": 178.628776550293, "max": 339.3908386230469, "pos_frac": 0.734375, "sample": [-106.26765441894531, 78.44029998779297, 187.42672729492188, -1.6731910705566406, 2.6107330322265625, 24.538848876953125, 28.723087310791016, -105.47523498535156, -62.39612579345703, 66.52983856201172, 180.1832275390625, -15.622306823730469, 110.96845245361328, -23.13353729248047, 147.86895751953125, 66.11328125, 159.12625122070312, 27.301612854003906, -14.707298278808594, 47.559600830078125, 175.00172424316406, 0.4025535583496094, 0.8354568481445312, 3.3421859741210938, 182.50730895996094, 79.945068359375, 41.00165557861328, -136.1704864501953, 101.59468078613281, -145.42514038085938, 113.60702514648438, -10.697532653808594, 21.089542388916016, 33.711971282958984, 67.61481475830078, 188.23898315429688, 142.99658203125, 137.46742248535156, 65.11481475830078, -6.591833114624023, 182.44190979003906, 339.3908386230469, 74.6186294555664, 142.61239624023438, -56.56486511230469, -10.693603515625, 80.26953125, 67.03067779541016, 2.291036605834961, -21.39263916015625, 16.176925659179688, 12.819099426269531, -1.7122764587402344, 0.2791175842285156, 158.06092834472656, 171.62722778320312, 182.7200927734375, 71.67082214355469, 116.51638793945312, 137.57557678222656, 145.07122802734375, 113.86725616455078, -5.110420227050781, -39.4898796081543], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000428.npy"} +{"epoch": 0.6470143613000756, "step": 429, "batch_size": 64, "mean": 45.98888397216797, "std": 80.27310180664062, "min": -146.16018676757812, "p10": -64.83248558044433, "median": 48.35438919067383, "p90": 154.62808837890626, "max": 189.48728942871094, "pos_frac": 0.734375, "sample": [105.39204406738281, -84.790771484375, 2.1175384521484375, -13.796073913574219, 128.63970947265625, 99.3849105834961, 56.81162643432617, 40.276390075683594, -17.416194915771484, 48.07640075683594, 51.19618225097656, -108.74896240234375, 68.16541290283203, 24.761093139648438, 0.498565673828125, 113.03279113769531, -144.33041381835938, 35.58827209472656, 4.085906982421875, 103.75879669189453, 125.33941650390625, -18.448955535888672, 105.14015197753906, 148.0458221435547, 155.2711181640625, 160.2427978515625, 175.29144287109375, -6.458099365234375, 48.63237762451172, -44.35971450805664, -72.37728881835938, -50.8100471496582, 12.609870910644531, -13.536186218261719, 101.8118667602539, -0.6693267822265625, -70.84210205078125, 81.28479766845703, -7.163139343261719, 4.396537780761719, 154.8290557861328, 130.12326049804688, 35.63538360595703, 154.15916442871094, 122.29273986816406, -146.16018676757812, -91.24403381347656, 23.031444549560547, 7.206977844238281, 123.72814178466797, 17.85541534423828, 56.23198699951172, 25.834922790527344, -17.55263900756836, 55.8360481262207, 57.42375183105469, 189.48728942871094, 71.37346649169922, 188.4752655029297, 169.90884399414062, 10.50455093383789, 104.29869079589844, 64.51344299316406, 89.39119720458984], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000429.npy"} +{"epoch": 0.6485260770975056, "step": 430, "batch_size": 64, "mean": 69.51193237304688, "std": 83.24775695800781, "min": -216.71664428710938, "p10": -19.391732788085925, "median": 60.79034423828125, "p90": 173.14175109863282, "max": 206.30068969726562, "pos_frac": 0.828125, "sample": [33.96575927734375, 26.032026290893555, -23.96771240234375, 38.870887756347656, 2.5930557250976562, 163.1425323486328, 0.015239715576171875, 156.33694458007812, 31.234182357788086, 95.09416961669922, -91.4125747680664, 100.86714935302734, 182.47976684570312, 26.19138526916504, 166.55870056152344, 79.35547637939453, 105.5827407836914, 50.86912536621094, 191.94021606445312, -25.6716365814209, 65.31661987304688, 206.30068969726562, 126.3289566040039, 99.06919860839844, -0.6133880615234375, 169.14500427246094, 48.56486511230469, 186.84478759765625, 110.17677307128906, 153.36001586914062, 84.71434020996094, 19.5499267578125, 90.39263916015625, 160.03182983398438, -35.1879768371582, 169.2548370361328, 195.01364135742188, 119.07648468017578, -92.02166748046875, 140.79025268554688, 10.776901245117188, 95.5248794555664, 33.23690414428711, 46.25605010986328, 28.0592041015625, 120.20317077636719, 25.583839416503906, 0.9742488861083984, -216.71664428710938, 7.791023254394531, -2.678955078125, 156.65057373046875, -0.9748916625976562, 143.55233764648438, 45.21319580078125, 187.72421264648438, 174.8075714111328, 105.82138061523438, 130.8550567626953, -8.714447021484375, 56.264068603515625, -57.36017990112305, 13.542495727539062, 26.186203002929688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000430.npy"} +{"epoch": 0.6500377928949358, "step": 431, "batch_size": 64, "mean": 51.76930236816406, "std": 79.55901336669922, "min": -154.94180297851562, "p10": -33.20119171142578, "median": 36.565494537353516, "p90": 161.84501953125002, "max": 221.69833374023438, "pos_frac": 0.75, "sample": [-154.94180297851562, 120.88179779052734, 60.877323150634766, 40.19873809814453, 20.680110931396484, 143.74609375, 145.7373046875, 134.23727416992188, 166.4723358154297, -6.787378311157227, 7.784873962402344, 171.44444274902344, 146.91693115234375, -15.503128051757812, 36.749916076660156, 21.34932518005371, 221.69833374023438, -2.868011474609375, 158.19674682617188, 36.381072998046875, 52.661277770996094, -140.21432495117188, 14.695381164550781, 81.40739440917969, -44.49351501464844, 166.38746643066406, 58.604034423828125, -59.10786437988281, 47.641998291015625, -10.081220626831055, 54.72447204589844, -2.1783485412597656, 145.95989990234375, 143.58453369140625, -77.61264038085938, 0.17200469970703125, 167.9080810546875, 89.56251525878906, -34.318634033203125, -30.593826293945312, -35.298675537109375, 7.237579345703125, -5.576179504394531, 130.514404296875, 2.3662185668945312, 15.311798095703125, 143.2729034423828, 75.65689086914062, 13.864852905273438, 205.17742919921875, 26.16436767578125, 60.765262603759766, 8.1033935546875, 27.439899444580078, 75.66919708251953, 12.346622467041016, 40.21269226074219, -1.3136825561523438, 16.66006851196289, 163.30307006835938, 158.44290161132812, 71.49739837646484, 36.12672424316406, -12.670806884765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000431.npy"} +{"epoch": 0.6515495086923658, "step": 432, "batch_size": 64, "mean": 54.7991943359375, "std": 81.6580581665039, "min": -170.0216827392578, "p10": -29.806499290466306, "median": 42.221548080444336, "p90": 168.70244903564455, "max": 201.1741943359375, "pos_frac": 0.734375, "sample": [-15.08648681640625, -30.301912307739258, -36.35655212402344, -170.0216827392578, 3.399953842163086, 5.533109664916992, 13.028915405273438, 79.66990661621094, -28.650535583496094, 162.07919311523438, 88.40251159667969, -87.59491729736328, 32.756591796875, 49.696258544921875, 169.22174072265625, -114.02682495117188, 68.24369049072266, 9.171646118164062, 195.8970184326172, 139.35513305664062, 8.182273864746094, 108.63294219970703, 135.07461547851562, -23.776275634765625, -3.931201934814453, 172.84243774414062, -5.485282897949219, 170.86207580566406, 130.58065795898438, -26.37587547302246, -48.70660400390625, 38.824893951416016, 9.825510025024414, -28.065780639648438, 31.513092041015625, 64.51174926757812, 167.4907684326172, 128.1795654296875, 59.80622863769531, 128.8280029296875, -12.77280044555664, 37.748775482177734, 115.64059448242188, 20.368209838867188, 144.98434448242188, 20.280776977539062, 45.618202209472656, 170.07427978515625, 26.637020111083984, 185.18959045410156, 98.8306655883789, 85.94876098632812, 111.00345611572266, -23.204696655273438, 93.69412231445312, 201.1741943359375, -26.797042846679688, 131.95802307128906, 79.02772521972656, 11.607704162597656, -52.921607971191406, 139.0237274169922, 10.190704345703125, 140.61326599121094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000432.npy"} +{"epoch": 0.6530612244897959, "step": 433, "batch_size": 64, "mean": 65.49736785888672, "std": 81.69761657714844, "min": -171.19723510742188, "p10": -30.962632751464845, "median": 52.72382926940918, "p90": 168.97469177246094, "max": 202.5489044189453, "pos_frac": 0.78125, "sample": [44.733341217041016, 112.50474548339844, 17.75155258178711, 51.9043083190918, -5.3393402099609375, 50.92803955078125, -0.9613971710205078, 132.4544677734375, -14.431629180908203, 6.00567626953125, 14.697463989257812, 36.818260192871094, 102.83551025390625, 31.944496154785156, 173.70623779296875, -80.5688705444336, 86.20503234863281, 151.0037078857422, 114.82347869873047, -28.338886260986328, 55.934539794921875, 40.72770690917969, 1.6334152221679688, 160.91746520996094, -171.19723510742188, 61.980045318603516, 140.169189453125, 23.3316650390625, 139.33737182617188, 125.08352661132812, 31.48377227783203, 108.71013641357422, -40.787200927734375, 6.423805236816406, 37.539974212646484, -17.188018798828125, -42.40506362915039, 53.54335021972656, 122.6663818359375, 172.14247131347656, 202.5489044189453, 170.30917358398438, 189.25198364257812, 42.526275634765625, 161.97544860839844, -115.71610260009766, 35.50205993652344, 103.33139038085938, -30.768043518066406, 165.86090087890625, -12.864913940429688, 88.01197052001953, 148.73931884765625, -31.04602813720703, 38.347511291503906, 160.64114379882812, 139.36978149414062, 61.8336181640625, 172.80816650390625, 176.0986328125, 157.61279296875, 34.6732177734375, 164.80859375, -40.74725341796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000433.npy"} +{"epoch": 0.654572940287226, "step": 434, "batch_size": 64, "mean": 68.3910903930664, "std": 92.93335723876953, "min": -191.0888671875, "p10": -42.380364608764644, "median": 82.69662094116211, "p90": 174.9239273071289, "max": 235.14227294921875, "pos_frac": 0.8125, "sample": [-166.43463134765625, 83.91316223144531, 122.63063049316406, 30.35162353515625, 139.78659057617188, 173.4703369140625, -44.68503189086914, 175.48944091796875, -77.51341247558594, 62.785919189453125, 4.667360305786133, -48.664093017578125, -191.0888671875, 74.46583557128906, 138.7561798095703, -37.0028076171875, 113.14042663574219, 81.33883666992188, 235.14227294921875, 174.98121643066406, 88.9758529663086, 2.3774890899658203, 224.53208923339844, 8.025749206542969, -113.27870178222656, 46.05088806152344, 174.79025268554688, 102.54591369628906, 2.5130577087402344, 106.797119140625, 12.72524642944336, 111.63850402832031, 86.12031555175781, 171.13006591796875, 189.67630004882812, 166.78477478027344, -17.10924530029297, 126.06661224365234, 188.66632080078125, 7.5628509521484375, 168.62344360351562, 7.0320892333984375, 42.66139602661133, 117.43588256835938, 15.8515625, 7.341102600097656, 31.55767250061035, 114.1377182006836, 83.07550048828125, 143.43746948242188, 9.230976104736328, 183.72824096679688, -134.0056915283203, -18.692413330078125, -5.394844055175781, 90.4548110961914, 139.43067932128906, 162.12014770507812, 119.66171264648438, -5.5417633056640625, 65.36798095703125, 82.31774139404297, 163.09817504882812, 61.97767639160156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000434.npy"} +{"epoch": 0.656084656084656, "step": 435, "batch_size": 64, "mean": 54.947364807128906, "std": 83.96150207519531, "min": -136.23541259765625, "p10": -44.78864517211914, "median": 51.87052917480469, "p90": 173.63020782470704, "max": 193.18411254882812, "pos_frac": 0.703125, "sample": [100.15093231201172, 72.44287109375, -16.23802947998047, 79.42984771728516, -85.24629974365234, 18.08625030517578, 3.5177459716796875, 0.4381904602050781, 112.05883026123047, -4.5666961669921875, 154.05633544921875, 158.79885864257812, -26.75732421875, 109.54174041748047, 160.55523681640625, 166.1464385986328, 24.70708465576172, -45.89256286621094, -17.82135009765625, 178.060546875, 55.252174377441406, -4.03546142578125, 150.61453247070312, 187.29833984375, 25.120941162109375, 40.846824645996094, -7.3748626708984375, 74.74226379394531, 173.10289001464844, 175.6773681640625, -13.231857299804688, 99.50155639648438, -136.23541259765625, 117.38372802734375, 63.50748062133789, 71.88856506347656, -12.688285827636719, -38.576324462890625, 117.1232681274414, 171.29782104492188, 178.44888305664062, 193.18411254882812, 173.856201171875, 48.48888397216797, 0.7195358276367188, 55.999977111816406, 37.17204666137695, -42.21283721923828, -29.920467376708984, 180.94512939453125, -65.97936248779297, 28.652908325195312, -51.95783996582031, 82.55326080322266, 79.12965393066406, 84.99325561523438, 140.41932678222656, -77.15603637695312, -99.3393325805664, 25.802841186523438, 1.7213592529296875, -39.774810791015625, 136.07736206054688, 22.123214721679688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000435.npy"} +{"epoch": 0.6575963718820862, "step": 436, "batch_size": 64, "mean": 47.22056579589844, "std": 88.01837921142578, "min": -155.77572631835938, "p10": -64.59049911499024, "median": 30.219998359680176, "p90": 161.67628021240236, "max": 227.9365234375, "pos_frac": 0.703125, "sample": [101.66340637207031, -8.64156723022461, 151.55520629882812, 4.42576789855957, 109.93744659423828, 7.865907669067383, 85.89722442626953, 146.9956512451172, -80.96857452392578, 29.90251922607422, 27.074951171875, 156.8882293701172, 17.692283630371094, 101.70700073242188, -25.222591400146484, 176.02633666992188, 140.07077026367188, 108.76515197753906, -139.57554626464844, 52.207801818847656, 16.33974838256836, 65.96349334716797, -31.46057891845703, -3.6579208374023438, 30.537477493286133, -6.711967468261719, 110.63238525390625, -4.370809555053711, 163.72830200195312, 24.68830108642578, 74.8648681640625, -37.82965087890625, -155.77572631835938, 104.49839782714844, -27.63884925842285, 50.267616271972656, 152.9486083984375, -63.76929473876953, 5.597999572753906, -67.22848510742188, 146.05892944335938, 127.3834457397461, 31.45241928100586, 13.354202270507812, -97.22056579589844, 117.494140625, -56.484046936035156, 192.47283935546875, 94.0452880859375, 227.9365234375, 123.87604522705078, 1.9559783935546875, 189.32220458984375, 111.411376953125, -23.161094665527344, 17.071788787841797, 164.87782287597656, -51.27490234375, 22.017616271972656, 0.8157901763916016, -64.94244384765625, 185.5730438232422, -95.22310638427734, 77.41173553466797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000436.npy"} +{"epoch": 0.6591080876795162, "step": 437, "batch_size": 64, "mean": 50.945472717285156, "std": 101.54486083984375, "min": -247.842529296875, "p10": -68.3572006225586, "median": 47.0362434387207, "p90": 185.80484008789068, "max": 275.52447509765625, "pos_frac": 0.65625, "sample": [275.52447509765625, 200.9486541748047, 158.9801025390625, 104.58110046386719, 40.687477111816406, -43.414493560791016, 147.84385681152344, 99.08755493164062, 210.5169677734375, 39.12477493286133, 166.9723358154297, -24.702545166015625, -247.842529296875, 80.48863220214844, -90.49273681640625, -64.49884796142578, 43.04856872558594, 74.19610595703125, 126.39833068847656, -124.88752746582031, 192.24685668945312, 199.98492431640625, 165.1461944580078, -17.308147430419922, -43.32561111450195, 75.43841552734375, 213.52386474609375, -26.036563873291016, -136.5320281982422, -70.01078033447266, -19.139244079589844, -51.999237060546875, 47.09331512451172, -16.298744201660156, -9.981101989746094, 170.77346801757812, 69.83476257324219, -29.71539306640625, 71.5384292602539, 79.84933471679688, 32.37890625, -7.560768127441406, -41.54315185546875, 157.18540954589844, 23.51654052734375, 161.41177368164062, 50.932212829589844, 113.21537780761719, 96.79466247558594, -112.75531768798828, 46.97917175292969, 53.35886764526367, 144.24581909179688, 139.8338623046875, 7.874153137207031, 16.35161590576172, 21.429161071777344, 111.78016662597656, -91.54824829101562, -7.774448394775391, -1.602914810180664, 75.49168395996094, 18.414779663085938, 214.45809936523438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000437.npy"} +{"epoch": 0.6606198034769464, "step": 438, "batch_size": 64, "mean": 71.16368103027344, "std": 91.63633728027344, "min": -111.91344451904297, "p10": -24.320520401000973, "median": 52.26965141296387, "p90": 164.02464904785157, "max": 407.7125244140625, "pos_frac": 0.765625, "sample": [202.57933044433594, -6.383171081542969, 407.7125244140625, -67.12816619873047, -1.65887451171875, -50.982215881347656, -21.71457290649414, 141.36061096191406, 4.187578201293945, 227.0467071533203, -28.516902923583984, 197.64419555664062, -25.437355041503906, 12.624320983886719, 164.10531616210938, 0.40439605712890625, 111.34896087646484, -111.91344451904297, 140.9716796875, 84.72142791748047, 136.52911376953125, 142.4719696044922, -11.513313293457031, 53.82171630859375, 50.717586517333984, 156.1654510498047, 65.21641540527344, 35.3859977722168, 163.83642578125, 117.09330749511719, 92.08425903320312, -29.875152587890625, 130.63076782226562, 13.33961296081543, 9.661865234375, 153.39834594726562, 163.0708465576172, -11.63874626159668, 94.05984497070312, 38.32353210449219, 129.010009765625, 10.957992553710938, 61.16664123535156, 275.3446044921875, 133.89218139648438, 22.854522705078125, 119.9885025024414, 44.70536804199219, 13.0693359375, 1.8486213684082031, -21.41836166381836, -6.396203994750977, 22.741533279418945, 139.87599182128906, 147.86669921875, -70.17310333251953, 155.7974853515625, 46.298065185546875, -4.111396789550781, 178.8829345703125, 9.659427642822266, 32.52915954589844, 106.75656127929688, 59.576690673828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000438.npy"} +{"epoch": 0.6621315192743764, "step": 439, "batch_size": 64, "mean": 62.066558837890625, "std": 84.29643249511719, "min": -218.27273559570312, "p10": -18.321087837219235, "median": 48.00821304321289, "p90": 190.13121490478517, "max": 214.8879852294922, "pos_frac": 0.765625, "sample": [132.30865478515625, 6.491825103759766, 20.59272575378418, -30.46508026123047, 61.05869674682617, 152.16217041015625, 85.43948364257812, 22.494171142578125, -28.003395080566406, 203.61866760253906, 205.91014099121094, 3.3038692474365234, 172.54312133789062, 19.945114135742188, 49.52354431152344, 214.63882446289062, 165.88302612304688, 17.15027618408203, 168.382080078125, -26.877182006835938, 8.398143768310547, 100.78407287597656, 55.741294860839844, -4.686614990234375, 167.43284606933594, 47.44115447998047, 194.22079467773438, -65.72476196289062, 11.42021369934082, 184.15640258789062, -19.38313102722168, 192.6918487548828, -26.192115783691406, -2.753692626953125, 81.6769790649414, -7.7970733642578125, 0.07012176513671875, 16.355850219726562, -218.27273559570312, 24.351573944091797, 20.3751220703125, 48.57527160644531, 153.83877563476562, 52.74481201171875, 59.89142990112305, 162.98179626464844, 81.97756958007812, 211.5941162109375, 44.699005126953125, 31.566604614257812, 29.77084732055664, 70.44052124023438, -12.414070129394531, 116.58795928955078, 57.310943603515625, 214.8879852294922, 138.49969482421875, -15.842987060546875, -15.557579040527344, -0.0327606201171875, 24.182201385498047, 74.50920104980469, 74.39971160888672, -8.758552551269531], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000439.npy"} +{"epoch": 0.6636432350718064, "step": 440, "batch_size": 64, "mean": 62.042938232421875, "std": 88.475341796875, "min": -126.20730590820312, "p10": -55.333340072631835, "median": 51.97343826293945, "p90": 175.5578872680664, "max": 279.156982421875, "pos_frac": 0.78125, "sample": [-34.962730407714844, 53.754119873046875, 52.932098388671875, 218.58544921875, 175.70327758789062, 279.156982421875, 178.3871612548828, -12.120742797851562, 172.90451049804688, 54.9703369140625, 18.70134735107422, 164.72189331054688, 44.895103454589844, 137.11790466308594, 108.78486633300781, 37.737030029296875, 160.6138916015625, -50.869895935058594, -102.32947540283203, 62.86100769042969, 83.10321807861328, 1.466421127319336, 12.748764038085938, 143.07113647460938, 51.01477813720703, 130.6366729736328, 83.81265258789062, 118.55950927734375, 8.559186935424805, 27.72553253173828, 6.225202560424805, 77.01483917236328, 122.57464599609375, 0.4369010925292969, 3.1733016967773438, 38.46348571777344, 32.84837341308594, -108.21141815185547, 25.69809913635254, 180.5579376220703, 137.72727966308594, 175.21864318847656, -1.2269744873046875, 167.18765258789062, -56.62538528442383, 21.38245391845703, 180.21231079101562, 22.599571228027344, 150.38882446289062, -25.31877899169922, -55.5082893371582, -60.41532897949219, 75.62496948242188, -54.92512512207031, 81.21317291259766, 28.508609771728516, -20.292530059814453, -68.3288345336914, 156.20364379882812, -126.20730590820312, 41.24433898925781, 177.77700805664062, 171.31878662109375, 91.96611785888672], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000440.npy"} +{"epoch": 0.6651549508692366, "step": 441, "batch_size": 64, "mean": 68.77332305908203, "std": 73.74211120605469, "min": -72.94164276123047, "p10": -24.19587478637695, "median": 61.26816940307617, "p90": 169.63522338867188, "max": 192.03013610839844, "pos_frac": 0.78125, "sample": [135.55941772460938, 66.6263198852539, 174.24636840820312, 180.19830322265625, -1.6246395111083984, 138.49664306640625, 154.05508422851562, -6.717353820800781, 105.91964721679688, -17.602005004882812, -35.25663375854492, 143.40328979492188, -24.922142028808594, 169.83609008789062, 27.330081939697266, 25.511749267578125, 83.15935516357422, -1.7139892578125, -32.79415512084961, 170.46583557128906, 60.41758728027344, 73.32488250732422, 147.21197509765625, 161.2256622314453, 22.78150177001953, 168.904052734375, 1.3640861511230469, -0.6228713989257812, 192.03013610839844, 113.0765380859375, 52.472755432128906, 76.846923828125, -59.61963653564453, 94.27946472167969, 121.67829895019531, 6.7124176025390625, -59.26148986816406, 168.19374084472656, 52.530799865722656, 57.91851806640625, 45.323760986328125, 163.05337524414062, 30.570152282714844, 13.832653045654297, 109.83702087402344, 64.92074584960938, 93.187744140625, 4.5368804931640625, 109.54026794433594, -22.501251220703125, 169.16653442382812, 18.971986770629883, 180.3404541015625, 187.97006225585938, -47.24821472167969, 62.03465270996094, 60.108802795410156, 4.272773742675781, -3.2915420532226562, 99.28510284423828, -72.94164276123047, 60.501686096191406, 134.33042907714844, 30.047868728637695], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000441.npy"} +{"epoch": 0.6666666666666666, "step": 442, "batch_size": 64, "mean": 66.54078674316406, "std": 81.5394287109375, "min": -142.61785888671875, "p10": -30.686931610107415, "median": 67.78769302368164, "p90": 168.17587432861328, "max": 244.35369873046875, "pos_frac": 0.796875, "sample": [23.40459442138672, 234.2353515625, 71.13841247558594, -23.604873657226562, 63.57917785644531, 244.35369873046875, 176.2396240234375, 169.92579650878906, 68.67668151855469, 150.78665161132812, 57.40085220336914, 138.9222869873047, 139.58839416503906, 15.068084716796875, 128.75595092773438, 112.15887451171875, 1.5338211059570312, 8.407913208007812, 45.41351318359375, -33.72209930419922, -78.65199279785156, 128.2093505859375, 105.17636108398438, -10.112152099609375, 121.91590881347656, -2.4114303588867188, -71.86711883544922, 104.42324829101562, 12.670461654663086, 180.0040740966797, 0.2513580322265625, 66.8987045288086, 142.70462036132812, 156.96347045898438, 205.10641479492188, 85.58142852783203, 11.918693542480469, 0.22412490844726562, 167.72349548339844, 76.96365356445312, 70.43546295166016, 20.90380096435547, 22.54731559753418, 18.803508758544922, -1.913839340209961, -142.61785888671875, -34.03346252441406, 147.30941772460938, -34.16374206542969, -13.917739868164062, 168.3697509765625, 132.89801025390625, -72.04217529296875, 62.246620178222656, 123.61639404296875, -14.041372299194336, 73.18499755859375, 27.7530517578125, 76.45379638671875, 158.12393188476562, 80.29060363769531, 161.9412841796875, 7.009925842285156, 23.497663497924805], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000442.npy"} +{"epoch": 0.6681783824640968, "step": 443, "batch_size": 64, "mean": 82.42811584472656, "std": 94.2217025756836, "min": -159.83383178710938, "p10": -16.974423217773435, "median": 86.89866256713867, "p90": 171.36451568603516, "max": 393.2523498535156, "pos_frac": 0.796875, "sample": [9.784961700439453, 149.90773010253906, 88.57267761230469, 156.990478515625, 28.968597412109375, 75.96511840820312, 129.92250061035156, -66.01078796386719, 60.69670104980469, 106.48738098144531, -18.009010314941406, -14.419313430786133, 59.711246490478516, 163.28163146972656, 61.718441009521484, 194.7188720703125, 8.033212661743164, 130.15057373046875, 85.22464752197266, 159.88272094726562, 393.2523498535156, -159.83383178710938, -23.237831115722656, 149.7724609375, 0.7920742034912109, 229.28982543945312, 112.42548370361328, 84.15337371826172, 161.80572509765625, 158.13876342773438, 146.45166015625, 123.41409301757812, 123.67787170410156, 151.75384521484375, 102.65225219726562, 173.15582275390625, 159.51011657714844, 166.5108184814453, 119.86199951171875, 184.0917510986328, 8.68621826171875, 149.24147033691406, -10.466272354125977, 69.2894058227539, 167.18479919433594, 160.6342010498047, -14.560386657714844, 16.06097412109375, 17.733741760253906, 9.790266036987305, 5.134159088134766, -48.251808166503906, 139.05096435546875, -1.8229217529296875, 48.05331039428711, 14.342304229736328, -144.32327270507812, -21.443115234375, 208.63148498535156, 42.73982238769531, -0.4279289245605469, -6.443489074707031, 99.81291198730469, 237.53550720214844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000443.npy"} +{"epoch": 0.6696900982615268, "step": 444, "batch_size": 64, "mean": 34.28218078613281, "std": 90.00736999511719, "min": -167.95452880859375, "p10": -77.61390838623045, "median": 17.044621467590332, "p90": 162.4079147338867, "max": 244.3642578125, "pos_frac": 0.65625, "sample": [119.59677124023438, -3.635814666748047, -48.97869110107422, 3.323854446411133, 20.245086669921875, 22.720172882080078, 95.82781982421875, -43.30854797363281, 7.786342620849609, 109.28483581542969, 5.921104431152344, 86.98834991455078, -85.51835632324219, -119.28778076171875, 68.90132141113281, 16.644866943359375, 77.69377136230469, 65.61544036865234, 50.59328842163086, -94.9259033203125, 201.15731811523438, 173.37533569335938, 0.4804496765136719, -28.391448974609375, -12.598114013671875, 41.28565216064453, 7.002006530761719, -12.208555221557617, -59.170196533203125, -57.3193359375, 154.00259399414062, 13.632579803466797, 145.65716552734375, 47.9178466796875, 23.608184814453125, 144.66281127929688, 33.165367126464844, 165.872314453125, -11.932235717773438, -167.95452880859375, 34.76776123046875, 244.3642578125, -116.297607421875, -53.537986755371094, -6.233793258666992, 162.50341796875, 140.68521118164062, 222.9700927734375, 169.67083740234375, 68.04176330566406, 17.44437599182129, 85.66752624511719, 2.545574188232422, 12.17010498046875, 151.03585815429688, -16.788049697875977, -42.350101470947266, 19.84563636779785, 4.152099609375, -97.11894226074219, -123.81124114990234, 162.18507385253906, -2.3583011627197266, -3.2273426055908203], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000444.npy"} +{"epoch": 0.671201814058957, "step": 445, "batch_size": 64, "mean": 68.70869445800781, "std": 83.65740966796875, "min": -118.05299377441406, "p10": -34.44050922393799, "median": 70.3913459777832, "p90": 172.03779754638674, "max": 216.19869995117188, "pos_frac": 0.8125, "sample": [25.104000091552734, 216.19869995117188, 15.206321716308594, -15.590103149414062, -42.366302490234375, 29.491622924804688, 162.68972778320312, 141.67112731933594, 63.890899658203125, 69.79060363769531, 0.585418701171875, -93.13391876220703, -35.63194274902344, 18.699386596679688, -99.49501037597656, 155.51962280273438, -24.40057373046875, 10.839126586914062, 29.40606689453125, 59.65534210205078, 1.183990478515625, 169.53677368164062, -118.05299377441406, 44.79066467285156, -77.5710678100586, 165.68890380859375, 8.120857238769531, 164.45887756347656, 53.886634826660156, 9.71478271484375, -52.32432174682617, -12.523351669311523, 79.72149658203125, 185.14349365234375, 177.65713500976562, 89.95188903808594, 147.0735626220703, 166.56430053710938, 72.21131896972656, -2.4318161010742188, 176.1199951171875, 82.71794891357422, 65.36569213867188, 199.8883819580078, 159.58673095703125, 166.3501739501953, 202.93011474609375, 15.308420181274414, 142.9534454345703, -31.660497665405273, 106.26103210449219, 1.5820083618164062, 11.179443359375, 88.87751007080078, 87.94678497314453, 75.11978149414062, 160.57431030273438, 158.30789184570312, 70.9920883178711, 74.45645904541016, 114.3781509399414, 113.07083892822266, 173.1096649169922, 21.00896453857422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000445.npy"} +{"epoch": 0.672713529856387, "step": 446, "batch_size": 64, "mean": 74.02444458007812, "std": 79.93746948242188, "min": -88.68132019042969, "p10": -13.43291835784912, "median": 65.1898422241211, "p90": 177.48841705322266, "max": 268.1488952636719, "pos_frac": 0.796875, "sample": [6.791425704956055, 3.0368118286132812, -88.68132019042969, 124.81710815429688, 41.03168487548828, 114.30281066894531, 56.54451370239258, -17.719032287597656, 268.1488952636719, 43.87040710449219, 28.16379165649414, 121.14500427246094, 103.85443115234375, 145.51840209960938, 108.01041412353516, 174.15892028808594, 14.162391662597656, 86.81681823730469, 91.5595474243164, 62.051414489746094, 3.8099403381347656, 127.90725708007812, -7.021484375, 152.351318359375, 178.91534423828125, 83.5009765625, 13.992450714111328, 153.42459106445312, 185.58358764648438, -22.963706970214844, 147.51205444335938, 1.2419681549072266, -80.13751983642578, -2.5519638061523438, -12.92877197265625, 0.9734554290771484, 9.571456909179688, -22.30581283569336, 68.3282699584961, 127.45577239990234, 46.359710693359375, 195.99659729003906, 186.93780517578125, 153.85739135742188, 240.97845458984375, -0.14058494567871094, 208.63290405273438, 167.16229248046875, -13.648981094360352, 38.33295822143555, 70.63545989990234, 32.89009094238281, 84.23751831054688, 125.11335754394531, 163.23316955566406, 173.240966796875, 15.285572052001953, 31.998313903808594, -2.9720535278320312, 95.81185913085938, -3.4933395385742188, 51.12534713745117, -46.3497314453125, 128.0958251953125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000446.npy"} +{"epoch": 0.674225245653817, "step": 447, "batch_size": 64, "mean": 81.6279525756836, "std": 91.6844711303711, "min": -169.06076049804688, "p10": -38.87104606628417, "median": 90.86869049072266, "p90": 187.87896575927735, "max": 217.27542114257812, "pos_frac": 0.8125, "sample": [217.27542114257812, 189.98448181152344, 150.01980590820312, 17.270126342773438, 40.49504852294922, -24.353713989257812, 196.88433837890625, 10.200439453125, -112.1464614868164, 30.383041381835938, 70.50789642333984, 128.65423583984375, 7.152137756347656, 75.501953125, 173.97592163085938, 173.78941345214844, 84.15924072265625, 84.92581176757812, 55.67501449584961, 70.0321044921875, 20.50762939453125, -24.58863067626953, 39.93656921386719, -42.93140411376953, 40.85780334472656, 206.09750366210938, 189.40394592285156, 168.99961853027344, 134.08233642578125, -54.575714111328125, 91.41671752929688, 90.32066345214844, 164.2187042236328, 161.16867065429688, 100.26931762695312, 156.31619262695312, 199.49734497070312, 139.76885986328125, 182.29067993164062, 6.484897613525391, 18.926651000976562, 92.508056640625, 176.3526611328125, -87.13240814208984, -29.39687728881836, -123.80718994140625, 34.05225372314453, 152.90707397460938, 167.36883544921875, 108.8160171508789, -11.130889892578125, 157.29283142089844, -62.33505630493164, 184.3206787109375, 87.02720642089844, 68.97866821289062, 108.12895202636719, -169.06076049804688, 112.99561309814453, 196.24856567382812, 175.98580932617188, -16.201141357421875, 124.54629516601562, 146.86920166015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000447.npy"} +{"epoch": 0.6757369614512472, "step": 448, "batch_size": 64, "mean": 65.02684020996094, "std": 85.6777572631836, "min": -167.41680908203125, "p10": -40.4695129394531, "median": 55.25187301635742, "p90": 169.16433258056642, "max": 278.0973815917969, "pos_frac": 0.828125, "sample": [149.18203735351562, -119.08043670654297, 170.1876220703125, 72.98759460449219, 80.6105728149414, 103.48499298095703, -1.2818069458007812, 133.860107421875, 55.82365417480469, 3.2582168579101562, 145.16184997558594, 95.20426177978516, 68.48831176757812, 12.842864990234375, 133.78143310546875, 188.76988220214844, -10.374507904052734, 188.98995971679688, 38.59368133544922, 5.757534027099609, 9.038803100585938, 158.76351928710938, 51.407264709472656, 86.36659240722656, 133.85922241210938, 1.4936943054199219, 166.7766571044922, 54.680091857910156, 20.671913146972656, -55.91169738769531, -60.84032440185547, 39.84431457519531, 44.191062927246094, 8.39385986328125, 13.542549133300781, 95.80940246582031, -52.415130615234375, 32.31846618652344, 215.13705444335938, -12.596406936645508, 7.448522567749023, -167.41680908203125, 82.63377380371094, 44.95857238769531, 116.7086181640625, 142.9940643310547, 101.01124572753906, 146.78961181640625, 61.68358612060547, 34.210899353027344, -52.961143493652344, 44.31629943847656, 70.33059692382812, 158.16966247558594, 1.2969589233398438, 278.0973815917969, -1.9915924072265625, -113.94791412353516, 165.61062622070312, 170.7767791748047, 158.50357055664062, 43.025421142578125, 17.37476348876953, 185.31561279296875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000448.npy"} +{"epoch": 0.6772486772486772, "step": 449, "batch_size": 64, "mean": 32.7079963684082, "std": 79.23725128173828, "min": -126.50901794433594, "p10": -74.98603134155273, "median": 26.37685203552246, "p90": 151.13214111328125, "max": 197.97264099121094, "pos_frac": 0.65625, "sample": [4.765375137329102, 46.242431640625, -109.48648071289062, 68.16064453125, 27.963218688964844, -4.4001617431640625, -19.145431518554688, 74.30103302001953, 48.80493927001953, 182.10791015625, 123.55791473388672, 72.63301849365234, 4.222099304199219, -50.27278137207031, -11.10540771484375, -8.907012939453125, 197.97264099121094, 3.8458824157714844, 3.1301422119140625, 71.42393493652344, -46.65511703491211, 49.65662384033203, 170.04922485351562, 149.18154907226562, -126.50901794433594, -0.2741050720214844, 120.0468978881836, -110.49020385742188, 122.29492950439453, 40.065948486328125, 53.62068176269531, -28.171951293945312, 35.4677734375, -83.33683776855469, 160.50485229492188, 16.30176544189453, 176.28553771972656, -4.167751312255859, 38.2555046081543, 46.255767822265625, 13.865362167358398, 0.8106231689453125, -59.82284164428711, 34.02777099609375, -77.96965026855469, 69.45542907714844, -3.3772430419921875, 151.96810913085938, 9.671695709228516, 81.77823638916016, 157.62850952148438, -12.468795776367188, 34.963111877441406, 7.3520660400390625, -100.17132568359375, 144.49786376953125, 117.82147216796875, -68.02425384521484, 133.07879638671875, -47.841514587402344, 72.19367980957031, -81.40542602539062, 24.790485382080078, -13.706268310546875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000449.npy"} +{"epoch": 0.6787603930461074, "step": 450, "batch_size": 64, "mean": 51.395240783691406, "std": 92.3817367553711, "min": -117.33939361572266, "p10": -47.728652191162105, "median": 25.146923065185547, "p90": 177.79769592285157, "max": 267.5722961425781, "pos_frac": 0.671875, "sample": [0.5470943450927734, -30.18255615234375, -40.424964904785156, -35.69249725341797, 267.5722961425781, 189.27969360351562, 64.19752502441406, 64.03854370117188, 151.89466857910156, 178.16543579101562, 89.6349868774414, 24.400846481323242, 58.551902770996094, 41.355560302734375, 2.7839889526367188, 175.59347534179688, -0.1885986328125, 58.73789978027344, 146.94277954101562, 240.99798583984375, -0.9912452697753906, 41.71345901489258, -15.235771179199219, -24.023277282714844, 71.90208435058594, -42.26961135864258, 6.207328796386719, 180.37966918945312, 53.71782684326172, 3.6368350982666016, -6.337287902832031, 161.18252563476562, 24.25365447998047, 105.18876647949219, -117.33939361572266, 176.93963623046875, 146.60916137695312, -2.574115753173828, 212.79116821289062, 27.985858917236328, 16.615901947021484, -3.0172500610351562, 107.71954345703125, -100.23482513427734, 27.730697631835938, 9.049203872680664, 129.0310516357422, -6.295074462890625, 142.40863037109375, -50.068241119384766, 25.89299964904785, -95.75714874267578, 16.631380081176758, 97.2562255859375, 255.01034545898438, 2.589508056640625, -75.36869812011719, 149.11196899414062, -95.67097473144531, 170.2391357421875, -57.91102600097656, 20.74018096923828, -30.2609806060791, -18.090675354003906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000450.npy"} +{"epoch": 0.6802721088435374, "step": 451, "batch_size": 64, "mean": 48.64530944824219, "std": 82.47926330566406, "min": -148.83627319335938, "p10": -34.110993194580075, "median": 40.908103942871094, "p90": 155.7907913208008, "max": 238.30075073242188, "pos_frac": 0.703125, "sample": [97.32135009765625, 7.49578857421875, 59.568359375, 40.64347839355469, 153.28382873535156, 41.1727294921875, -148.83627319335938, 48.573028564453125, 2.182443618774414, 185.11856079101562, 72.35240173339844, 84.92426300048828, 143.2962646484375, 39.383026123046875, 144.62289428710938, 54.806060791015625, 57.147377014160156, 7.979072570800781, 26.984464645385742, 89.53349304199219, -2.0723323822021484, -116.45824432373047, -90.68757629394531, 238.30075073242188, 156.86520385742188, -39.15081787109375, 109.4571533203125, -98.33099365234375, -35.897857666015625, -0.7685890197753906, 45.548377990722656, 225.41079711914062, -13.530651092529297, -0.9667911529541016, 137.168701171875, 76.7282485961914, 170.4316864013672, 123.63407897949219, -22.761962890625, 12.026603698730469, 17.188209533691406, 107.16960144042969, 2.7765769958496094, 0.5360107421875, 98.62153625488281, 35.696563720703125, 2.5588111877441406, 128.4340057373047, 187.40452575683594, 83.71028137207031, -16.374786376953125, 132.9697265625, 41.21299743652344, -29.94164276123047, -0.454498291015625, 7.0601806640625, 148.480712890625, -0.4217796325683594, -5.81297492980957, 44.13663101196289, 174.35482788085938, -9.691410064697266, -101.72943115234375, -17.08332061767578], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000451.npy"} +{"epoch": 0.6817838246409675, "step": 452, "batch_size": 64, "mean": 55.15898132324219, "std": 92.110595703125, "min": -148.13092041015625, "p10": -69.76631927490233, "median": 46.6424674987793, "p90": 169.01803283691407, "max": 239.5393829345703, "pos_frac": 0.75, "sample": [30.58861541748047, -19.54322052001953, 22.51270866394043, 74.38058471679688, 4.407585144042969, 92.85112762451172, 17.590408325195312, 161.4000701904297, 145.02508544921875, 181.0650634765625, 17.084026336669922, 227.4856719970703, -139.413330078125, 118.74188232421875, 162.70120239257812, 89.36568450927734, 239.5393829345703, 107.61770629882812, 114.53060913085938, 133.42831420898438, 28.232933044433594, -16.3912353515625, 211.07015991210938, 124.39962768554688, 17.679302215576172, -9.874353408813477, 150.69126892089844, 51.91357421875, -2.1537551879882812, 28.153175354003906, 5.075115203857422, 210.64483642578125, -100.5806884765625, 164.70590209960938, -59.27705383300781, 93.04585266113281, 41.371360778808594, 105.24681091308594, -116.53816986083984, 15.344928741455078, 90.9587173461914, -85.98577880859375, 101.29668426513672, 55.6676025390625, 69.44540405273438, -122.20634460449219, 183.39990234375, 126.90047454833984, 27.119918823242188, 4.792816162109375, 116.51943969726562, -10.81243896484375, 10.844766616821289, 127.66806030273438, 4.059154510498047, 8.044967651367188, -38.166099548339844, 170.8660888671875, 143.92453002929688, -74.26171875, -15.954025268554688, 69.74774932861328, -148.13092041015625, -9.682601928710938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000452.npy"} +{"epoch": 0.6832955404383976, "step": 453, "batch_size": 64, "mean": 58.01622772216797, "std": 90.83164978027344, "min": -130.21923828125, "p10": -45.527077865600575, "median": 54.68796157836914, "p90": 183.1062438964844, "max": 259.4002685546875, "pos_frac": 0.6875, "sample": [100.83126068115234, 59.86851501464844, 4.519500732421875, -9.809562683105469, 183.58242797851562, 28.661788940429688, -15.730697631835938, 152.5490264892578, 133.9082489013672, -24.302146911621094, -109.71223449707031, -4.026390075683594, 56.93121337890625, -1.9769744873046875, 141.67852783203125, 157.21115112304688, 259.4002685546875, 50.253326416015625, 181.99514770507812, 61.07822799682617, 1.6308040618896484, -21.291961669921875, 58.62593078613281, 21.538894653320312, 7.7000579833984375, -130.21923828125, -127.7876968383789, 178.9542694091797, -7.399909973144531, 164.59124755859375, 193.79971313476562, 48.063507080078125, 97.59867858886719, -48.9588623046875, -10.16994857788086, 53.59504699707031, 151.0373077392578, 139.7412567138672, -80.15982055664062, 157.7271728515625, 55.78087615966797, 222.6430206298828, -52.24802780151367, 0.9172935485839844, -29.178482055664062, 33.08192443847656, -81.99046325683594, 23.756366729736328, 141.23849487304688, 71.78237915039062, -3.6179161071777344, -17.978946685791016, 57.25328063964844, 90.13575744628906, 104.46170043945312, -37.51958084106445, -3.3395729064941406, 84.27798461914062, 184.2307891845703, 60.38812255859375, 208.5948486328125, 143.69638061523438, 195.64358520507812, 5.50177001953125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000453.npy"} +{"epoch": 0.6848072562358276, "step": 454, "batch_size": 64, "mean": 62.78339385986328, "std": 92.09689331054688, "min": -218.58740234375, "p10": -30.688591003417965, "median": 58.96108055114746, "p90": 172.35779571533203, "max": 320.255615234375, "pos_frac": 0.8125, "sample": [158.2506103515625, -43.24267578125, -28.135635375976562, 179.29855346679688, -218.58740234375, -14.57573127746582, 145.67576599121094, 26.10260772705078, 9.042652130126953, 37.573097229003906, 72.60227966308594, 168.8466339111328, 20.970245361328125, -176.30062866210938, 178.81304931640625, 99.52285766601562, 167.75230407714844, 69.09468078613281, 173.86257934570312, 43.95606994628906, -9.91912841796875, -109.27371215820312, 4.537698745727539, 165.23590087890625, 191.15225219726562, 320.255615234375, -7.100835800170898, 27.6785888671875, -36.79187774658203, 24.518531799316406, -31.78271484375, 98.90116119384766, 151.1200714111328, 25.398048400878906, 105.2074966430664, 82.5087661743164, 197.2724609375, -54.877384185791016, 179.34576416015625, 64.19094848632812, 76.61639404296875, 115.20233154296875, 5.380851745605469, 0.8468770980834961, 5.90667724609375, 32.583274841308594, 162.88180541992188, 119.74642944335938, 3.9468860626220703, 30.103302001953125, 130.2652130126953, 134.51739501953125, 6.186275482177734, 154.52679443359375, 109.2568130493164, 29.88079833984375, 113.48458099365234, 86.40086364746094, 2.5705718994140625, 119.76461791992188, 88.97386932373047, 53.7312126159668, 2.515695571899414, -25.25220489501953], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000454.npy"} +{"epoch": 0.6863189720332578, "step": 455, "batch_size": 64, "mean": 60.55400085449219, "std": 85.73413848876953, "min": -118.02794647216797, "p10": -40.14814720153808, "median": 36.47736740112305, "p90": 183.37806396484376, "max": 260.7884216308594, "pos_frac": 0.78125, "sample": [91.61602783203125, 36.672821044921875, 51.24359893798828, 211.33895874023438, 63.526206970214844, 2.042123794555664, 234.84239196777344, 143.69790649414062, -42.639808654785156, 30.480125427246094, 88.23506164550781, -118.02794647216797, 78.27210998535156, 94.31095886230469, 56.59552001953125, 260.7884216308594, -21.713218688964844, 13.690277099609375, 24.050048828125, -54.004676818847656, 191.15057373046875, 4.450433731079102, 148.2531280517578, -4.730159759521484, -11.942680358886719, 180.38720703125, 30.256179809570312, 124.14463806152344, 174.12196350097656, 36.28191375732422, 19.000286102294922, 21.419992446899414, 181.0595703125, 21.63916778564453, 32.67720031738281, -3.1684646606445312, -81.37074279785156, 96.92095947265625, 147.63674926757812, 162.58026123046875, -45.027957916259766, 25.817596435546875, 86.09457397460938, -30.84808349609375, 147.8299102783203, 208.02931213378906, 53.751426696777344, 58.219383239746094, 5.3128814697265625, 13.62042236328125, 184.3717041015625, 38.06249237060547, -1.6025505065917969, 145.09181213378906, 9.597000122070312, 10.49822998046875, 42.18589401245117, -62.10059356689453, -46.036346435546875, 26.488929748535156, 48.91607666015625, 25.264835357666016, -34.33427047729492, 250.46835327148438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000455.npy"} +{"epoch": 0.6878306878306878, "step": 456, "batch_size": 64, "mean": 55.74595642089844, "std": 86.45791625976562, "min": -138.8593292236328, "p10": -23.901129531860345, "median": 34.1093692779541, "p90": 169.0295562744141, "max": 313.9625549316406, "pos_frac": 0.796875, "sample": [110.10246276855469, 0.09676361083984375, 2.1790027618408203, 94.04901885986328, 313.9625549316406, 1.5845222473144531, -26.291057586669922, 86.05961608886719, -8.69790267944336, 121.63728332519531, 55.75584411621094, 57.698909759521484, 220.8125, 147.48062133789062, 21.706436157226562, 8.758834838867188, 92.46479797363281, 74.91048431396484, 4.714849472045898, 173.6929931640625, -72.11851501464844, 16.324691772460938, 55.85260772705078, -18.324630737304688, 143.55245971679688, -2.6855030059814453, -138.8593292236328, -102.98158264160156, 129.59902954101562, -33.809356689453125, 8.519542694091797, 60.06105041503906, 16.432275772094727, 107.08100891113281, 19.47490692138672, 87.32252502441406, 35.90045166015625, 1.1379547119140625, 91.6407470703125, 5.895565032958984, -14.246191024780273, 32.31828689575195, 62.99707794189453, 85.79600524902344, -94.50434875488281, -107.78435516357422, 110.82987976074219, 1.72540283203125, -14.999168395996094, -7.258258819580078, 132.03187561035156, 173.0950927734375, 15.0538330078125, 226.67481994628906, 30.54638671875, 130.7988739013672, 186.82081604003906, 16.66112518310547, 127.7922134399414, 159.54330444335938, 21.916505813598633, 23.644134521484375, 66.24125671386719, 239.35206604003906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000456.npy"} +{"epoch": 0.6893424036281179, "step": 457, "batch_size": 64, "mean": 57.726070404052734, "std": 75.64600372314453, "min": -117.53300476074219, "p10": -14.26754703521728, "median": 39.77702522277832, "p90": 168.96298980712893, "max": 205.75343322753906, "pos_frac": 0.828125, "sample": [29.70478057861328, 3.0761566162109375, 10.038875579833984, 118.315185546875, 72.38172912597656, -88.26881408691406, 32.8962287902832, 57.06697082519531, 32.631507873535156, 9.2845458984375, 24.74263572692871, 203.9447021484375, 139.29794311523438, 93.64302825927734, -8.623477935791016, -73.34759521484375, 164.69410705566406, 30.683700561523438, 1.2844600677490234, 141.16647338867188, 146.60678100585938, 59.20257568359375, 205.75343322753906, 31.288803100585938, 3.921855926513672, 68.85035705566406, -16.686433792114258, 159.30419921875, -7.680854797363281, 7.204082489013672, -69.391845703125, -104.01358795166016, 11.853652954101562, 118.83770751953125, 25.788333892822266, -37.75390625, -117.53300476074219, 57.47874450683594, 90.44329071044922, 18.6650390625, 84.69678497314453, 10.911170959472656, 170.79251098632812, 138.2581787109375, -1.8570365905761719, 16.33179473876953, 131.39207458496094, 27.720170974731445, 10.141075134277344, 171.1038818359375, 106.64862823486328, 92.17229461669922, 177.87332153320312, 107.44727325439453, 91.33819580078125, 175.48854064941406, 173.385009765625, 43.638145446777344, 24.655744552612305, 35.9159049987793, 132.98960876464844, -4.72186279296875, 69.572021484375, 61.822784423828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000457.npy"} +{"epoch": 0.690854119425548, "step": 458, "batch_size": 64, "mean": 61.138328552246094, "std": 89.64224243164062, "min": -186.57058715820312, "p10": -29.198367881774903, "median": 50.42523384094238, "p90": 181.36076660156252, "max": 267.93707275390625, "pos_frac": 0.8125, "sample": [119.11004638671875, 133.48275756835938, 6.537836074829102, 130.57330322265625, 64.91028594970703, 25.742984771728516, 92.05783081054688, -186.57058715820312, 0.03040313720703125, 10.451370239257812, -5.6038055419921875, -73.69883728027344, -25.235824584960938, 182.79579162597656, 166.11477661132812, 35.59723663330078, 50.19622039794922, 156.14141845703125, 44.34679412841797, 87.97004699707031, 17.96876335144043, 41.04292297363281, 40.856910705566406, -11.195198059082031, 132.38157653808594, 27.572647094726562, 200.7699432373047, 72.21334075927734, 23.55982208251953, 135.25006103515625, 202.16574096679688, 61.260467529296875, 56.03203201293945, -94.81978607177734, 57.13926696777344, 0.04480171203613281, 25.877647399902344, 27.195213317871094, 74.40919494628906, 145.00347900390625, 128.42774963378906, 50.65424728393555, -160.76776123046875, -4.7685699462890625, 212.09417724609375, 6.627147674560547, 128.8920135498047, -28.39644432067871, 171.48379516601562, 197.86643981933594, -29.542049407958984, 267.93707275390625, 93.18861389160156, 28.587411880493164, -94.47917175292969, 178.0123748779297, 54.01586151123047, 154.43704223632812, -51.547576904296875, 28.71490478515625, 10.840251922607422, 36.17298889160156, 196.1859130859375, 88.53790283203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000458.npy"} +{"epoch": 0.6923658352229781, "step": 459, "batch_size": 64, "mean": 77.55421447753906, "std": 91.0995101928711, "min": -191.20367431640625, "p10": -16.83669319152832, "median": 76.19469451904297, "p90": 189.17154541015626, "max": 249.8273468017578, "pos_frac": 0.796875, "sample": [55.70232391357422, 116.3760986328125, -17.430313110351562, 122.92413330078125, 14.966629028320312, -191.20367431640625, 0.0003833770751953125, 172.90420532226562, 97.77157592773438, 148.99185180664062, 190.07843017578125, -27.280445098876953, 82.50440979003906, -61.24275207519531, 176.1931915283203, 218.02049255371094, 81.24705505371094, 91.31088256835938, 17.994125366210938, 148.3214874267578, 141.07907104492188, 170.97657775878906, 71.142333984375, 22.919822692871094, 12.254549026489258, 165.4793701171875, 53.59386444091797, 142.67156982421875, 49.67019271850586, 130.84130859375, 238.18988037109375, 32.34227752685547, -11.221635818481445, 16.967557907104492, -0.9755935668945312, 137.71307373046875, 64.10245513916016, -106.97648620605469, 158.22543334960938, -15.451580047607422, -0.9695529937744141, 120.27731323242188, 163.08042907714844, 4.054901123046875, 249.8273468017578, -92.27899169921875, 100.2749252319336, 30.128257751464844, -72.0477294921875, 110.82463836669922, -0.5146865844726562, 6.90313720703125, -13.946134567260742, 203.2576904296875, 119.8116455078125, 47.25004577636719, 163.96559143066406, 69.5537109375, 187.05548095703125, 185.30526733398438, 194.24014282226562, 17.2989501953125, 193.23953247070312, 65.18399810791016], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000459.npy"} +{"epoch": 0.6938775510204082, "step": 460, "batch_size": 64, "mean": 74.39859008789062, "std": 88.5855941772461, "min": -93.9857177734375, "p10": -28.365875244140625, "median": 48.87944412231445, "p90": 183.78662414550783, "max": 286.468017578125, "pos_frac": 0.78125, "sample": [214.3435516357422, 105.79873657226562, 228.85595703125, -43.05885314941406, 19.51097869873047, 174.71290588378906, 202.83909606933594, 43.44158935546875, 286.468017578125, 5.554901123046875, -42.85710144042969, -27.814834594726562, 15.954460144042969, 22.67278289794922, 3.473541259765625, 14.217323303222656, 25.03388786315918, 162.02450561523438, -34.28825378417969, 166.20257568359375, 88.83636474609375, 176.3345184326172, 40.257728576660156, 195.76129150390625, 160.77728271484375, 92.74254608154297, 11.46627426147461, 38.75994873046875, 171.1970672607422, 68.70765686035156, 112.5772705078125, 161.04031372070312, 149.40061950683594, 116.21429443359375, 11.574342727661133, 82.28953552246094, 5.982025146484375, 22.241653442382812, 41.8507080078125, -3.202829360961914, 96.58271789550781, 166.5837860107422, -22.326683044433594, 9.160547256469727, 107.87559509277344, 176.77748107910156, -41.324615478515625, -11.9410400390625, 138.95904541015625, -93.9857177734375, -0.9622707366943359, 42.6949462890625, 169.7606201171875, 56.63740539550781, 15.224441528320312, 186.79054260253906, 54.317298889160156, 257.64703369140625, -71.52194213867188, -28.602035522460938, 110.94979858398438, -4.40374755859375, -14.010658264160156, 172.73294067382812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000460.npy"} +{"epoch": 0.6953892668178382, "step": 461, "batch_size": 64, "mean": 75.10448455810547, "std": 86.03243255615234, "min": -86.22006225585938, "p10": -28.613871765136718, "median": 66.4798355102539, "p90": 186.66881408691407, "max": 255.41653442382812, "pos_frac": 0.765625, "sample": [191.16693115234375, 73.60272979736328, 35.25856018066406, 57.30274963378906, 157.1815948486328, 198.28053283691406, 50.332496643066406, 149.41958618164062, 136.59048461914062, -73.23971557617188, -15.408645629882812, 66.90412902832031, 66.0555419921875, 5.446298599243164, 121.26306915283203, -21.023422241210938, -61.39033508300781, 177.43350219726562, 3.7089920043945312, 4.042577743530273, 121.68159484863281, 147.9309844970703, 145.01470947265625, 4.251495361328125, 30.655052185058594, 114.87985229492188, -33.397361755371094, -9.442432403564453, -28.82469940185547, 100.7148208618164, 165.58401489257812, -28.12194061279297, -18.1540470123291, 73.5904312133789, 145.67637634277344, 186.60662841796875, 255.41653442382812, 176.71551513671875, 52.60272216796875, 226.50411987304688, 176.2054901123047, 168.3052520751953, 100.93183898925781, 59.02471160888672, 3.903074264526367, -26.553482055664062, 78.64894104003906, -0.8513393402099609, 156.99061584472656, 26.813270568847656, 190.27137756347656, 78.02286529541016, 46.995574951171875, 27.140335083007812, 186.69546508789062, -27.169708251953125, 194.9110870361328, -86.22006225585938, 40.040977478027344, -29.89513397216797, 159.14016723632812, 2.8449783325195312, 172.55502319335938, -44.87599182128906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000461.npy"} +{"epoch": 0.6969009826152683, "step": 462, "batch_size": 64, "mean": 76.93798828125, "std": 85.79206848144531, "min": -153.25723266601562, "p10": -14.579668045043945, "median": 67.26665878295898, "p90": 173.54538116455078, "max": 252.18618774414062, "pos_frac": 0.796875, "sample": [168.46046447753906, 191.41326904296875, 183.81137084960938, 164.099609375, 7.804603576660156, 26.7550048828125, 137.4833984375, -0.12099838256835938, 0.32646942138671875, 5.083824157714844, -40.179893493652344, 169.69561767578125, 157.19537353515625, 49.490440368652344, 169.80752563476562, 185.16876220703125, -6.9423828125, 162.8196563720703, 22.25682830810547, 112.3069076538086, 147.54002380371094, 61.80033874511719, 52.128662109375, 137.78021240234375, 57.160858154296875, 10.680152893066406, 148.63800048828125, 185.53103637695312, -14.925045013427734, 126.85757446289062, -27.665069580078125, -13.773788452148438, -9.668830871582031, 163.96609497070312, 171.60629272460938, -56.542388916015625, -29.264799118041992, 107.875732421875, 55.80054473876953, 108.27362060546875, 164.319091796875, 174.3764190673828, 76.30217742919922, 37.820709228515625, 45.56205749511719, 178.118408203125, -0.9085540771484375, 28.10439682006836, 146.07611083984375, 151.86727905273438, 69.27847290039062, -140.15794372558594, 147.17529296875, 169.90472412109375, 119.85661315917969, 8.359642028808594, 24.037691116333008, 252.18618774414062, 84.2919692993164, 65.25484466552734, -153.25723266601562, 7.753532409667969, -5.540903091430664, 22.714984893798828], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000462.npy"} +{"epoch": 0.6984126984126984, "step": 463, "batch_size": 64, "mean": 46.52490997314453, "std": 80.51114654541016, "min": -175.52883911132812, "p10": -52.002571105957024, "median": 38.20619010925293, "p90": 153.67540740966797, "max": 202.4825897216797, "pos_frac": 0.71875, "sample": [-0.9311943054199219, 148.39779663085938, 84.16726684570312, -175.52883911132812, 91.08143615722656, 134.3511199951172, -20.278696060180664, 172.68614196777344, 138.24185180664062, 94.42595672607422, -56.49293899536133, -53.94136047363281, 1.4595108032226562, 68.41798400878906, 140.5314483642578, -112.04208374023438, 33.03595733642578, 37.13868713378906, 4.651542663574219, -71.46561431884766, 56.40428161621094, 29.403709411621094, -16.406158447265625, 174.87088012695312, 66.8618392944336, -31.840972900390625, 27.998031616210938, 18.03455352783203, -8.225532531738281, 6.571987152099609, 33.51731872558594, 12.033988952636719, 168.15411376953125, 159.8208465576172, 47.888919830322266, 122.74678802490234, 116.05744171142578, 35.20825958251953, 8.134986877441406, 202.4825897216797, 39.2736930847168, 18.14971160888672, 69.12741088867188, -83.45497131347656, -25.00289535522461, -47.478729248046875, 195.57867431640625, 103.52745056152344, 154.8472137451172, 104.90310668945312, 42.77338790893555, -122.86954498291016, -4.476966857910156, -14.080869674682617, 59.90663146972656, 150.94119262695312, 58.30427932739258, -2.190521240234375, 95.92565155029297, 104.38082122802734, -9.440963745117188, 59.46479797363281, 10.920377731323242, 130.9415740966797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000463.npy"} +{"epoch": 0.6999244142101285, "step": 464, "batch_size": 64, "mean": 70.37861633300781, "std": 96.32426452636719, "min": -158.14309692382812, "p10": -41.63649444580078, "median": 75.95195388793945, "p90": 200.2273361206055, "max": 230.80665588378906, "pos_frac": 0.734375, "sample": [-32.12297058105469, 31.102081298828125, 168.20721435546875, -42.5203857421875, 166.78543090820312, -2.9966278076171875, 7.209510803222656, 161.52227783203125, 76.73678588867188, 120.837890625, 167.072265625, -32.00597381591797, 128.92474365234375, 99.9681625366211, 83.45217895507812, -103.32369995117188, 203.6268310546875, 117.6728515625, 37.39442443847656, 149.84609985351562, 12.334220886230469, 230.80665588378906, -21.278718948364258, 101.3795394897461, 25.559310913085938, 162.69866943359375, 53.43769073486328, 208.38644409179688, 117.48458862304688, 131.76329040527344, 90.02079772949219, 14.260719299316406, 167.80307006835938, 225.8151092529297, -132.40621948242188, -39.57408142089844, 177.50604248046875, 75.16712188720703, -109.4560546875, -64.44450378417969, 150.01004028320312, 16.724525451660156, 39.74343490600586, 211.23391723632812, -50.45703887939453, -1.8416824340820312, 19.09064483642578, 54.96961975097656, -4.9755859375, 215.8197784423828, 122.79566955566406, 198.84165954589844, -158.14309692382812, -19.15073013305664, 35.94275665283203, -21.343303680419922, 15.330299377441406, 173.11114501953125, 117.74705505371094, 200.82119750976562, -22.849281311035156, 126.38996887207031, 137.98443603515625, 11.783187866210938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000464.npy"} +{"epoch": 0.7014361300075586, "step": 465, "batch_size": 64, "mean": 57.592037200927734, "std": 92.12824249267578, "min": -121.5587158203125, "p10": -58.322994995117185, "median": 63.169944763183594, "p90": 178.13519592285158, "max": 223.83743286132812, "pos_frac": 0.671875, "sample": [-56.72740173339844, 223.83743286132812, 152.529541015625, -118.34335327148438, 144.63497924804688, 153.57229614257812, -36.56614685058594, 179.71383666992188, 36.36256408691406, 68.89253997802734, 69.12019348144531, 167.1142578125, 131.5348663330078, 207.92868041992188, -52.959800720214844, 138.63677978515625, 0.43091583251953125, 172.67547607421875, 142.419189453125, -0.48218536376953125, -42.921905517578125, -102.69679260253906, 175.6468505859375, 204.4912567138672, 78.23420715332031, 181.49143981933594, -60.25605010986328, -97.09660339355469, -26.994300842285156, 63.002296447753906, 1.1236495971679688, -31.70386505126953, 79.58892822265625, 78.89994049072266, 121.19895935058594, -5.9542236328125, -59.00682067871094, -7.387138366699219, 3.513723373413086, 156.97796630859375, -71.32400512695312, -5.710655212402344, 56.5080680847168, 40.056068420410156, -9.842933654785156, -121.5587158203125, -43.25319290161133, 64.94400024414062, 41.32611083984375, 181.0438995361328, 6.264518737792969, 179.20162963867188, 22.840065002441406, 82.73493957519531, 18.693992614746094, -24.876577377319336, 63.33759307861328, -11.989721298217773, 108.67198181152344, 91.09891510009766, 173.34249877929688, 116.44398498535156, 137.1405792236328, 156.32131958007812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000465.npy"} +{"epoch": 0.7029478458049887, "step": 466, "batch_size": 64, "mean": 37.1757698059082, "std": 86.34699249267578, "min": -253.74468994140625, "p10": -49.89047088623047, "median": 24.060248374938965, "p90": 157.60387268066407, "max": 235.40170288085938, "pos_frac": 0.6875, "sample": [-0.9100265502929688, 147.71939086914062, -50.63720703125, -105.06890869140625, 25.959375381469727, 4.629858016967773, 22.743301391601562, -12.91009521484375, 28.61577606201172, -253.74468994140625, 71.31044006347656, 59.398193359375, 169.03652954101562, -83.55677795410156, 82.25814056396484, -1.1861572265625, 88.530029296875, 235.40170288085938, 38.33369445800781, 198.07717895507812, 74.94412231445312, 14.090522766113281, 158.60748291015625, -0.3059272766113281, -1.113983154296875, 7.311744689941406, 112.54554748535156, -59.80833053588867, 218.3614501953125, 42.2364501953125, -4.242887496948242, 100.61140441894531, -18.518882751464844, 44.69538879394531, 141.7337188720703, 39.51365280151367, 120.45138549804688, 39.34027862548828, -28.693897247314453, 34.16973114013672, -27.011207580566406, -136.36196899414062, -44.64868927001953, -62.03477478027344, 108.75628662109375, 22.287445068359375, 11.991653442382812, 89.08377838134766, 210.66006469726562, -1.0085258483886719, -48.14808654785156, 73.19308471679688, -26.29192352294922, 46.90052795410156, 10.871421813964844, 2.1371707916259766, 12.922086715698242, 16.533430099487305, 25.377195358276367, 155.26211547851562, 180.57562255859375, 13.251567840576172, 13.001380920410156, 32.02074432373047], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000466.npy"} +{"epoch": 0.7044595616024187, "step": 467, "batch_size": 64, "mean": 54.6355094909668, "std": 86.58133697509766, "min": -144.2418670654297, "p10": -31.74634666442871, "median": 29.549095153808594, "p90": 160.14881744384772, "max": 394.6236267089844, "pos_frac": 0.78125, "sample": [2.5370941162109375, 112.00511169433594, 39.344085693359375, 55.33589172363281, 27.105804443359375, 66.91476440429688, -0.01151275634765625, -25.837932586669922, -32.16935348510742, 64.14459991455078, 119.92245483398438, -54.9418830871582, 174.71621704101562, -24.774938583374023, 91.83903503417969, 114.03401947021484, 84.7486343383789, 36.703125, -103.95335388183594, 11.394241333007812, 129.64022827148438, -79.23614501953125, -30.75933074951172, 124.01721954345703, 195.96206665039062, 27.737144470214844, 21.169960021972656, 91.53239440917969, -144.2418670654297, 144.4000244140625, -6.5656890869140625, 56.36842346191406, 10.155431747436523, 26.452789306640625, -0.8539886474609375, 17.120101928710938, 102.74348449707031, 204.53805541992188, 58.13563537597656, 108.4974365234375, 1.187957763671875, -0.3580951690673828, 1.1865158081054688, 19.61747932434082, 6.605878829956055, -40.76515197753906, 142.23434448242188, 3.4568557739257812, 137.2825469970703, 122.30654907226562, 394.6236267089844, 11.948204040527344, 0.8738632202148438, 7.701032638549805, 68.38321685791016, 82.01346588134766, 31.361045837402344, 180.821044921875, 21.85369110107422, 208.04100036621094, -50.842376708984375, 166.89830017089844, 142.95419311523438, 21.41802978515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000467.npy"} +{"epoch": 0.7059712773998488, "step": 468, "batch_size": 64, "mean": 77.71587371826172, "std": 91.20565032958984, "min": -135.1853485107422, "p10": -26.590035438537598, "median": 67.36042785644531, "p90": 198.35744476318362, "max": 230.28839111328125, "pos_frac": 0.828125, "sample": [4.961015701293945, 36.929351806640625, 104.640869140625, 226.56080627441406, 31.02703094482422, -27.34076499938965, 5.199819564819336, 139.741455078125, 152.1722412109375, 49.285545349121094, 107.83518981933594, 204.98880004882812, 193.61399841308594, -135.1853485107422, 23.812728881835938, 57.396331787109375, 59.44701385498047, -22.772491455078125, -121.5177001953125, 116.97544860839844, 173.16883850097656, 114.98312377929688, 156.42626953125, 216.78631591796875, 50.27622985839844, 135.39761352539062, 173.8883056640625, 5.399682998657227, -1.868072509765625, -117.47711944580078, 200.39035034179688, -108.95367431640625, 94.24346923828125, -4.542362213134766, 17.263282775878906, -52.311546325683594, 121.27104949951172, 130.49215698242188, -43.083953857421875, 160.52175903320312, 57.633766174316406, 59.97625732421875, 169.2708740234375, 204.88137817382812, 156.92425537109375, 3.34539794921875, 28.286169052124023, 52.35888671875, 18.106727600097656, 6.941884994506836, 172.64065551757812, 50.57257843017578, 105.12142944335938, 53.075927734375, 230.28839111328125, 102.49942016601562, -24.838333129882812, 212.49169921875, 160.83444213867188, 170.29539489746094, 168.4144287109375, 95.00554656982422, 74.74459838867188, 14.900901794433594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000468.npy"} +{"epoch": 0.7074829931972789, "step": 469, "batch_size": 64, "mean": 67.26615142822266, "std": 77.22006225585938, "min": -102.58847045898438, "p10": -9.595890426635739, "median": 57.748125076293945, "p90": 164.16361083984376, "max": 269.07733154296875, "pos_frac": 0.796875, "sample": [21.0775146484375, 164.688720703125, 93.49693298339844, 116.31456756591797, 16.75055694580078, 6.723529815673828, 46.21440124511719, 113.10738372802734, 62.27437210083008, -102.58847045898438, 161.38136291503906, 70.71253967285156, 133.5289764404297, 2.7860794067382812, -10.954216003417969, 149.6295166015625, 117.0937271118164, 49.82312774658203, 91.67865753173828, 168.89224243164062, 178.84432983398438, 10.750228881835938, 113.16593170166016, 5.90618896484375, 115.09976196289062, -80.29093170166016, 51.17571258544922, 13.56549072265625, -0.6746082305908203, 53.22187805175781, -3.8463897705078125, 0.6647930145263672, 117.3736572265625, 189.85916137695312, 161.34091186523438, -1.715667724609375, 0.11865234375, -20.25853729248047, 162.9383544921875, 134.91387939453125, 170.73001098632812, 80.19535064697266, 29.414249420166016, 118.68282318115234, -4.670280456542969, 0.248443603515625, 108.11618041992188, -0.9136734008789062, 162.69442749023438, 28.742172241210938, -46.023895263671875, -6.426464080810547, 218.42312622070312, 3.048980712890625, 269.07733154296875, 14.208457946777344, 89.24520874023438, 68.67427825927734, 118.45149230957031, -35.237525939941406, 108.08674621582031, 10.995878219604492, -28.230438232421875, 152.71676635742188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000469.npy"} +{"epoch": 0.708994708994709, "step": 470, "batch_size": 64, "mean": 64.09949493408203, "std": 87.95196533203125, "min": -190.42564392089844, "p10": -38.109088516235346, "median": 67.29606246948242, "p90": 179.08680267333986, "max": 220.54074096679688, "pos_frac": 0.765625, "sample": [153.7796630859375, 74.60247039794922, 220.54074096679688, -190.42564392089844, 59.989654541015625, 168.46084594726562, 45.00025939941406, 36.151817321777344, 161.87612915039062, 115.52078247070312, 166.2422332763672, -68.26771545410156, 183.95822143554688, 24.242477416992188, 152.7050018310547, 20.119285583496094, 93.12884521484375, -58.40718078613281, -16.62261962890625, 141.03729248046875, -39.639469146728516, 199.13510131835938, 12.294778823852539, -82.18783569335938, 181.11474609375, 31.287248611450195, 150.29403686523438, 147.3641815185547, 7.257499694824219, -20.977075576782227, 81.24668884277344, 2.3069801330566406, 120.02774047851562, 22.04193115234375, -57.28382873535156, 13.827171325683594, 77.39909362792969, 2.4650630950927734, 85.98995971679688, -21.282325744628906, 212.1492156982422, 174.3549346923828, 170.7515869140625, 11.371009826660156, -34.53820037841797, -25.136856079101562, 21.828035354614258, 149.62103271484375, 90.89915466308594, 126.54296112060547, 102.41004943847656, 184.10134887695312, -34.27629852294922, 112.07212829589844, 24.06853485107422, 121.1467056274414, 82.20637512207031, 95.73419189453125, -7.3548126220703125, -56.796974182128906, 185.81378173828125, 1.3800716400146484, -7.189487457275391, 4.894695281982422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000470.npy"} +{"epoch": 0.7105064247921391, "step": 471, "batch_size": 64, "mean": 73.78404998779297, "std": 89.30802154541016, "min": -174.9926300048828, "p10": -29.013428497314447, "median": 64.36171340942383, "p90": 180.05993957519533, "max": 265.5000305175781, "pos_frac": 0.8125, "sample": [12.175697326660156, 214.50424194335938, 150.4364776611328, 149.5571746826172, 63.16094970703125, -38.26806640625, 161.8546142578125, 64.32438659667969, 169.08180236816406, 205.7900390625, 83.25350189208984, 51.01713562011719, 182.19378662109375, 19.713829040527344, -122.07955932617188, -0.9990139007568359, 64.39904022216797, 185.09649658203125, 155.8892822265625, -79.68478393554688, 33.289913177490234, 54.05403518676758, 139.90011596679688, 62.781402587890625, 149.03274536132812, -174.9926300048828, 83.3663558959961, 100.310546875, 173.18055725097656, 15.160057067871094, 141.88966369628906, 94.10835266113281, 30.080760955810547, 34.97224426269531, 77.06068420410156, 91.53736114501953, 174.41842651367188, -33.86231994628906, 22.717628479003906, 168.027099609375, 21.952232360839844, 3.2493896484375, 174.72601318359375, 184.17840576171875, -8.295347213745117, 13.795303344726562, 44.27754211425781, 106.20494079589844, -32.07971954345703, 116.04417419433594, -21.858749389648438, 175.08096313476562, 64.19856262207031, 17.798965454101562, 145.6162109375, -3.8886756896972656, 18.418853759765625, 108.03163146972656, -115.88481140136719, 265.5000305175781, 24.79620361328125, 74.31170654296875, -3.2358779907226562, 220.79124450683594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000471.npy"} +{"epoch": 0.7120181405895691, "step": 472, "batch_size": 64, "mean": 59.67264175415039, "std": 102.39328002929688, "min": -191.13511657714844, "p10": -67.2498237609863, "median": 49.58000946044922, "p90": 178.844189453125, "max": 362.41644287109375, "pos_frac": 0.75, "sample": [2.5450973510742188, 44.65137481689453, 64.72289276123047, -40.68309020996094, 176.98963928222656, 160.02162170410156, -30.563812255859375, 129.0222930908203, 199.45355224609375, 148.7581787109375, 55.33389663696289, 232.11679077148438, 19.168203353881836, -47.73371887207031, -6.725408554077148, 176.17352294921875, -1.6790409088134766, 75.73102569580078, 177.83787536621094, 37.375640869140625, -80.58399963378906, 42.82432556152344, -23.078022003173828, 169.8427734375, 11.075408935546875, 158.50213623046875, 36.37776184082031, 186.46282958984375, 177.2139129638672, -19.92983627319336, 19.266632080078125, 61.88728332519531, 74.7855453491211, -97.77580261230469, -38.635948181152344, 54.823944091796875, 204.24453735351562, 362.41644287109375, -7.255195617675781, 4.309989929199219, 162.5764617919922, 179.2754669189453, -191.13511657714844, 182.28878784179688, -125.40690612792969, -75.6138687133789, 163.39646911621094, 14.393304824829102, -130.38909912109375, 96.5876235961914, 8.214805603027344, 59.73310852050781, 8.258621215820312, 14.220558166503906, 26.133621215820312, 54.508644104003906, 84.7786865234375, 22.91942596435547, 173.3105010986328, 33.92439270019531, 87.392578125, 59.298728942871094, -113.41830444335938, 154.50958251953125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000472.npy"} +{"epoch": 0.7135298563869993, "step": 473, "batch_size": 64, "mean": 68.46421813964844, "std": 109.30412292480469, "min": -154.26873779296875, "p10": -57.872529602050776, "median": 45.790836334228516, "p90": 224.03772583007813, "max": 316.48736572265625, "pos_frac": 0.734375, "sample": [229.03662109375, 194.87826538085938, 32.302276611328125, -123.5284423828125, -85.52809143066406, 141.13804626464844, 46.03587341308594, 24.077102661132812, 45.545799255371094, 190.89056396484375, 162.7734375, 32.52033996582031, -3.834268569946289, 94.46199035644531, 7.158470153808594, -43.784584045410156, 255.42665100097656, 222.20065307617188, 20.36779022216797, 189.94332885742188, -107.14009094238281, 29.29473114013672, 160.68670654296875, -55.29844665527344, -58.9757080078125, 151.8426055908203, 122.71270751953125, 208.89596557617188, 10.811861038208008, -3.3728103637695312, -14.50946044921875, 5.6702728271484375, -147.85256958007812, -21.502540588378906, -22.11155891418457, 93.96559143066406, 316.48736572265625, 230.884765625, 25.348636627197266, 19.53556251525879, 244.30392456054688, 156.14605712890625, 278.25811767578125, 100.30654907226562, 83.69142150878906, 69.98104858398438, 46.34709930419922, 10.40655517578125, 38.802513122558594, 160.82508850097656, 109.28536987304688, -2.4620895385742188, 96.9769058227539, 90.24646759033203, -20.73955535888672, 96.57178497314453, 224.82504272460938, -115.16166687011719, 12.3363037109375, -39.95587158203125, 22.003456115722656, 124.64468383789062, 170.88433837890625, -154.26873779296875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000473.npy"} +{"epoch": 0.7150415721844293, "step": 474, "batch_size": 64, "mean": 54.56712341308594, "std": 98.79825592041016, "min": -167.77464294433594, "p10": -49.555993652343744, "median": 29.498900413513184, "p90": 190.3882049560547, "max": 265.49017333984375, "pos_frac": 0.703125, "sample": [192.13705444335938, 159.61151123046875, 99.13059997558594, -66.30947875976562, -12.21500015258789, 8.375118255615234, 152.36691284179688, 197.39837646484375, 75.09597778320312, 25.69378662109375, 86.04542541503906, 81.38142395019531, -167.77464294433594, 106.70330810546875, 69.27871704101562, 170.49122619628906, -88.47917938232422, 0.03899383544921875, -41.956748962402344, 28.348129272460938, -52.81281280517578, -17.31732940673828, 154.18162536621094, 36.614280700683594, 116.22305297851562, 23.678144454956055, -0.7830982208251953, -36.37889099121094, -10.077743530273438, -4.296287536621094, 146.02883911132812, 39.021549224853516, -148.30775451660156, 6.391761779785156, -23.50070571899414, 161.56863403320312, 25.13001251220703, 196.87570190429688, 186.30755615234375, 0.44475555419921875, 30.64967155456543, 41.732452392578125, 220.59890747070312, 122.11521911621094, -38.18021011352539, 265.49017333984375, 207.78573608398438, 61.85401916503906, 129.992431640625, -4.526124954223633, 168.44288635253906, 249.81640625, -33.42506408691406, 22.92205047607422, 27.76142120361328, -27.62210464477539, 173.78964233398438, -114.7384033203125, 8.74740982055664, 67.78706359863281, 147.76406860351562, -128.65260314941406, 1.15631103515625, 16.681743621826172], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000474.npy"} +{"epoch": 0.7165532879818595, "step": 475, "batch_size": 64, "mean": 84.86761474609375, "std": 92.22247314453125, "min": -80.70181274414062, "p10": -14.439963912963867, "median": 65.31962203979492, "p90": 196.9603698730469, "max": 275.3047180175781, "pos_frac": 0.8125, "sample": [-13.747446060180664, 6.682529449462891, 10.855476379394531, -3.8956146240234375, 158.7533416748047, 123.7739028930664, 172.03173828125, 193.87222290039062, -9.286432266235352, -39.272804260253906, 154.2091064453125, -80.70181274414062, 188.55032348632812, 275.3047180175781, 15.356195449829102, 11.576980590820312, 142.9739990234375, 156.1609344482422, 8.74300765991211, 133.91348266601562, 54.813987731933594, 23.838699340820312, -14.736757278442383, 33.248191833496094, 140.05630493164062, 8.820011138916016, 30.22417449951172, 208.3171844482422, 130.80889892578125, -13.064628601074219, 195.95672607421875, 179.5509033203125, 175.54415893554688, 197.3905029296875, 50.11134338378906, 2.9009742736816406, 127.26947784423828, 5.456306457519531, 123.87466430664062, 37.1224479675293, 225.058349609375, 145.0135498046875, 17.24008560180664, 32.52740478515625, 148.05796813964844, -57.36514663696289, 26.137676239013672, 85.75169372558594, 268.585205078125, 36.148414611816406, 171.03529357910156, 233.22442626953125, 224.5933837890625, 112.49832916259766, 158.28439331054688, -44.519981384277344, -65.63460540771484, 180.15231323242188, 75.82525634765625, 166.09298706054688, 5.953022003173828, -0.19820404052734375, -57.61009216308594, 41.318416595458984], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000475.npy"} +{"epoch": 0.7180650037792895, "step": 476, "batch_size": 64, "mean": 55.24436950683594, "std": 95.08464813232422, "min": -120.26766967773438, "p10": -53.81904830932616, "median": 47.6953010559082, "p90": 170.87709808349612, "max": 294.89471435546875, "pos_frac": 0.6875, "sample": [200.7034912109375, 54.45559310913086, -20.61867332458496, 74.05021667480469, -44.50984191894531, 46.739166259765625, -34.350921630859375, 173.9147491455078, 294.89471435546875, 44.39973449707031, 245.14227294921875, -2.7975311279296875, 163.78924560546875, 143.44581604003906, 128.4281005859375, 101.32759857177734, 148.5267333984375, 2.9622268676757812, 65.8798599243164, 11.35223388671875, -95.68618774414062, 4.284854888916016, 119.33680725097656, 155.44996643066406, 44.81373596191406, -117.39393615722656, 26.176864624023438, -25.122024536132812, -35.516815185546875, 12.362133026123047, 192.8552703857422, -37.32945251464844, 120.10881042480469, 22.334217071533203, 64.8611068725586, -65.70640563964844, -97.13162231445312, -120.26766967773438, 71.86604309082031, 15.885116577148438, -28.707046508789062, 113.56169128417969, 11.509140014648438, -13.883056640625, 102.20480346679688, 56.714691162109375, 126.26956176757812, -1.7262344360351562, -35.194061279296875, 141.56411743164062, 106.41377258300781, -118.10592651367188, 188.11495971679688, -42.7005615234375, 96.22984313964844, 226.37954711914062, 3.7044544219970703, 48.65143585205078, 161.60232543945312, 123.27703857421875, -30.141740798950195, 152.18690490722656, 151.60696411132812, -57.80870819091797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000476.npy"} +{"epoch": 0.7195767195767195, "step": 477, "batch_size": 64, "mean": 58.888214111328125, "std": 110.43643188476562, "min": -189.42984008789062, "p10": -105.79905014038084, "median": 44.11717224121094, "p90": 189.28507232666016, "max": 275.57220458984375, "pos_frac": 0.765625, "sample": [-135.18663024902344, -89.98275756835938, 137.22573852539062, 39.482261657714844, 3.667816162109375, 171.50991821289062, 1.3650436401367188, 21.9472599029541, 59.70074462890625, 3.473377227783203, 184.2459716796875, 30.1531982421875, -123.6341552734375, -5.169227600097656, 37.68086242675781, 7.396827697753906, -19.635086059570312, 245.19107055664062, 118.29029846191406, -66.94419860839844, 183.28697204589844, 136.1179962158203, 7.9774169921875, 70.1880111694336, 98.91140747070312, -45.816429138183594, -112.57746124267578, 5.731803894042969, 176.84930419921875, 13.630111694335938, -136.88783264160156, 43.17455291748047, 41.372703552246094, 34.90035629272461, -183.3704376220703, -37.69082260131836, -35.8316650390625, 45.059791564941406, 118.54888916015625, 47.42670440673828, 195.46543884277344, -1.4132080078125, 190.21517944335938, 187.1148223876953, 89.98587036132812, 195.22598266601562, -154.8525390625, 180.95437622070312, 128.95611572265625, 29.196380615234375, 275.57220458984375, 123.60379028320312, 17.093263626098633, 169.3866729736328, 205.8860321044922, 72.88768005371094, -189.42984008789062, 227.905029296875, 171.75172424316406, 183.50955200195312, 48.563255310058594, 166.5770263671875, 17.539291381835938, 145.37205505371094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000477.npy"} +{"epoch": 0.7210884353741497, "step": 478, "batch_size": 64, "mean": 48.554412841796875, "std": 94.84188842773438, "min": -152.11273193359375, "p10": -84.85633316040038, "median": 45.8645133972168, "p90": 169.4322723388672, "max": 210.996337890625, "pos_frac": 0.6875, "sample": [-11.850332260131836, 166.24232482910156, 97.2825927734375, 143.79757690429688, 110.53350830078125, -3.8790512084960938, 185.3733367919922, 127.72683715820312, -21.416147232055664, 102.00593566894531, 3.146209716796875, 16.119049072265625, 114.03411865234375, 210.996337890625, -31.72541046142578, 18.459930419921875, -100.75431823730469, 51.7197265625, -16.91497039794922, 66.14146423339844, -39.62249755859375, -29.376779556274414, 155.47071838378906, 121.62623596191406, 157.09146118164062, -101.4800033569336, 137.43902587890625, 126.17422485351562, 84.02154541015625, -152.11273193359375, 56.91905212402344, 6.461658477783203, -143.508544921875, -143.97610473632812, 21.588153839111328, 114.99740600585938, 170.7993927001953, 24.3121337890625, 160.156005859375, 49.218482971191406, 182.07763671875, -0.9788913726806641, -89.52332305908203, 42.51054382324219, 178.68112182617188, 61.48002624511719, -4.787078857421875, 206.0192413330078, 34.919639587402344, -6.045291900634766, 150.9456024169922, 93.53231048583984, -54.126983642578125, 121.33609771728516, 2.6498565673828125, 198.23489379882812, 130.9509735107422, -48.76154327392578, 3.4768600463867188, 28.267623901367188, -73.96669006347656, -138.19918823242188, 67.96471405029297, 17.586824417114258], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000478.npy"} +{"epoch": 0.7226001511715797, "step": 479, "batch_size": 64, "mean": 42.73262023925781, "std": 90.40058135986328, "min": -220.50064086914062, "p10": -54.93957061767578, "median": 38.060020446777344, "p90": 154.3117126464844, "max": 315.57513427734375, "pos_frac": 0.6875, "sample": [11.94887924194336, 38.51045608520508, 95.16943359375, -116.1004638671875, -56.44456481933594, 69.55699920654297, 206.29310607910156, 96.66026306152344, 91.96609497070312, -55.666664123535156, 37.84180450439453, -33.716182708740234, 12.219024658203125, -23.50203514099121, -4.824485778808594, 41.94380187988281, 212.99778747558594, 158.47247314453125, -32.416664123535156, 1.8072471618652344, -47.526615142822266, 25.288753509521484, 315.57513427734375, 184.92466735839844, 38.278236389160156, -93.13650512695312, 23.026214599609375, 38.874053955078125, -82.97417449951172, -53.243019104003906, 0.0034027099609375, 93.11017608642578, -4.654121398925781, 142.48326110839844, 4.187469482421875, 55.46828079223633, -135.44451904296875, -13.142181396484375, 20.74089813232422, 143.49330139160156, 117.7689208984375, -220.50064086914062, -18.408653259277344, 68.98408508300781, 164.33546447753906, 164.43484497070312, 82.15306854248047, -2.471710205078125, 0.9256744384765625, 70.69051361083984, 63.210540771484375, 108.05477142333984, -41.15373229980469, 144.603271484375, -9.15641975402832, 104.35423278808594, 104.9422607421875, 23.552427291870117, 60.45207977294922, 122.95219421386719, 0.8211116790771484, -0.6079864501953125, 86.60238647460938, 130.2997283935547], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000479.npy"} +{"epoch": 0.7241118669690099, "step": 480, "batch_size": 64, "mean": 66.35453796386719, "std": 94.8783950805664, "min": -192.6812744140625, "p10": -34.25903472900391, "median": 72.52432250976562, "p90": 166.75999298095704, "max": 320.0506286621094, "pos_frac": 0.765625, "sample": [98.21495819091797, 3.08563232421875, 164.1909942626953, -131.09475708007812, 123.63172912597656, 23.364110946655273, 141.7499237060547, -192.6812744140625, 12.433197021484375, 320.0506286621094, -5.638603210449219, 78.17318725585938, 162.0216064453125, -15.871284484863281, 75.84451293945312, -25.781936645507812, -42.60247802734375, 140.0928497314453, -32.64337158203125, 3.161327362060547, -99.44541931152344, 144.63229370117188, 35.77887725830078, -91.04100799560547, 180.158203125, 138.78744506835938, 282.4461975097656, 85.48820495605469, 146.9943084716797, 55.375030517578125, 93.59370422363281, 2.30316162109375, 35.42707061767578, 124.2650146484375, 51.746978759765625, 98.62760925292969, 184.7544403076172, 114.08798217773438, -119.24359893798828, 104.23623657226562, 156.40257263183594, 110.35936737060547, 64.48058319091797, 138.9688720703125, 49.30677795410156, 141.57760620117188, 7.7622833251953125, -12.10400390625, 46.3519401550293, 69.20413208007812, -5.91963005065918, -28.376434326171875, 167.86099243164062, 94.08168029785156, 132.52940368652344, 100.5958251953125, 180.14361572265625, 155.49696350097656, 19.796977996826172, -34.95146179199219, 18.471054077148438, 196.218017578125, -11.2421875, 21.001358032226562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000480.npy"} +{"epoch": 0.7256235827664399, "step": 481, "batch_size": 64, "mean": 62.557899475097656, "std": 92.93016815185547, "min": -166.5558624267578, "p10": -38.88188934326171, "median": 51.52293395996094, "p90": 169.7623031616211, "max": 324.60736083984375, "pos_frac": 0.75, "sample": [81.07763671875, 9.887962341308594, 170.99752807617188, 51.529930114746094, -56.553001403808594, 110.95945739746094, 151.5538330078125, 60.489810943603516, -58.29231262207031, -72.2978515625, 116.50234985351562, 65.37959289550781, 152.2276153564453, 86.73863983154297, -2.0555953979492188, 122.83920288085938, 155.24102783203125, 38.66021728515625, 128.35513305664062, 138.15676879882812, -163.2300262451172, -3.969940185546875, 188.82559204101562, 46.76847839355469, -2.1159400939941406, -27.363195419311523, 14.043167114257812, 160.10293579101562, 16.916339874267578, 92.8067626953125, 1.1281604766845703, 166.88011169433594, 14.301361083984375, 10.667236328125, 44.30131530761719, -10.021957397460938, 121.75537872314453, 13.634746551513672, 4.906375885009766, 9.807868957519531, 55.393035888671875, 51.51593780517578, 163.07391357421875, 185.4639892578125, -6.6900177001953125, 196.4130859375, -30.61505126953125, -14.840583801269531, 175.9711151123047, 165.31002807617188, 152.30001831054688, 35.87084197998047, 56.54551696777344, 17.342796325683594, -42.42481994628906, 324.60736083984375, -166.5558624267578, 98.0361557006836, 95.12623596191406, 287.76904296875, 92.24617767333984, 40.399375915527344, -64.5452880859375, -15.550067901611328], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000481.npy"} +{"epoch": 0.72713529856387, "step": 482, "batch_size": 64, "mean": 59.961273193359375, "std": 113.85560607910156, "min": -243.2610626220703, "p10": -72.69690017700195, "median": 40.13429260253906, "p90": 189.40564422607423, "max": 357.9279479980469, "pos_frac": 0.703125, "sample": [-14.329696655273438, -243.2610626220703, -24.18071746826172, 113.12654876708984, 50.704750061035156, 116.5186538696289, 40.82853698730469, -16.560142517089844, 5.998676300048828, 187.88380432128906, 89.404541015625, 171.698974609375, 150.261474609375, 46.680686950683594, 142.01002502441406, 122.49341583251953, 258.24725341796875, 4.044029235839844, -169.48854064941406, 83.35193634033203, 194.05410766601562, -7.517425537109375, 345.4284973144531, -68.04524230957031, -1.4096298217773438, 114.1593017578125, 145.1181640625, 80.65440368652344, -14.516860961914062, 8.325946807861328, 11.923576354980469, 146.85084533691406, -91.52604675292969, 92.94558715820312, 190.057861328125, 161.68922424316406, 80.5964126586914, 30.039188385009766, -4.331912994384766, -58.99981689453125, 357.9279479980469, 104.78091430664062, 31.236366271972656, 18.924835205078125, 8.430442810058594, 168.0624542236328, 25.51673126220703, 8.060327529907227, 300.46136474609375, -97.47370910644531, 99.2171401977539, 39.44004821777344, 84.41729736328125, 30.104339599609375, 140.91949462890625, -0.10369682312011719, -60.57079315185547, 252.00535583496094, -74.69046783447266, -93.55282592773438, 121.70811462402344, -20.32227325439453, -113.266357421875, 35.359230041503906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000482.npy"} +{"epoch": 0.7286470143613001, "step": 483, "batch_size": 64, "mean": 71.90357971191406, "std": 89.99600219726562, "min": -177.4743194580078, "p10": -20.137082672119142, "median": 62.544864654541016, "p90": 185.0389144897461, "max": 244.73916625976562, "pos_frac": 0.78125, "sample": [20.265357971191406, 185.44215393066406, -0.6155967712402344, 88.88710021972656, 149.5706024169922, 162.22422790527344, 147.65235900878906, -43.48002624511719, -19.864227294921875, -17.529407501220703, 68.90164947509766, 154.45419311523438, 152.97393798828125, 155.78990173339844, -44.25873947143555, 147.61819458007812, 77.25001525878906, -60.073875427246094, 5.1688995361328125, 158.68856811523438, 64.63520812988281, 177.07858276367188, 175.48861694335938, 59.97129821777344, 184.0980224609375, 60.45452117919922, 209.37196350097656, -20.25402069091797, -6.55712890625, 73.00668334960938, 95.41522979736328, -139.63424682617188, 178.32980346679688, 4.876432418823242, 4.97735595703125, 244.73916625976562, 15.137603759765625, -177.4743194580078, 41.51783752441406, -21.811378479003906, 53.02741241455078, 31.596031188964844, 189.75820922851562, 69.9578628540039, 2.0793075561523438, 65.54559326171875, 233.50523376464844, 191.1273193359375, 58.80492401123047, 139.3247833251953, 35.920379638671875, 65.35475158691406, 29.694175720214844, 197.07211303710938, -13.146707534790039, 13.94349479675293, 54.02028274536133, 6.616830825805664, 183.47970581054688, 128.7637939453125, 18.670211791992188, -18.97167205810547, -4.111377716064453, 157.36392211914062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000483.npy"} +{"epoch": 0.7301587301587301, "step": 484, "batch_size": 64, "mean": 49.79658508300781, "std": 70.90343475341797, "min": -100.17700958251953, "p10": -35.99320487976074, "median": 42.28712272644043, "p90": 135.8675964355469, "max": 207.78909301757812, "pos_frac": 0.765625, "sample": [32.06707000732422, 51.452178955078125, -0.2710418701171875, 7.742958068847656, 190.54771423339844, 7.47917366027832, 64.26351928710938, -12.95916748046875, 132.70220947265625, -11.933418273925781, 31.954551696777344, -100.17700958251953, 46.53628921508789, 42.96657943725586, 91.91120910644531, 95.79261779785156, -46.13637924194336, -17.415813446044922, 83.66989135742188, 85.8310775756836, 0.8612194061279297, 136.24229431152344, 121.55415344238281, 20.975299835205078, 103.14192962646484, 99.39835357666016, 181.60423278808594, -4.9882354736328125, 94.6300048828125, 5.40330696105957, 31.03317642211914, 32.47740936279297, -5.5516815185546875, -43.365318298339844, 207.78909301757812, -9.53598403930664, 25.067991256713867, 35.423858642578125, 79.09034729003906, 7.5793304443359375, 134.99330139160156, -36.865623474121094, 206.0925750732422, -72.35971069335938, 123.6095962524414, 74.4205551147461, 168.15481567382812, -33.95756149291992, 81.50936889648438, 20.537017822265625, 193.3533477783203, 29.28502655029297, 60.94384765625, 24.392440795898438, -75.61951446533203, -92.72257232666016, 68.48600769042969, 65.40322875976562, 90.74006652832031, 98.8751449584961, 41.607666015625, 69.19314575195312, 46.07316970825195, 5.9808807373046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000484.npy"} +{"epoch": 0.7316704459561603, "step": 485, "batch_size": 64, "mean": 55.39051818847656, "std": 82.30409240722656, "min": -164.33822631835938, "p10": -20.470810127258297, "median": 31.012924194335938, "p90": 177.8616958618164, "max": 272.2115478515625, "pos_frac": 0.734375, "sample": [24.36974334716797, 98.00699615478516, 85.39109802246094, 107.10749816894531, 87.01383972167969, -2.9469375610351562, 5.491823196411133, 10.248250961303711, 64.32896423339844, -54.03363800048828, -110.31593322753906, 27.941253662109375, 178.46243286132812, 168.68746948242188, -6.1510009765625, 195.8256378173828, 10.261959075927734, 166.3396453857422, 223.203369140625, 16.98493003845215, 18.80927085876465, 118.358154296875, -3.0998992919921875, 215.05609130859375, -4.169059753417969, 1.2912101745605469, -164.33822631835938, 87.53297424316406, 63.719581604003906, 73.36605834960938, -23.217674255371094, 0.3379249572753906, 74.9870376586914, 0.7195606231689453, 105.06871032714844, -62.75447082519531, 272.2115478515625, 185.32943725585938, -8.424545288085938, 133.45545959472656, 32.79343032836914, -24.993356704711914, 44.2677001953125, 14.556175231933594, 65.3477554321289, -0.7557086944580078, -5.638853073120117, 172.28211975097656, 99.44720458984375, -9.421188354492188, 29.232418060302734, 40.00035858154297, 100.2859115600586, 176.45997619628906, 61.833335876464844, 99.79904174804688, 70.94612884521484, 178.756591796875, -23.02458953857422, -14.511991500854492, 27.450469970703125, -0.11598587036132812, 25.476882934570312, 4.06256103515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000485.npy"} +{"epoch": 0.7331821617535903, "step": 486, "batch_size": 64, "mean": 50.371673583984375, "std": 103.32962036132812, "min": -168.7650909423828, "p10": -71.03640747070312, "median": 46.44390869140625, "p90": 182.985758972168, "max": 370.6150817871094, "pos_frac": 0.640625, "sample": [14.584159851074219, -12.358139038085938, 251.91986083984375, 10.344491958618164, -14.144134521484375, -3.477001190185547, 40.75120544433594, 370.6150817871094, 23.52318572998047, -3.9100189208984375, -5.421670913696289, 136.86468505859375, 101.74935150146484, 63.27031707763672, 69.47321319580078, 27.399337768554688, -15.95361328125, 186.40484619140625, -1.3582992553710938, 174.28079223632812, 101.62259674072266, 55.08296203613281, -67.96002197265625, -72.3548583984375, 204.4073486328125, -131.08102416992188, 48.36041259765625, -67.0360107421875, 61.83728790283203, -153.2825927734375, 202.16445922851562, 67.64373779296875, 57.55731201171875, -116.62084197998047, 7.469297409057617, 110.90837860107422, 54.30915069580078, 137.10511779785156, -95.34748077392578, 33.15266036987305, -0.046886444091796875, 168.42767333984375, 73.905029296875, 185.09197998046875, 178.0712432861328, -58.278404235839844, 107.28315734863281, 127.01045227050781, 62.2606201171875, 172.13125610351562, 106.69210815429688, -45.51588439941406, 24.867996215820312, 166.32894897460938, -4.635566711425781, -85.47032165527344, -3.1492652893066406, 87.79664611816406, 240.56602478027344, -22.178712844848633, 44.52740478515625, -168.7650909423828, 56.53133010864258, -42.16022491455078], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000486.npy"} +{"epoch": 0.7346938775510204, "step": 487, "batch_size": 64, "mean": 60.003597259521484, "std": 94.11260223388672, "min": -146.46505737304688, "p10": -41.45836982727051, "median": 43.235687255859375, "p90": 176.0797576904297, "max": 388.9510192871094, "pos_frac": 0.734375, "sample": [89.47950744628906, -45.22987365722656, 122.18514251708984, 109.1543960571289, 39.53533935546875, 25.846799850463867, -40.80973815917969, 43.42774200439453, 88.6036148071289, 136.10595703125, -18.096160888671875, -19.887435913085938, 37.06310272216797, -49.03077697753906, -16.42253875732422, 177.2773895263672, 101.0213623046875, 34.619876861572266, 338.2591552734375, 53.28092956542969, -4.246345520019531, 177.17752075195312, 35.99287414550781, 179.15553283691406, 100.09329223632812, -41.73635482788086, 38.049346923828125, -133.16986083984375, 5.558830261230469, 55.084686279296875, 150.8889617919922, 61.069480895996094, 78.56560516357422, -3.3709239959716797, 169.89041137695312, -6.858543395996094, 120.49049377441406, -48.734893798828125, 49.547088623046875, 102.61677551269531, 185.84365844726562, 12.031620025634766, 52.87391662597656, 158.26873779296875, -123.51219177246094, 103.11227416992188, 5.033592224121094, -26.372817993164062, 74.43360137939453, -146.46505737304688, -11.828950881958008, 173.518310546875, 33.942115783691406, 30.139938354492188, 10.242019653320312, 112.64567565917969, 42.45717239379883, 42.93489074707031, -5.412811279296875, 181.2135772705078, 102.2021255493164, 43.04363250732422, 388.9510192871094, 108.48628997802734], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000487.npy"} +{"epoch": 0.7362055933484505, "step": 488, "batch_size": 64, "mean": 67.5914306640625, "std": 87.44241333007812, "min": -143.7299041748047, "p10": -17.755435371398924, "median": 43.627506256103516, "p90": 187.23217926025393, "max": 287.14068603515625, "pos_frac": 0.765625, "sample": [28.908416748046875, 3.0409774780273438, -7.473031997680664, -8.304288864135742, 19.63225555419922, -49.73480224609375, -20.860679626464844, 171.0341796875, 199.8082733154297, 37.48160934448242, 20.869863510131836, 7.4659271240234375, 181.76290893554688, 17.822654724121094, 9.263847351074219, 224.68753051757812, -13.688308715820312, 164.7364501953125, 2.0774307250976562, 62.69480514526367, 112.88443756103516, 47.386329650878906, 7.215309143066406, -15.416366577148438, -15.331947326660156, 60.480979919433594, -67.09916687011719, 183.77505493164062, 11.929229736328125, 182.9531707763672, 39.868682861328125, -50.607421875, -17.485708236694336, 166.5298309326172, 168.3879852294922, 89.85389709472656, 170.11488342285156, -22.883995056152344, 211.9686279296875, 204.85780334472656, 203.36949157714844, 126.92977142333984, 128.24595642089844, 24.998748779296875, 103.22093963623047, 99.91846466064453, -11.484970092773438, 97.26875305175781, -17.87103271484375, 70.95930480957031, 35.92454528808594, 76.38084411621094, -143.7299041748047, 99.27561950683594, 14.34503173828125, 91.02371978759766, 287.14068603515625, 57.236385345458984, 185.10243225097656, 49.08250045776367, 14.114501953125, 30.19390869140625, -4.546684265136719, 188.14492797851562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000488.npy"} +{"epoch": 0.7377173091458806, "step": 489, "batch_size": 64, "mean": 40.00508117675781, "std": 92.93455505371094, "min": -155.2611846923828, "p10": -79.92853469848632, "median": 29.375198364257812, "p90": 161.4538299560547, "max": 241.72943115234375, "pos_frac": 0.640625, "sample": [-145.16905212402344, 133.64031982421875, 30.146774291992188, 140.82562255859375, 130.53053283691406, 165.82095336914062, -49.365692138671875, 137.81085205078125, 52.81130599975586, 228.10003662109375, 95.36141204833984, 18.177146911621094, 80.24288940429688, -86.81307983398438, -5.704902648925781, -70.86009216308594, -26.69280242919922, -16.356220245361328, 126.1368408203125, 48.08885955810547, 185.42691040039062, 93.68533325195312, 116.59264373779297, 18.966197967529297, 104.07501220703125, 136.22705078125, -11.069648742675781, -40.86437225341797, -31.942474365234375, 34.122066497802734, -155.2611846923828, -66.06393432617188, 158.1129150390625, 20.743125915527344, 3.5116424560546875, -16.03350830078125, -29.79631805419922, -2.126222610473633, 162.88565063476562, 115.09210968017578, 36.90472412109375, 99.4866943359375, 9.232490539550781, 241.72943115234375, 57.876869201660156, -96.13984680175781, 178.0626220703125, 15.256973266601562, 93.99498748779297, 108.78126525878906, -144.35345458984375, 14.877677917480469, -17.938045501708984, 9.781278610229492, -10.341598510742188, -133.73880004882812, 143.77548217773438, 42.570457458496094, -83.81501007080078, 70.83322143554688, -51.194549560546875, 171.09255981445312, -8.028352737426758, 28.603622436523438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000489.npy"} +{"epoch": 0.7392290249433107, "step": 490, "batch_size": 64, "mean": 49.74869918823242, "std": 108.31641387939453, "min": -221.72946166992188, "p10": -82.40984802246092, "median": 45.89541435241699, "p90": 188.03148651123047, "max": 257.08648681640625, "pos_frac": 0.65625, "sample": [-28.217910766601562, -17.721176147460938, -221.72946166992188, 9.880897521972656, -12.271913528442383, 82.52072143554688, 38.36277770996094, 156.08741760253906, 202.01589965820312, 251.36129760742188, -154.25411987304688, 188.13551330566406, -178.59890747070312, 10.013776779174805, 38.58332824707031, 103.39672088623047, 136.02493286132812, 98.6042251586914, 215.49667358398438, 21.20862579345703, 14.184165954589844, 183.51043701171875, 141.0059814453125, 187.78875732421875, -87.79161071777344, -37.52239990234375, 174.23841857910156, -2.733631134033203, 48.93024826049805, 31.687049865722656, -135.0029296875, 90.34947204589844, 52.03619384765625, 102.0457763671875, -0.011793136596679688, -15.243423461914062, -25.518287658691406, 191.3179473876953, -102.46568298339844, -16.2535400390625, 105.39923095703125, -67.09133911132812, 76.19994354248047, 118.80231475830078, -0.32056617736816406, 120.6566162109375, 34.662506103515625, 0.8822879791259766, -56.60639190673828, -21.14263916015625, 257.08648681640625, 142.493896484375, -14.73739242553711, 88.7646484375, 223.69813537597656, 102.783935546875, 185.0278778076172, 65.87812042236328, 51.1666259765625, 174.61053466796875, -176.6079559326172, -69.85240173339844, 42.86058044433594, 65.85113525390625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000490.npy"} +{"epoch": 0.7407407407407407, "step": 491, "batch_size": 64, "mean": 53.53771209716797, "std": 85.41658782958984, "min": -176.5256805419922, "p10": -38.986560058593746, "median": 31.83547019958496, "p90": 169.289535522461, "max": 307.83038330078125, "pos_frac": 0.734375, "sample": [118.98402404785156, -28.91534423828125, 105.17718505859375, 27.719940185546875, 152.79714965820312, 82.9896011352539, -2.385416030883789, 107.23876953125, 151.790771484375, 32.83577346801758, 11.976638793945312, -103.69373321533203, 180.40771484375, 30.835166931152344, 155.8636474609375, -60.674949645996094, 10.609783172607422, 118.86087036132812, 12.462200164794922, 89.71832275390625, -41.002532958984375, 137.90457153320312, 176.40142822265625, -6.887302398681641, 48.53888702392578, 150.02993774414062, 11.937583923339844, -16.623428344726562, 1.9516067504882812, 8.889163970947266, 177.5684356689453, 91.17634582519531, -34.282623291015625, 20.53961944580078, 122.4264144897461, 35.04037857055664, 28.92145538330078, 307.83038330078125, 49.98687744140625, -47.0654296875, 175.04348754882812, 17.127731323242188, 15.1983642578125, -14.494226455688477, -3.2254676818847656, 64.2945556640625, -16.021453857421875, -52.396270751953125, 92.55213165283203, 182.0306854248047, 10.219314575195312, 124.85595703125, 212.20787048339844, 155.59996032714844, 16.47617530822754, -12.827484130859375, 37.22967529296875, 45.931495666503906, 72.47332763671875, -176.5256805419922, -59.615509033203125, 6.49083137512207, -19.099506378173828, 135.00778198242188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000491.npy"} +{"epoch": 0.7422524565381708, "step": 492, "batch_size": 64, "mean": 44.18886184692383, "std": 99.9230728149414, "min": -186.6486053466797, "p10": -62.54796371459961, "median": 22.232511520385742, "p90": 186.58772125244144, "max": 260.58441162109375, "pos_frac": 0.671875, "sample": [260.58441162109375, 208.1824951171875, -91.46070861816406, 4.68170166015625, 193.31423950195312, 2.285512924194336, 117.82353210449219, 53.974796295166016, 77.97135925292969, -6.212038040161133, 133.78211975097656, 178.3395538330078, 62.705169677734375, -34.91790008544922, 21.659988403320312, 149.10772705078125, -175.62722778320312, 58.861541748046875, 7.479667663574219, 149.93943786621094, 136.9537353515625, -61.89411163330078, -2.2365875244140625, -15.665428161621094, 4.136375427246094, 80.88189697265625, 91.62689971923828, 215.18014526367188, -62.82818603515625, -27.029258728027344, 171.41891479492188, 16.06169319152832, -34.045501708984375, 76.35517883300781, -6.743921279907227, 16.386367797851562, -186.6486053466797, 210.55218505859375, -110.58135986328125, -7.713706970214844, 141.4893798828125, 5.206230163574219, 82.22322845458984, 6.541088104248047, -42.80186462402344, 125.8169937133789, 30.057567596435547, 52.28596496582031, -52.42664337158203, 126.32329559326172, -172.97744750976562, -36.663307189941406, -10.776702880859375, 135.51963806152344, 190.12265014648438, 22.805034637451172, 124.1636962890625, 78.98941040039062, 88.28514099121094, 9.176132202148438, 3.673276901245117, -100.82455444335938, -47.70716094970703, 192.944091796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000492.npy"} +{"epoch": 0.7437641723356009, "step": 493, "batch_size": 64, "mean": 68.38059997558594, "std": 92.77110290527344, "min": -166.8321533203125, "p10": -41.706488037109374, "median": 55.74586296081543, "p90": 187.7437896728516, "max": 316.4317321777344, "pos_frac": 0.765625, "sample": [7.19927978515625, 14.335277557373047, -19.4920654296875, 147.6092529296875, -23.881935119628906, 52.10504150390625, -140.0821533203125, 26.15005111694336, 8.048662185668945, -14.680412292480469, 56.0682373046875, 190.54837036132812, 146.5859375, 193.08062744140625, 55.42348861694336, -57.6990852355957, 159.05181884765625, -1.5719032287597656, 119.78509521484375, 146.18099975585938, 17.840051651000977, 36.341331481933594, -3.0919742584228516, 51.1492919921875, 56.92351531982422, -37.452484130859375, 134.2649383544922, 9.261154174804688, 195.79100036621094, 125.3639907836914, 93.34095764160156, 175.50254821777344, -65.61181640625, 0.7363090515136719, -61.227867126464844, 116.66149139404297, 177.4718475341797, -43.529632568359375, 160.85430908203125, 5.168832778930664, 225.02630615234375, 117.02003479003906, 115.75547790527344, 316.4317321777344, 72.03519439697266, 199.05348205566406, -48.07704162597656, 175.67303466796875, 133.51260375976562, -8.985359191894531, -10.79412841796875, 152.59466552734375, 61.848411560058594, 14.227035522460938, 200.04470825195312, 119.53996276855469, 52.57048034667969, 47.58551025390625, 99.41204833984375, 181.19976806640625, 15.367378234863281, 58.94850158691406, 42.678306579589844, -166.8321533203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000493.npy"} +{"epoch": 0.745275888133031, "step": 494, "batch_size": 64, "mean": 55.94435119628906, "std": 106.31587219238281, "min": -234.64804077148438, "p10": -67.36024627685546, "median": 50.3101921081543, "p90": 174.6277603149414, "max": 354.1458740234375, "pos_frac": 0.6875, "sample": [125.08760070800781, 37.111175537109375, 62.367759704589844, 46.38294982910156, 170.19839477539062, 9.311264038085938, -36.505653381347656, 141.3534393310547, 119.8974380493164, -69.34733581542969, 19.61280059814453, -69.09337615966797, -7.0012969970703125, 122.45195770263672, 90.56575012207031, 71.90084838867188, 165.3283233642578, 2.5909500122070312, 52.80766677856445, -100.46331787109375, 16.54648208618164, 354.1458740234375, 106.89350891113281, -11.543930053710938, 48.836036682128906, 174.94012451171875, 170.52578735351562, -6.883476257324219, 124.37106323242188, 173.89891052246094, 137.1361083984375, -175.79432678222656, -189.84658813476562, 152.89260864257812, -10.644357681274414, -88.40701293945312, -63.31627655029297, 144.13369750976562, 27.10138702392578, 119.0347900390625, 66.78359985351562, -1.3819904327392578, -234.64804077148438, -5.307369232177734, 34.59835433959961, 58.59912872314453, 218.42921447753906, 4.468622207641602, -44.09735107421875, 42.89288330078125, 190.81094360351562, 51.78434753417969, 42.76222229003906, 248.64016723632812, 75.3318099975586, 93.53961944580078, -17.577880859375, -17.645816802978516, 126.00363159179688, 172.10638427734375, 204.61050415039062, -38.6507568359375, -29.754009246826172, 179.56292724609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000494.npy"} +{"epoch": 0.7467876039304611, "step": 495, "batch_size": 64, "mean": 47.70680618286133, "std": 99.3141098022461, "min": -158.81182861328125, "p10": -60.604605484008786, "median": 24.995448112487793, "p90": 180.06126556396487, "max": 382.7333984375, "pos_frac": 0.65625, "sample": [-85.13935089111328, -68.35063934326172, -158.81182861328125, -132.4112091064453, 156.91845703125, -10.480117797851562, -103.13478088378906, 27.322402954101562, 73.234375, -27.723159790039062, -2.760101318359375, -106.16486358642578, -15.403152465820312, 73.19546508789062, 58.039512634277344, 181.83163452148438, -24.16657257080078, 37.6673583984375, 98.83670806884766, -4.892873764038086, 57.29622268676758, 109.31703186035156, 126.01264953613281, 2.745920181274414, 154.40072631835938, 177.371826171875, -14.480899810791016, 90.21422576904297, 2.876262664794922, 34.62117385864258, 382.7333984375, 10.330408096313477, 17.114356994628906, -62.619510650634766, 24.528310775756836, 25.46258544921875, 0.7598190307617188, 130.26112365722656, 206.91317749023438, 137.87966918945312, -53.91270446777344, -0.3968505859375, 63.36015701293945, 94.53558349609375, 206.38906860351562, 13.978080749511719, 76.02710723876953, -5.743247985839844, -0.5952529907226562, 181.21388244628906, -1.848031997680664, 147.10902404785156, 51.17523956298828, -20.017662048339844, -55.903160095214844, 294.68115234375, 45.449462890625, -5.1989593505859375, 5.714759826660156, 68.29879760742188, 99.98892974853516, 15.932174682617188, 242.93711853027344, 8.715091705322266], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000495.npy"} +{"epoch": 0.7482993197278912, "step": 496, "batch_size": 64, "mean": 62.52857208251953, "std": 113.00833129882812, "min": -134.26559448242188, "p10": -57.4459041595459, "median": 48.58833312988281, "p90": 196.8451568603516, "max": 566.2178955078125, "pos_frac": 0.703125, "sample": [111.16896057128906, 137.57815551757812, 201.67367553710938, 141.42906188964844, -67.85114288330078, 53.65116882324219, 65.51954650878906, 269.9322814941406, 38.27723693847656, 113.17449951171875, -80.87474060058594, 30.789344787597656, 56.23400115966797, 48.940704345703125, 4.81831169128418, -3.2324295043945312, -2.5005226135253906, 30.28655433654785, 129.75167846679688, 56.94866180419922, -47.01837921142578, 566.2178955078125, -3.088542938232422, 184.44143676757812, 64.51817321777344, -134.26559448242188, 295.9919738769531, 162.51858520507812, -2.772510528564453, 223.79574584960938, -57.99950408935547, 14.641651153564453, 181.3908233642578, 185.57861328125, 1.9056854248046875, 3.4135303497314453, -92.85277557373047, -12.048494338989258, 70.08331298828125, 101.00862884521484, 48.2359619140625, 64.0133056640625, 202.22000122070312, 85.0166015625, 119.3727035522461, 44.09403991699219, -35.05755615234375, 78.3630142211914, -17.368865966796875, 6.683696746826172, 208.2762908935547, -129.73983764648438, -40.69377136230469, 4.090932846069336, 127.36203002929688, 136.08518981933594, -6.226829528808594, 127.3603286743164, -56.154170989990234, 9.15570068359375, -75.62911987304688, 65.25878143310547, 4.4132537841796875, -8.478324890136719], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000496.npy"} +{"epoch": 0.7498110355253212, "step": 497, "batch_size": 64, "mean": 64.73158264160156, "std": 90.83746337890625, "min": -175.8621826171875, "p10": -25.742033386230467, "median": 72.4465103149414, "p90": 169.60068664550784, "max": 245.30169677734375, "pos_frac": 0.71875, "sample": [175.78897094726562, 41.167625427246094, 245.30169677734375, 150.10177612304688, 140.40753173828125, 18.135520935058594, -25.635818481445312, -7.2559356689453125, 19.914445877075195, 73.10411071777344, 130.6479949951172, 103.568115234375, 117.64005279541016, 2.5620956420898438, 122.67276000976562, 7.806053161621094, 151.8363037109375, -162.27914428710938, 163.69346618652344, 181.36492919921875, -3.7465057373046875, -1.4274559020996094, -6.245155334472656, -7.554542541503906, 29.607192993164062, -40.81022644042969, -25.677337646484375, 165.3553466796875, 150.3854217529297, 170.80572509765625, -8.803300857543945, 90.01795959472656, 110.07025146484375, 167.3175048828125, -158.59423828125, 147.388427734375, 163.86993408203125, 78.97710418701172, 84.06121826171875, -25.769760131835938, 162.1895294189453, 81.8811264038086, -17.49502944946289, 71.78890991210938, 89.99681091308594, -33.28504943847656, 213.47769165039062, 124.6232681274414, -0.7191314697265625, 38.111427307128906, 55.73441696166992, 63.96551513671875, 50.74809265136719, 107.41571044921875, 39.96208953857422, 218.5430145263672, -175.8621826171875, 5.6923675537109375, -12.19437026977539, 170.57919311523438, 74.06558227539062, 63.40033721923828, -88.23365783691406, 108.66555786132812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000497.npy"} +{"epoch": 0.7513227513227513, "step": 498, "batch_size": 64, "mean": 67.53453063964844, "std": 83.78617858886719, "min": -227.13198852539062, "p10": -25.260644531249998, "median": 54.66725158691406, "p90": 178.54451293945314, "max": 251.9091339111328, "pos_frac": 0.828125, "sample": [-26.276168823242188, 91.84839630126953, 163.09043884277344, 71.23670959472656, 54.60052490234375, -13.529434204101562, 150.39968872070312, 166.48486328125, -11.71072769165039, -50.79534912109375, 156.85531616210938, 54.867252349853516, 70.05096435546875, -23.992332458496094, 143.43670654296875, 77.61949157714844, 12.754226684570312, -29.4271297454834, 53.05414581298828, 129.00169372558594, 251.9091339111328, 49.76068878173828, 172.8566131591797, 36.40461349487305, 46.47724151611328, 89.93132019042969, -32.46007537841797, 163.71664428710938, 149.40103149414062, 41.211631774902344, 186.37571716308594, 159.61524963378906, 1.8496437072753906, 33.62556457519531, 53.78321075439453, -37.9833984375, -8.515892028808594, 68.78211975097656, 2.316312789916992, 4.352350234985352, 99.15260314941406, 180.8877410888672, -227.13198852539062, 110.5042953491211, 79.3482894897461, 48.118568420410156, 0.9340476989746094, 62.773048400878906, 23.102649688720703, 64.90118408203125, 201.66696166992188, 186.12681579589844, 100.9691390991211, 17.78386688232422, 173.0769805908203, 6.991472244262695, 201.0052947998047, 28.557830810546875, 6.409029006958008, 10.936859130859375, 54.733978271484375, -25.80420684814453, 22.39104461669922, 221.79530334472656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000498.npy"} +{"epoch": 0.7528344671201814, "step": 499, "batch_size": 64, "mean": 68.37374877929688, "std": 109.94048309326172, "min": -174.3934783935547, "p10": -81.90595626831053, "median": 78.26710891723633, "p90": 194.13955841064455, "max": 349.34259033203125, "pos_frac": 0.75, "sample": [105.20829010009766, 181.88710021972656, -163.5159912109375, 249.47003173828125, 24.140579223632812, 58.666255950927734, 51.58500671386719, -129.24777221679688, 24.87680435180664, 75.15538024902344, 87.07062530517578, 111.20455932617188, 146.7654266357422, -115.38679504394531, 195.23760986328125, 6.274986267089844, 349.34259033203125, -91.56817626953125, 191.46429443359375, 174.9375762939453, 85.07606506347656, -59.432373046875, -45.1611328125, -87.21561431884766, -58.89855194091797, 108.71881103515625, 83.00027465820312, 191.5774383544922, -59.075714111328125, 94.50745391845703, -22.99264144897461, 24.065441131591797, 125.80149841308594, 141.6816864013672, 77.12142944335938, -29.908050537109375, 21.008575439453125, 137.40008544921875, -0.8043460845947266, 78.43145751953125, 208.42562866210938, 16.207191467285156, 188.72076416015625, 60.40560531616211, -174.3934783935547, 114.83631134033203, 78.1027603149414, 110.29214477539062, 203.71328735351562, 242.00726318359375, 186.03756713867188, 29.54840850830078, 36.91487121582031, -69.51675415039062, -124.23042297363281, 185.57321166992188, 119.99986267089844, 116.26001739501953, -39.49041748046875, 227.06336975097656, 20.368934631347656, 164.87387084960938, 112.5907211303711, 23.139053344726562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000499.npy"} +{"epoch": 0.7543461829176115, "step": 500, "batch_size": 64, "mean": 57.531761169433594, "std": 96.40264129638672, "min": -222.3326416015625, "p10": -86.03459968566892, "median": 61.793128967285156, "p90": 176.6765106201172, "max": 207.7772979736328, "pos_frac": 0.78125, "sample": [-33.721038818359375, 92.78417205810547, 21.859024047851562, 8.209699630737305, 122.70269775390625, 54.07350158691406, 83.90132141113281, 133.76123046875, 79.85296630859375, 185.7258758544922, 54.029541015625, 177.01412963867188, 175.88873291015625, -34.23255157470703, 174.56275939941406, 25.159164428710938, 175.70201110839844, 69.60108947753906, 30.474159240722656, -19.141815185546875, 196.48541259765625, 149.5972442626953, 42.30933380126953, 134.04026794433594, -11.136367797851562, 181.19322204589844, 75.93312072753906, 15.113033294677734, -28.989280700683594, -119.70012664794922, -99.08313751220703, 67.44334411621094, 21.636302947998047, 48.62617492675781, -107.60572814941406, 0.20451927185058594, 64.43710327148438, 182.61842346191406, 180.85498046875, 6.423057556152344, 114.14076232910156, 16.483694076538086, 163.3101806640625, 51.9340705871582, -59.35085678100586, 107.83740997314453, 59.14915466308594, -222.3326416015625, 164.88607788085938, -169.245361328125, 207.7772979736328, -97.47048950195312, 3.6254653930664062, 118.9418716430664, 115.33753967285156, 31.269939422607422, 10.444938659667969, 73.18272399902344, 104.28905487060547, -25.79240608215332, -110.43988800048828, 125.77135467529297, 173.3339080810547, 146.3411865234375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000500.npy"} +{"epoch": 0.7558578987150416, "step": 501, "batch_size": 64, "mean": 53.3382568359375, "std": 68.4932632446289, "min": -144.34959411621094, "p10": -10.779005241394042, "median": 37.62897872924805, "p90": 157.68576202392578, "max": 198.12339782714844, "pos_frac": 0.75, "sample": [25.39356231689453, 158.27157592773438, 15.042098999023438, 46.580448150634766, 99.05815124511719, 116.41231536865234, 7.5235137939453125, 38.14836883544922, 14.290233612060547, 122.53668975830078, 149.40867614746094, 22.55549430847168, 83.22758483886719, 15.669174194335938, -0.9721508026123047, -4.848676681518555, 53.42822265625, 164.10653686523438, -9.699897766113281, -9.376466751098633, 61.891212463378906, -5.78985595703125, -0.27065277099609375, 198.12339782714844, 170.2265625, 141.7750244140625, 126.39028930664062, 184.06851196289062, 29.47665023803711, -8.116828918457031, 38.69995880126953, -52.47589111328125, -4.3780975341796875, 6.169727325439453, 69.8414306640625, 72.18939208984375, 106.14987182617188, -1.5207901000976562, 3.8412437438964844, 68.97653198242188, 37.109588623046875, 146.56341552734375, 19.252925872802734, 84.85655975341797, -11.987586975097656, -144.34959411621094, 35.80803680419922, 156.31886291503906, -55.04557418823242, 68.6421127319336, 54.31005859375, 68.16608428955078, 17.43000030517578, -16.143630981445312, 67.38554382324219, -11.241479873657227, 21.66607666015625, 16.544862747192383, 181.657470703125, 168.4104766845703, 78.60801696777344, 19.68936538696289, 118.07827758789062, -20.104644775390625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000501.npy"} +{"epoch": 0.7573696145124716, "step": 502, "batch_size": 64, "mean": 57.323463439941406, "std": 79.35635375976562, "min": -100.48112487792969, "p10": -37.58397598266601, "median": 52.24411392211914, "p90": 170.45753936767582, "max": 240.1614227294922, "pos_frac": 0.765625, "sample": [-31.019248962402344, 35.07625961303711, 11.090164184570312, -40.397430419921875, 144.04757690429688, 101.42051696777344, 24.34099578857422, 32.457916259765625, -91.78728485107422, 65.59393310546875, 26.943973541259766, 177.33914184570312, -9.184310913085938, -52.35169219970703, 147.69097900390625, 240.1614227294922, 42.30621337890625, -100.48112487792969, -19.603492736816406, 58.09153747558594, 32.04353332519531, -19.63742446899414, 54.122413635253906, 131.47605895996094, 153.44076538085938, 74.42047119140625, 133.20819091796875, -13.228824615478516, 0.2720508575439453, 50.365814208984375, 22.663490295410156, 9.88630485534668, 79.05135345458984, 8.453145980834961, 93.3712158203125, 72.148681640625, 180.69290161132812, 210.21983337402344, -56.269805908203125, 1.9071388244628906, -20.81554412841797, 30.613975524902344, 81.42430877685547, 5.574920654296875, 91.29742431640625, -3.689300537109375, 38.30682373046875, 163.86813354492188, 100.07787322998047, -81.97724914550781, 83.11245727539062, 100.9810791015625, 148.79299926757812, 81.610107421875, 173.96621704101562, -81.62771606445312, 63.20208740234375, 151.71121215820312, -18.022796630859375, 173.2815704345703, 7.760013580322266, 112.94820404052734, 199.88916015625, 86.07250213623047], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000502.npy"} +{"epoch": 0.7588813303099018, "step": 503, "batch_size": 64, "mean": 57.900814056396484, "std": 91.70829772949219, "min": -186.23211669921875, "p10": -44.06630477905273, "median": 44.11880111694336, "p90": 177.58167266845703, "max": 206.59854125976562, "pos_frac": 0.78125, "sample": [144.68902587890625, 4.262432098388672, -29.738433837890625, 42.65967559814453, 107.28714752197266, 36.16956329345703, 206.59854125976562, -186.23211669921875, 3.0137939453125, 117.80807495117188, 110.89938354492188, -9.070480346679688, 32.26844024658203, 180.84959411621094, -37.74711608886719, 90.178466796875, -46.77452850341797, 30.58660888671875, 201.7382049560547, -50.93938446044922, 22.649620056152344, 109.47607421875, 165.82749938964844, 61.47795104980469, 32.136817932128906, 45.57792663574219, 129.1103515625, 191.90347290039062, 5.124958038330078, 146.14981079101562, -17.463375091552734, 61.982666015625, 185.5748748779297, 177.40313720703125, 178.8329620361328, -20.140228271484375, 101.6971206665039, -14.827095031738281, -112.51570129394531, 25.044044494628906, 2.406749725341797, 30.691497802734375, 4.797021865844727, 86.86338806152344, -0.8614921569824219, 15.570480346679688, 58.21900939941406, 177.65818786621094, 115.27283477783203, 11.842132568359375, 172.3194122314453, 162.8688201904297, -142.1398162841797, 8.200271606445312, 163.19168090820312, 126.257080078125, 5.624643325805664, -95.71768951416016, 107.38444519042969, 165.51475524902344, 17.207271575927734, 123.74486541748047, 113.74523162841797, -148.53871154785156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000503.npy"} +{"epoch": 0.7603930461073318, "step": 504, "batch_size": 64, "mean": 76.12149047851562, "std": 81.49816131591797, "min": -114.9020767211914, "p10": -7.228911972045898, "median": 69.15570831298828, "p90": 189.226171875, "max": 269.35430908203125, "pos_frac": 0.828125, "sample": [0.177825927734375, 170.55101013183594, -7.2591094970703125, 115.75118255615234, 210.06932067871094, -14.064697265625, 107.37646484375, 35.25048065185547, 190.76600646972656, 11.373971939086914, 55.709259033203125, 73.91357421875, 7.2930145263671875, 194.01596069335938, 44.79640579223633, 152.4258575439453, 153.56544494628906, -99.63202667236328, 103.4510498046875, 137.15155029296875, -7.158451080322266, 81.97920227050781, 2.6087799072265625, 166.1332244873047, 185.6332244873047, -30.525009155273438, 53.718788146972656, 175.4067840576172, 73.60750579833984, 269.35430908203125, 198.0399169921875, 203.57553100585938, -6.161060333251953, 70.61769104003906, 65.4102783203125, -4.9028167724609375, 6.383049011230469, -113.4452133178711, 164.79727172851562, 67.6937255859375, 153.87911987304688, -7.5508575439453125, -3.937976837158203, 41.69927978515625, 47.034149169921875, 158.0777130126953, 95.19721984863281, 62.33501434326172, 16.899627685546875, 91.38995361328125, 108.56689453125, 65.14488220214844, -114.9020767211914, 129.94851684570312, 108.40309143066406, 32.283470153808594, 17.31709098815918, 84.50288391113281, 113.23843383789062, 38.815589904785156, 9.427865982055664, 203.07583618164062, 98.20938110351562, 57.27123260498047], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000504.npy"} +{"epoch": 0.7619047619047619, "step": 505, "batch_size": 64, "mean": 50.9160270690918, "std": 101.78529357910156, "min": -180.65667724609375, "p10": -58.78641586303711, "median": 30.949562072753906, "p90": 178.29224395751953, "max": 303.61810302734375, "pos_frac": 0.6875, "sample": [116.5496826171875, 2.036113739013672, 71.27162170410156, 27.132564544677734, 0.5601463317871094, 303.61810302734375, -117.645263671875, 254.72364807128906, 148.1339874267578, 176.19180297851562, 178.6647491455078, -15.544235229492188, 48.74658966064453, 11.428184509277344, 24.359466552734375, -34.56427001953125, -16.373443603515625, -11.59054183959961, 117.08049011230469, 13.58322525024414, -86.13168334960938, 160.12721252441406, 135.60525512695312, 36.32631301879883, 98.38526153564453, 234.52865600585938, 38.22032928466797, -57.44340515136719, 31.995346069335938, -0.4278526306152344, -45.9801025390625, -5.736305236816406, 177.42306518554688, -128.7740478515625, 198.810546875, 148.59902954101562, 107.31147003173828, 152.00376892089844, -3.112485885620117, -49.94964599609375, 41.81610107421875, 22.815040588378906, -4.775993347167969, -132.747314453125, 44.44549560546875, 48.13832092285156, 87.6087875366211, -28.13858985900879, 204.7452850341797, -124.12014770507812, -22.985084533691406, 155.33676147460938, 175.05650329589844, 38.51300048828125, 164.5567626953125, 29.903778076171875, 123.33865356445312, 13.752197265625, 12.514320373535156, 189.6603546142578, 17.016515731811523, 2.0503158569335938, -59.36199188232422, -180.65667724609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000505.npy"} +{"epoch": 0.763416477702192, "step": 506, "batch_size": 64, "mean": 54.82719421386719, "std": 98.3857421875, "min": -222.69985961914062, "p10": -45.03932647705078, "median": 56.47887420654297, "p90": 168.73795471191406, "max": 253.1142578125, "pos_frac": 0.734375, "sample": [40.36933135986328, 147.07347106933594, 5.462726593017578, -29.70068359375, 124.35728454589844, 154.6901092529297, 86.38897705078125, -40.64204025268555, 143.30136108398438, -44.790252685546875, 3.030721664428711, 95.62446594238281, 46.096092224121094, 25.96741485595703, 77.714599609375, 106.8721923828125, -170.72195434570312, 223.2087860107422, 249.097900390625, 14.170936584472656, 167.1914520263672, -107.57996368408203, -16.421279907226562, -222.69985961914062, -95.88236236572266, -166.72378540039062, 33.08323669433594, 186.56932067871094, 220.7540283203125, 161.13922119140625, 177.58642578125, -45.14607238769531, 253.1142578125, -16.69091796875, 169.40074157714844, 24.190025329589844, 163.8516387939453, 57.11878204345703, 98.07939910888672, -21.6246337890625, -85.72549438476562, 10.222572326660156, 11.528411865234375, 23.236717224121094, 96.5758056640625, 73.45887756347656, -6.133052825927734, 56.39142608642578, 106.8902587890625, 74.97943878173828, 75.56901550292969, 124.692138671875, -2.4642791748046875, 117.06639099121094, 102.67155456542969, 0.05626678466796875, 13.363883972167969, 126.9536361694336, -16.580650329589844, -9.22011947631836, 56.566322326660156, 142.09689331054688, 109.93205261230469, 29.931304931640625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000506.npy"} +{"epoch": 0.764928193499622, "step": 507, "batch_size": 64, "mean": 60.51799774169922, "std": 104.69632720947266, "min": -161.37460327148438, "p10": -59.034708404541014, "median": 48.7020263671875, "p90": 208.41294860839852, "max": 336.12066650390625, "pos_frac": 0.671875, "sample": [154.64877319335938, -1.1905975341796875, -20.078819274902344, 89.24774169921875, 336.12066650390625, -8.254875183105469, 264.6745300292969, -161.37460327148438, -66.80619812011719, 99.67539978027344, 69.76792907714844, 48.03411865234375, -60.91737365722656, 118.00314331054688, -54.051734924316406, -27.986328125, 65.79168701171875, -30.466262817382812, 174.23800659179688, 25.952190399169922, 51.050689697265625, 49.36993408203125, 159.53646850585938, -33.47770690917969, 190.6676025390625, -6.327104568481445, 51.896278381347656, 222.92581176757812, 82.00579833984375, 7.44000244140625, 57.651824951171875, 9.250518798828125, 272.5665588378906, -20.58509063720703, 174.79629516601562, 106.22847747802734, -46.7535400390625, 169.90028381347656, -71.25006866455078, -11.80615234375, -33.686187744140625, 39.0006103515625, -2.2249832153320312, 134.61376953125, 118.80648803710938, 13.061080932617188, 52.029014587402344, 18.756072998046875, 314.509765625, 221.51214599609375, -66.80201721191406, 87.50015258789062, -54.641822814941406, 4.144294738769531, 102.92230224609375, 1.7234573364257812, 144.79736328125, -71.10728454589844, 40.009193420410156, -106.93775939941406, 24.070159912109375, 216.01809692382812, 79.20010375976562, 165.7635040283203], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000507.npy"} +{"epoch": 0.7664399092970522, "step": 508, "batch_size": 64, "mean": 71.11956787109375, "std": 98.16250610351562, "min": -159.69180297851562, "p10": -39.48687057495117, "median": 59.79829406738281, "p90": 193.4394714355469, "max": 271.54095458984375, "pos_frac": 0.765625, "sample": [137.43655395507812, 22.259780883789062, 134.84657287597656, 12.506866455078125, 36.2725830078125, -41.49322509765625, 230.27511596679688, -7.797084808349609, 127.9244155883789, 191.45965576171875, 247.37010192871094, 158.95413208007812, 22.132217407226562, 0.9499359130859375, 67.00909423828125, 120.88990020751953, -151.22900390625, 50.243865966796875, 52.587493896484375, -46.932437896728516, 24.472640991210938, 34.911865234375, 136.17042541503906, -36.456825256347656, -49.68663787841797, -159.69180297851562, 81.07499694824219, 0.9644184112548828, 271.54095458984375, 89.94746398925781, -40.78546142578125, 244.68492126464844, 84.16288757324219, 73.7882308959961, 126.5904312133789, 120.50497436523438, 87.46278381347656, 111.45230102539062, 179.34237670898438, 15.562034606933594, 4.226615905761719, -28.242469787597656, 161.84988403320312, 175.544921875, -12.124923706054688, -35.79768371582031, 128.7386932373047, 226.47125244140625, 184.93341064453125, 11.931650161743164, 179.32852172851562, -1.3345870971679688, 42.958797454833984, -9.684240341186523, 18.616958618164062, -123.48238372802734, -20.708816528320312, 184.565185546875, 172.37469482421875, 204.044921875, 70.04084014892578, 45.5445556640625, 15.889373779296875, 194.2879638671875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000508.npy"} +{"epoch": 0.7679516250944822, "step": 509, "batch_size": 64, "mean": 53.13042449951172, "std": 92.01817321777344, "min": -155.19024658203125, "p10": -76.79194259643553, "median": 61.03363609313965, "p90": 170.53393859863283, "max": 208.05770874023438, "pos_frac": 0.703125, "sample": [66.39796447753906, -48.6010627746582, 68.88685607910156, 161.44827270507812, 58.20918273925781, -1.522054672241211, 17.48125457763672, -14.131875991821289, -96.3603744506836, 85.31761169433594, 24.04070281982422, 79.50845336914062, -131.15585327148438, 63.858089447021484, 148.92892456054688, -128.36460876464844, 174.79556274414062, 129.17169189453125, -12.06121826171875, 13.77191162109375, 133.6414337158203, -80.0942611694336, 70.46197509765625, -36.911231994628906, 208.05770874023438, 43.85029602050781, -27.74451446533203, 19.670238494873047, 42.799774169921875, -6.3795166015625, 179.00701904296875, 34.43071365356445, 153.62684631347656, 123.90167236328125, 21.940963745117188, -1.9156360626220703, 158.3158721923828, 101.82235717773438, 122.94024658203125, 168.86334228515625, 30.752891540527344, -2.7145538330078125, 180.804443359375, -69.08653259277344, 130.51107788085938, 175.0818634033203, 51.73274230957031, 69.94732666015625, 198.12728881835938, 157.14491271972656, 171.24990844726562, -27.16065216064453, -42.21485137939453, -155.19024658203125, 10.3516845703125, 146.05458068847656, 96.35576629638672, -125.19952392578125, -112.18872833251953, 73.05118560791016, 20.603118896484375, 67.69647979736328, 160.89393615722656, 103.83837890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000509.npy"} +{"epoch": 0.7694633408919124, "step": 510, "batch_size": 64, "mean": 66.6436767578125, "std": 108.83637237548828, "min": -161.00521850585938, "p10": -66.91841354370115, "median": 51.28818130493164, "p90": 215.52996215820312, "max": 319.3110046386719, "pos_frac": 0.75, "sample": [44.50486755371094, 167.47183227539062, 148.64898681640625, 99.12338256835938, -12.35931396484375, -3.08673095703125, 21.277050018310547, 215.32052612304688, 3.3252182006835938, 13.24139404296875, -34.057472229003906, 30.96269989013672, 33.65769577026367, 50.81413269042969, -136.72679138183594, -13.541923522949219, 7.723114013671875, 49.68888854980469, -41.730499267578125, 27.33537483215332, 67.18856811523438, 166.7661590576172, 191.1282501220703, -94.78872680664062, 8.363166809082031, 169.80567932128906, 48.980430603027344, -24.721954345703125, -1.1625785827636719, 138.64520263671875, 68.56890869140625, 102.36105346679688, 267.0406494140625, 85.12415313720703, 19.854671478271484, 134.59356689453125, 79.10686492919922, 243.25350952148438, 52.55821228027344, -28.042236328125, 12.302717208862305, -127.96895599365234, 165.341796875, 64.20343017578125, 241.90884399414062, 23.002098083496094, 111.92803192138672, 231.93746948242188, 319.3110046386719, -77.7132339477539, 51.762229919433594, 62.94175338745117, 169.89883422851562, 135.23941040039062, -108.00320434570312, 8.27933120727539, 215.61972045898438, 214.2772216796875, -14.64129638671875, 110.73889923095703, 307.6284484863281, 69.21330261230469, -127.22331237792969, -161.00521850585938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000510.npy"} +{"epoch": 0.7709750566893424, "step": 511, "batch_size": 64, "mean": 75.91867065429688, "std": 93.7223892211914, "min": -129.55783081054688, "p10": -37.36074447631836, "median": 63.69856071472168, "p90": 190.53603820800782, "max": 230.72006225585938, "pos_frac": 0.796875, "sample": [203.769287109375, 185.76205444335938, 79.23615264892578, 182.7672576904297, 20.17160415649414, -6.553924560546875, 29.633380889892578, 1.1066970825195312, 145.90748596191406, 182.9272003173828, 79.893798828125, -87.87171173095703, 26.461532592773438, 50.498619079589844, 173.11996459960938, 218.82740783691406, 140.8671875, -34.682899475097656, 149.79632568359375, 110.21969604492188, 174.5695343017578, -5.59197998046875, 45.656532287597656, -107.35298919677734, -129.55783081054688, -38.508392333984375, 204.14942932128906, 125.31919860839844, 92.11925506591797, 37.672698974609375, 29.874025344848633, 125.99468994140625, 55.331634521484375, 65.72146606445312, 161.80624389648438, 116.14064025878906, 156.01788330078125, 32.74788284301758, -25.22241973876953, 16.501096725463867, 56.19956970214844, 61.675655364990234, 161.8103485107422, 217.56399536132812, 230.72006225585938, 135.04379272460938, -111.71640014648438, 46.212493896484375, 3.5120677947998047, 177.35443115234375, 37.12287139892578, 1.3084945678710938, 131.75146484375, 134.89279174804688, 13.672264099121094, 60.382164001464844, -80.92239379882812, 223.982421875, 185.1333465576172, 115.26693725585938, 192.58203125, -5.229785919189453, -87.53619384765625, -27.232967376708984], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000511.npy"} +{"epoch": 0.7724867724867724, "step": 512, "batch_size": 64, "mean": 51.556705474853516, "std": 93.05501556396484, "min": -208.38690185546875, "p10": -63.03770065307617, "median": 36.29647445678711, "p90": 171.52483062744145, "max": 198.58180236816406, "pos_frac": 0.703125, "sample": [145.27886962890625, 71.03347778320312, 34.799339294433594, -117.77099609375, -63.71317672729492, 177.59788513183594, 31.222225189208984, 20.82447624206543, 42.371543884277344, 116.289306640625, 142.2420196533203, 197.77256774902344, -208.38690185546875, -61.46158981323242, 38.88004684448242, -23.229248046875, -1.9674301147460938, -9.65207290649414, 157.24375915527344, 2.9395618438720703, 189.677734375, 161.505126953125, 4.926277160644531, 135.2069091796875, -18.295852661132812, 141.00421142578125, -95.42245483398438, 145.87771606445312, -33.683631896972656, 154.65943908691406, 22.346317291259766, 150.76806640625, 143.00209045410156, 5.838216781616211, 126.40211486816406, 29.698135375976562, 5.789276123046875, 110.06661987304688, -1.935262680053711, 174.8892822265625, -13.689834594726562, -114.2734603881836, -8.972677230834961, -25.307113647460938, 65.14633178710938, 198.58180236816406, 31.720603942871094, 32.03901290893555, 37.793609619140625, 11.68832778930664, 164.09214782714844, -4.251411437988281, 24.223800659179688, -125.19952392578125, 52.2161865234375, 125.64640808105469, 177.823486328125, 91.96781158447266, 174.71026611328125, 151.33978271484375, 50.71190643310547, -37.02837371826172, 90.68721771240234, -96.6709976196289], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000512.npy"} +{"epoch": 0.7739984882842026, "step": 513, "batch_size": 64, "mean": 62.23939895629883, "std": 84.5774154663086, "min": -148.52069091796875, "p10": -23.063982772827146, "median": 43.34175109863281, "p90": 189.6516067504883, "max": 304.8028869628906, "pos_frac": 0.8125, "sample": [263.26666259765625, 131.2329864501953, 174.6065216064453, 102.1358642578125, 110.92974090576172, 57.313297271728516, 110.7762680053711, 3.3547096252441406, 1.3999443054199219, -18.09192657470703, 61.41930389404297, -88.41233825683594, 159.1782684326172, 76.81658935546875, 84.77497863769531, 101.1902084350586, -20.685260772705078, 13.775871276855469, 188.6722412109375, 19.765708923339844, 34.73643493652344, 202.381591796875, 107.61014556884766, 63.513309478759766, 197.12173461914062, 14.391365051269531, -25.265975952148438, 93.61773681640625, 24.35319709777832, 78.59127044677734, 26.126014709472656, 61.28976058959961, 107.88481903076172, -148.52069091796875, 59.80883026123047, 23.5729923248291, -40.84490203857422, 113.78054809570312, 304.8028869628906, 23.325000762939453, -0.051303863525390625, -13.395536422729492, 220.92294311523438, 11.070953369140625, 142.82379150390625, 190.0713348388672, 205.15115356445312, 3.8573989868164062, 108.2022705078125, 86.03141784667969, 46.98766326904297, -0.670440673828125, 39.695838928222656, 29.645339965820312, -24.08343505859375, -58.43595886230469, 34.478782653808594, 16.394412994384766, 13.02840805053711, 20.48894691467285, 93.642578125, -57.94017791748047, 8.679855346679688, 11.029865264892578], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000513.npy"} +{"epoch": 0.7755102040816326, "step": 514, "batch_size": 64, "mean": 70.05230712890625, "std": 94.52629852294922, "min": -174.36642456054688, "p10": -44.038043975830064, "median": 76.79988098144531, "p90": 176.53552551269533, "max": 359.14044189453125, "pos_frac": 0.765625, "sample": [6.357282638549805, 79.79766845703125, 104.58659362792969, 105.45149230957031, 93.67900085449219, 75.92916107177734, 145.44747924804688, -19.126693725585938, 53.74322509765625, -13.179767608642578, 46.942020416259766, 184.96090698242188, 103.61428833007812, 68.94857788085938, -0.6382846832275391, 77.4778060913086, -117.5408935546875, 126.3105239868164, 10.140739440917969, 74.43358612060547, -174.36642456054688, 0.17536163330078125, 164.99691772460938, 136.635498046875, 196.39495849609375, -3.9503631591796875, 48.2095947265625, 151.38812255859375, 123.87132263183594, 203.90597534179688, -49.4337158203125, -56.72587585449219, 149.9501495361328, 147.22341918945312, 3.7182693481445312, 78.90320587158203, 113.15341186523438, 154.1563720703125, -6.15826416015625, 93.46342468261719, 52.881568908691406, -52.612548828125, -31.448143005371094, 15.741241455078125, 123.78599548339844, 76.12195587158203, 124.50741577148438, -16.723114013671875, 28.822998046875, 98.59891510009766, -26.57270050048828, 35.63273239135742, 2.1186294555664062, 160.02218627929688, -125.62124633789062, 132.609619140625, 194.0236358642578, 146.90164184570312, 234.48342895507812, 0.7435512542724609, 359.14044189453125, 178.757080078125, -82.76551818847656, 171.35189819335938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000514.npy"} +{"epoch": 0.7770219198790628, "step": 515, "batch_size": 64, "mean": 58.35056686401367, "std": 90.46141815185547, "min": -168.44500732421875, "p10": -54.4922565460205, "median": 50.60700988769531, "p90": 181.1834197998047, "max": 220.88267517089844, "pos_frac": 0.75, "sample": [1.0696372985839844, 104.07550811767578, 40.350486755371094, 41.81720733642578, 220.88267517089844, 153.05532836914062, 14.502254486083984, 169.9599151611328, 11.895118713378906, 178.83343505859375, 48.970359802246094, 53.78827667236328, 89.65048217773438, -26.95127296447754, 102.52740478515625, 39.170501708984375, -75.98031616210938, 195.21937561035156, -95.0361557006836, -45.63970947265625, 85.14569854736328, 0.1041412353515625, -2.948211669921875, 24.325531005859375, -168.44500732421875, 142.68045043945312, 182.0896453857422, 81.00730895996094, -13.666679382324219, -36.642112731933594, 85.56328582763672, 136.83580017089844, 7.222408294677734, 6.560220718383789, 52.24365997314453, 161.31561279296875, -96.2672119140625, 148.84788513183594, -16.815176010131836, 133.4149627685547, -58.28620529174805, 75.86302185058594, 211.7949981689453, -115.46080780029297, 47.335601806640625, 193.17298889160156, 16.56224250793457, -21.49208641052246, 78.42566680908203, 173.10084533691406, 32.49559783935547, 108.90840911865234, 95.9521484375, 190.0534210205078, 205.79640197753906, -40.90414810180664, 121.30704498291016, 4.920139312744141, 179.0688934326172, -60.21160125732422, 54.736961364746094, 105.83749389648438, -2.634275436401367, 3.3605880737304688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000515.npy"} +{"epoch": 0.7785336356764928, "step": 516, "batch_size": 64, "mean": 52.3648681640625, "std": 93.58353424072266, "min": -209.38552856445312, "p10": -61.160953521728516, "median": 60.79200744628906, "p90": 161.3625671386719, "max": 211.51478576660156, "pos_frac": 0.734375, "sample": [150.82894897460938, 194.37684631347656, 116.81422424316406, -69.11009216308594, -58.738067626953125, 22.237857818603516, -42.92591094970703, 102.39674377441406, 162.37933349609375, 107.32643127441406, 66.1007308959961, 46.208335876464844, 164.0289306640625, 211.51478576660156, 13.424274444580078, 3.8651981353759766, 77.5830078125, 152.3201141357422, 200.14366149902344, 118.69569396972656, -62.19933319091797, -185.73854064941406, 64.13847351074219, 107.87947845458984, 156.19256591796875, 71.6373062133789, 141.21926879882812, 14.413459777832031, 145.95712280273438, 125.08150482177734, -209.38552856445312, -0.1740875244140625, 1.0250225067138672, 17.83983612060547, -13.007423400878906, 158.9901123046875, 137.00357055664062, -8.330717086791992, 4.289745330810547, -0.9741859436035156, 116.03477478027344, -149.23532104492188, 107.04527282714844, 176.19064331054688, 39.307098388671875, 40.91156005859375, 144.82330322265625, 17.524059295654297, 57.44554138183594, 88.05781555175781, 5.4045562744140625, 111.96399688720703, 17.691925048828125, -37.30326843261719, -146.54449462890625, 104.70195007324219, -34.791988372802734, 88.47154235839844, -8.540489196777344, 24.385456085205078, 91.68417358398438, -0.6714973449707031, -75.03023529052734, 166.4963836669922], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000516.npy"} +{"epoch": 0.780045351473923, "step": 517, "batch_size": 64, "mean": 43.72069549560547, "std": 87.08187103271484, "min": -118.10006713867188, "p10": -60.69702835083008, "median": 25.615455627441406, "p90": 174.11417083740236, "max": 254.14920043945312, "pos_frac": 0.65625, "sample": [25.681331634521484, -25.95660400390625, -5.544178009033203, 81.78404235839844, -39.039588928222656, 25.549579620361328, -59.46263122558594, 73.25633239746094, 203.72509765625, 39.250675201416016, 10.536514282226562, -16.061546325683594, -63.001922607421875, 18.56529998779297, 21.959228515625, -33.058433532714844, -3.820222854614258, -1.4955978393554688, 60.670372009277344, 7.4070281982421875, 97.41816711425781, -108.14457702636719, 254.14920043945312, 139.9931640625, -118.10006713867188, 50.88860321044922, -13.440887451171875, 81.13553619384766, 43.979644775390625, 141.6785125732422, 51.57697296142578, 159.00440979003906, 12.056215286254883, 58.559486389160156, -41.52154541015625, -66.3813705444336, 16.890701293945312, 153.2081298828125, -19.377702713012695, -60.831077575683594, 74.22303009033203, 178.77822875976562, 245.76327514648438, 29.857807159423828, 96.07160949707031, 152.75186157226562, 21.14620590209961, 75.21653747558594, -100.45134735107422, -20.45446014404297, -60.384246826171875, 93.69912719726562, 17.45294952392578, 175.32632446289062, 213.38052368164062, 176.52780151367188, 52.04722595214844, -14.658008575439453, 34.160400390625, 20.82773208618164, 171.2858123779297, -80.57893371582031, 103.58851623535156, -11.1397705078125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000517.npy"} +{"epoch": 0.781557067271353, "step": 518, "batch_size": 64, "mean": 55.49640655517578, "std": 89.66114044189453, "min": -139.51097106933594, "p10": -53.8123550415039, "median": 36.051185607910156, "p90": 178.4978591918946, "max": 264.9444580078125, "pos_frac": 0.734375, "sample": [97.65383911132812, 2.068756103515625, -2.0206680297851562, 186.83895874023438, -21.32720947265625, 6.569877624511719, 15.272392272949219, 80.33738708496094, -76.13902282714844, 36.398170471191406, 58.18648910522461, -45.138671875, 65.9061050415039, 98.50718688964844, 103.09651947021484, -79.56831359863281, 63.72099304199219, 129.71791076660156, -80.96658325195312, 150.6804962158203, 247.54931640625, -139.51097106933594, 0.30921173095703125, 91.5882568359375, 133.2337188720703, 124.04449462890625, -72.60624694824219, 131.56063842773438, -57.52964782714844, 137.38186645507812, 7.421733856201172, -29.962255477905273, 3.4017162322998047, 108.55641174316406, 42.95893859863281, -1.0568084716796875, 8.673652648925781, -8.56878662109375, 71.21461486816406, 264.9444580078125, 25.259567260742188, 35.704200744628906, 0.9646778106689453, 196.04583740234375, 126.08357238769531, 229.235107421875, -41.574798583984375, 159.03529357910156, 206.04104614257812, -57.80921173095703, -14.46769905090332, -7.747827529907227, 137.06033325195312, 0.810150146484375, 19.834327697753906, 151.40078735351562, 129.27793884277344, 42.44384765625, 4.573843002319336, -5.1605682373046875, 13.965377807617188, 6.106512069702148, 234.74227905273438, 106.54652404785156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000518.npy"} +{"epoch": 0.783068783068783, "step": 519, "batch_size": 64, "mean": 33.876487731933594, "std": 111.0798568725586, "min": -291.819580078125, "p10": -105.81386642456054, "median": 27.730365753173828, "p90": 170.53179779052735, "max": 224.90115356445312, "pos_frac": 0.625, "sample": [-121.52643585205078, 163.58180236816406, 80.377685546875, -184.39576721191406, -64.77049255371094, 164.47103881835938, -7.747531890869141, 224.90115356445312, 12.341018676757812, 133.44482421875, 17.588409423828125, 15.045999526977539, 157.16851806640625, -29.75957489013672, 68.1550064086914, 79.59686279296875, 170.86160278320312, 20.015207290649414, -160.67282104492188, -46.959259033203125, 162.14932250976562, 137.8892364501953, -142.24888610839844, 166.11155700683594, 137.50436401367188, 183.24119567871094, -74.41984558105469, 12.248458862304688, 72.69276428222656, 109.74346923828125, -47.807220458984375, 161.757080078125, 28.102737426757812, -39.654022216796875, 78.61042022705078, -61.022735595703125, -46.07525634765625, 6.856578826904297, 209.6772918701172, -89.42837524414062, 65.22183227539062, 6.62762451171875, 143.58346557617188, 55.79706573486328, 43.360939025878906, -291.819580078125, 51.41558837890625, -27.948226928710938, 43.24151611328125, -98.22403717041016, 169.7622528076172, -54.92572784423828, -109.066650390625, 208.95578002929688, 49.93666076660156, 27.357994079589844, 188.56822204589844, 102.40316009521484, -4.393756866455078, -117.55268096923828, -47.51599884033203, -5.619012832641602, 186.17767333984375, -74.89425659179688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000519.npy"} +{"epoch": 0.7845804988662132, "step": 520, "batch_size": 64, "mean": 49.947235107421875, "std": 85.69355010986328, "min": -127.58589172363281, "p10": -49.14239654541015, "median": 41.075313568115234, "p90": 166.5539108276367, "max": 303.9922180175781, "pos_frac": 0.703125, "sample": [133.7476348876953, -12.025827407836914, -3.6141204833984375, -9.56412124633789, 164.7370147705078, 24.80352783203125, 73.95285034179688, 9.434104919433594, -0.3937873840332031, 303.9922180175781, 136.25343322753906, 17.91485023498535, -5.541839599609375, -50.843231201171875, 82.39230346679688, 60.82215118408203, 17.41595458984375, -45.17378234863281, 10.210453033447266, 167.33258056640625, 190.366943359375, 79.37054443359375, 42.84624481201172, 188.3409423828125, 92.37576293945312, 60.72199249267578, 72.74620056152344, -95.20823669433594, -111.77484893798828, 132.19979858398438, 64.05406188964844, 1.4553298950195312, -7.576316833496094, 24.072669982910156, -1.3035430908203125, -0.7174072265625, 180.63917541503906, 86.22176361083984, 7.0898284912109375, -79.82654571533203, -127.58589172363281, 35.38288879394531, 49.34605407714844, -96.54457092285156, 65.28323364257812, 54.74993896484375, 28.146774291992188, 91.13473510742188, 94.66552734375, 39.37933349609375, 60.50172424316406, 187.74891662597656, 132.90492248535156, 34.83818817138672, 238.0248260498047, 42.77129364013672, 71.57589721679688, 4.6155242919921875, -3.1998634338378906, -1.0770759582519531, -3.4137649536132812, 152.6900177001953, 151.54400634765625, -108.80638122558594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000520.npy"} +{"epoch": 0.7860922146636432, "step": 521, "batch_size": 64, "mean": 73.10690307617188, "std": 87.90787506103516, "min": -163.90066528320312, "p10": -14.786286163330074, "median": 70.09628677368164, "p90": 168.170751953125, "max": 346.0802307128906, "pos_frac": 0.75, "sample": [142.05654907226562, 59.529632568359375, 161.34173583984375, 54.184295654296875, 164.25009155273438, 92.73810577392578, 165.7684326171875, -3.8551712036132812, -4.7822418212890625, 63.915985107421875, 75.25985717773438, -18.579509735107422, 147.32980346679688, 58.343528747558594, 134.61312866210938, 93.37964630126953, 26.81144905090332, 30.418724060058594, -9.467666625976562, 171.91250610351562, -5.591651916503906, 162.855712890625, 46.99726867675781, 15.83941650390625, -8.909624099731445, 112.93502044677734, -91.19966125488281, 156.37103271484375, -7.7750396728515625, 125.49415588378906, 222.33067321777344, 346.0802307128906, -90.49199676513672, 26.139972686767578, -10.599525451660156, -7.105796813964844, 17.81623077392578, 81.20188903808594, 3.5785980224609375, 216.96661376953125, 212.8373260498047, 14.606548309326172, -46.274803161621094, 90.19840240478516, -10.558149337768555, 43.771392822265625, 141.78782653808594, 83.75056457519531, 39.28487777709961, 99.34593200683594, 119.46310424804688, 85.93839263916016, -163.90066528320312, 234.35220336914062, 147.1422119140625, 72.84205627441406, 67.35051727294922, -27.751800537109375, 90.4830322265625, -16.580612182617188, 109.53408813476562, 63.733665466308594, 140.18295288085938, 169.2003173828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000521.npy"} +{"epoch": 0.7876039304610734, "step": 522, "batch_size": 64, "mean": 46.652549743652344, "std": 109.78096771240234, "min": -231.37832641601562, "p10": -89.35727310180661, "median": 41.130836486816406, "p90": 196.0007110595703, "max": 268.4202880859375, "pos_frac": 0.671875, "sample": [-57.24072265625, 79.38826751708984, 5.806367874145508, 74.01608276367188, 93.17314910888672, 170.44667053222656, 42.97834014892578, 211.83306884765625, 164.10415649414062, 39.28821563720703, -154.47056579589844, -122.81929016113281, 65.53689575195312, 200.20669555664062, 38.13665771484375, 152.50454711914062, -64.30977630615234, 70.86358642578125, 132.72352600097656, 24.183744430541992, 194.41404724121094, 4.650554656982422, 44.86609649658203, -231.37832641601562, 254.70877075195312, 4.0355072021484375, 0.6726417541503906, -64.89495086669922, -175.69039916992188, 18.39299201965332, -17.078109741210938, 182.20199584960938, -32.41839599609375, 202.6258544921875, 132.08645629882812, 55.28422546386719, -9.004547119140625, 62.03001403808594, -18.669971466064453, 42.97345733642578, 69.33924865722656, -3.6959304809570312, 8.324958801269531, -29.00788116455078, 103.54765319824219, -0.742218017578125, 136.23672485351562, -174.35501098632812, 196.6807098388672, -47.7779541015625, -9.373222351074219, -128.55934143066406, 140.21145629882812, 268.4202880859375, -7.644195556640625, 17.211936950683594, -99.84112548828125, 235.13392639160156, 131.14015197753906, 117.51049041748047, 9.513528823852539, -31.120098114013672, 96.25279998779297, 172.19876098632812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000522.npy"} +{"epoch": 0.7891156462585034, "step": 523, "batch_size": 64, "mean": 54.024444580078125, "std": 94.30965423583984, "min": -230.0576171875, "p10": -76.20312042236327, "median": 63.158199310302734, "p90": 157.19099578857424, "max": 211.44076538085938, "pos_frac": 0.78125, "sample": [30.194400787353516, 198.36636352539062, 6.206394195556641, -5.6961517333984375, 105.27481842041016, 89.9117202758789, 69.52796936035156, 42.36559295654297, 128.30654907226562, 43.25819396972656, 0.6211414337158203, 100.49617004394531, 181.13619995117188, -133.0716552734375, 76.32868957519531, 49.12117004394531, 99.08631896972656, -9.502752304077148, 48.73277282714844, -136.77517700195312, 15.583892822265625, 161.78634643554688, -44.97477722167969, 64.94915008544922, -95.22357177734375, 147.08999633789062, -41.599708557128906, 14.511333465576172, 14.782020568847656, 132.85902404785156, 38.919189453125, 111.41835021972656, 146.7127685546875, 108.98604583740234, 148.5281524658203, 138.27542114257812, 159.36593627929688, 44.02378845214844, 24.834678649902344, -230.0576171875, 61.36724853515625, -105.17511749267578, 211.44076538085938, 107.70701599121094, 149.2286376953125, -21.483558654785156, 9.416507720947266, 92.7177734375, 115.17085266113281, -70.3517074584961, 207.03346252441406, 55.89167404174805, 123.22906494140625, -78.71086883544922, 152.1161346435547, 126.1782455444336, 78.84283447265625, 189.392578125, 0.9801712036132812, -159.12547302246094, -51.17536163330078, 71.5419921875, 18.286376953125, 128.38629150390625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000523.npy"} +{"epoch": 0.7906273620559335, "step": 524, "batch_size": 64, "mean": 54.84926986694336, "std": 80.42777252197266, "min": -174.33697509765625, "p10": -40.88294067382812, "median": 52.367488861083984, "p90": 163.75638732910159, "max": 235.72769165039062, "pos_frac": 0.765625, "sample": [133.15452575683594, 39.87873840332031, 220.7679443359375, 57.77500534057617, -13.9417724609375, -17.47612762451172, -45.33837127685547, -32.105682373046875, 89.53579711914062, 58.66794204711914, 168.46633911132812, -0.5205764770507812, -62.99562072753906, 55.901092529296875, 45.35899353027344, 192.41287231445312, -138.79583740234375, -44.644622802734375, 25.540897369384766, 129.6918182373047, 142.4734344482422, -174.33697509765625, 146.1124725341797, -0.5214576721191406, 14.967742919921875, 25.47087860107422, 166.98214721679688, 79.70270538330078, 99.53499603271484, 10.9781494140625, -13.739845275878906, 102.46138763427734, 36.06278991699219, 73.69534301757812, 110.44619750976562, 59.04771041870117, 37.653785705566406, 98.53781127929688, 30.222549438476562, -52.218963623046875, 46.491668701171875, -26.896392822265625, 6.929664611816406, 235.72769165039062, 26.94090461730957, 110.5753402709961, 160.50296020507812, 3.016956329345703, 60.7132568359375, 52.577606201171875, 86.76219940185547, 32.80406188964844, 52.157371520996094, 183.13369750976562, 58.6269416809082, 113.43273162841797, 165.0623779296875, 86.28600311279297, -77.60417175292969, 19.327903747558594, 160.70907592773438, -9.690177917480469, 99.16181945800781, 8.737739562988281], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000524.npy"} +{"epoch": 0.7921390778533636, "step": 525, "batch_size": 64, "mean": 45.26337432861328, "std": 89.45649719238281, "min": -165.513671875, "p10": -48.935272979736325, "median": 34.427337646484375, "p90": 167.9815841674805, "max": 298.09075927734375, "pos_frac": 0.65625, "sample": [31.73150634765625, -147.06463623046875, -45.491546630859375, -34.80923080444336, -85.05626678466797, 31.632843017578125, 37.16242218017578, 45.8970947265625, 216.068359375, -20.61431121826172, 91.22509765625, -0.810699462890625, 108.1402816772461, 26.06219482421875, 59.1387939453125, 158.0257568359375, 81.16983795166016, -30.203697204589844, 154.4891815185547, -50.658935546875, 44.41248321533203, -11.846027374267578, 195.22543334960938, 159.5351104736328, -10.864753723144531, 102.5595703125, -26.484512329101562, 104.50639343261719, 51.227882385253906, 92.01203918457031, 17.730026245117188, 159.02008056640625, 30.84984588623047, 98.17803955078125, 86.5194091796875, -27.104507446289062, 41.69034957885742, 5.13922119140625, 298.09075927734375, -10.822389602661133, -37.11570739746094, 59.97315979003906, 7.632335662841797, -165.513671875, -15.088188171386719, 171.9640655517578, 0.2578086853027344, 10.768348693847656, 37.1231689453125, 141.432373046875, -50.411155700683594, 176.47274780273438, 13.207923889160156, -16.072494506835938, 113.14287567138672, 196.62222290039062, -89.07351684570312, 60.500274658203125, 99.01235961914062, 103.99581909179688, -14.775657653808594, 171.60150146484375, -4.145994186401367, -100.26301574707031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000525.npy"} +{"epoch": 0.7936507936507936, "step": 526, "batch_size": 64, "mean": 42.10501480102539, "std": 83.9603500366211, "min": -166.53512573242188, "p10": -52.89489860534667, "median": 43.473833084106445, "p90": 149.9031890869141, "max": 259.94964599609375, "pos_frac": 0.734375, "sample": [203.7025604248047, 10.294078826904297, -27.415903091430664, 8.717817306518555, -67.67635345458984, 10.542716979980469, 5.232746124267578, 193.43299865722656, -154.43028259277344, -99.07624816894531, 30.22418212890625, 69.7620849609375, -110.7418441772461, 22.193145751953125, 117.26126098632812, -21.20368194580078, 77.5596923828125, 132.4221649169922, 24.27306365966797, 111.22999572753906, 57.785675048828125, 171.0377960205078, 36.32661437988281, 114.8863525390625, 151.99188232421875, 9.34360122680664, 62.348915100097656, 88.38109588623047, -34.39479064941406, 145.02957153320312, -5.10304069519043, 66.46855926513672, 65.4063949584961, -28.654890060424805, 154.50286865234375, -4.532381057739258, 81.01946258544922, 33.68402862548828, 42.76451110839844, 27.442222595214844, 81.62419891357422, 54.19314193725586, -2.3549957275390625, 91.73038482666016, 70.82540893554688, -156.7098388671875, -1.7794456481933594, 90.65013885498047, 110.33056640625, -33.620208740234375, 81.95713806152344, 0.028644561767578125, 259.94964599609375, 44.18315505981445, 177.42575073242188, 13.991546630859375, -59.07295608520508, 73.70628356933594, 56.29008483886719, 38.55299377441406, 58.86741638183594, -38.47943115234375, 76.927734375, -166.53512573242188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000526.npy"} +{"epoch": 0.7951625094482238, "step": 527, "batch_size": 64, "mean": 36.07099151611328, "std": 90.61422729492188, "min": -160.79623413085938, "p10": -73.38787536621093, "median": 17.74228286743164, "p90": 171.3644012451172, "max": 223.98361206054688, "pos_frac": 0.640625, "sample": [-5.705652236938477, 16.722976684570312, 35.609535217285156, 96.33859252929688, 20.40167236328125, 2.7563095092773438, 204.10287475585938, 55.3902702331543, 151.45265197753906, 214.86968994140625, 158.74758911132812, -27.76605224609375, 167.36268615722656, 14.060386657714844, 54.9862060546875, -69.92430877685547, 196.45773315429688, 1.0971927642822266, 85.103271484375, -49.865478515625, -98.20310974121094, -74.87226104736328, -33.46998596191406, -84.00996398925781, 91.28318786621094, 14.3636474609375, 223.98361206054688, 56.82420349121094, 21.897686004638672, 13.810333251953125, 94.53872680664062, 17.915924072265625, -40.86067199707031, 67.15798950195312, 20.047367095947266, 185.13919067382812, 47.93224334716797, -14.797607421875, -24.910947799682617, 131.5482635498047, 78.44329071044922, 4.335758209228516, 125.16580200195312, -31.046985626220703, -40.064971923828125, -16.992767333984375, -94.40570068359375, 173.0794219970703, -16.854232788085938, -7.569948196411133, -10.482879638671875, 2.929502487182617, 127.6561279296875, 110.06873321533203, -160.79623413085938, -25.15656280517578, 77.34100341796875, -4.742149353027344, 95.09672546386719, 187.12289428710938, -154.74305725097656, -135.64344787597656, 70.71849060058594, 17.568641662597656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000527.npy"} +{"epoch": 0.7966742252456538, "step": 528, "batch_size": 64, "mean": 40.385128021240234, "std": 99.90628051757812, "min": -214.91409301757812, "p10": -48.12619857788085, "median": 36.10497760772705, "p90": 171.98799896240237, "max": 232.45858764648438, "pos_frac": 0.71875, "sample": [121.92015075683594, -214.91409301757812, 184.616455078125, -6.821199417114258, 53.140663146972656, 119.09066009521484, 63.819339752197266, 7.9836883544921875, 13.693962097167969, -1.4157867431640625, -3.676025390625, -37.428314208984375, 155.4936981201172, -174.71969604492188, -4.483144760131836, -4.350639343261719, 157.01527404785156, 14.134664535522461, 18.258451461791992, -20.808181762695312, -36.88213348388672, 232.45858764648438, 0.10260009765625, -189.98684692382812, 1.4735183715820312, 53.13325500488281, -52.71100616455078, -32.002784729003906, 12.93739128112793, 142.62142944335938, 78.75556945800781, 13.889251708984375, 42.0216178894043, 207.64004516601562, 94.49021911621094, 5.294515609741211, 209.81993103027344, 45.50200653076172, 82.26200866699219, 69.30268859863281, 163.2236328125, 175.74415588378906, 30.188337326049805, 57.41980743408203, -159.87811279296875, 53.13832092285156, 13.006214141845703, 6.657806396484375, 131.52932739257812, 3.6194686889648438, 47.78697204589844, -153.87913513183594, -160.49778747558594, 224.3380126953125, 209.37350463867188, 45.71864700317383, 5.718921661376953, -9.215232849121094, 149.18112182617188, -1.1983165740966797, 108.018798828125, 42.50077819824219, 105.28189849853516, 76.19923400878906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000528.npy"} +{"epoch": 0.7981859410430839, "step": 529, "batch_size": 64, "mean": 84.01304626464844, "std": 88.18578338623047, "min": -151.92562866210938, "p10": -14.383003234863278, "median": 89.1004409790039, "p90": 190.5155258178711, "max": 248.3829345703125, "pos_frac": 0.828125, "sample": [129.42758178710938, -45.922725677490234, 82.04557800292969, 5.85968017578125, 59.58621597290039, 2.2056427001953125, 248.3829345703125, 190.31060791015625, -40.77814865112305, 15.64666748046875, 4.87611198425293, -1.008523941040039, 8.427947998046875, 108.76486206054688, 137.70924377441406, 110.7613296508789, -87.72820281982422, 146.00868225097656, -11.83111572265625, 146.007568359375, 186.90574645996094, -15.476669311523438, -31.058990478515625, 156.52871704101562, 93.56685638427734, 174.34327697753906, -1.6050033569335938, 7.545188903808594, 154.7111358642578, 27.74560546875, 209.54043579101562, 148.83860778808594, 109.00216674804688, 179.19479370117188, 110.57259368896484, 106.83690643310547, 164.8460693359375, 183.3833465576172, 22.16946029663086, 201.266357421875, 150.48904418945312, 166.37374877929688, 224.01844787597656, 31.714767456054688, 96.66292572021484, 170.35166931152344, 62.380950927734375, -2.822193145751953, 80.21041107177734, 35.660888671875, 30.753631591796875, 84.63402557373047, 37.145538330078125, 190.6033477783203, -95.9429931640625, 195.158203125, 71.51566314697266, 184.20542907714844, 107.92234802246094, 81.19825744628906, -151.92562866210938, 16.38800811767578, 8.960609436035156, 203.56991577148438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000529.npy"} +{"epoch": 0.799697656840514, "step": 530, "batch_size": 64, "mean": 51.71576690673828, "std": 84.10457611083984, "min": -135.3158416748047, "p10": -25.109954452514646, "median": 33.61944103240967, "p90": 162.3186248779297, "max": 279.11407470703125, "pos_frac": 0.703125, "sample": [279.11407470703125, 56.60377883911133, 43.294166564941406, -2.664989471435547, 14.260398864746094, -17.931900024414062, 202.38226318359375, -17.385353088378906, 128.95411682128906, 135.07440185546875, 18.598346710205078, 177.43710327148438, -20.275033950805664, 26.289718627929688, 94.72445678710938, 65.48204803466797, 41.92900085449219, 74.40069580078125, 153.41053771972656, 9.170295715332031, 0.7625999450683594, -15.725822448730469, -113.03765869140625, 147.30198669433594, 129.69232177734375, -1.0454158782958984, 97.86491394042969, 60.275699615478516, 27.080963134765625, 174.50885009765625, 29.729469299316406, 21.60497283935547, 205.33856201171875, 239.38082885742188, 41.34492492675781, 31.00057029724121, 46.06999588012695, 106.66414642333984, -84.45097351074219, 12.682323455810547, -9.770462036132812, 99.65739440917969, -20.65032196044922, 63.70060729980469, -71.87390899658203, -23.77257537841797, 160.83958435058594, -18.561019897460938, -135.3158416748047, -16.091033935546875, -7.071168899536133, -57.76282501220703, 162.95249938964844, -25.683116912841797, 158.4485626220703, 50.02165222167969, 123.10133361816406, -27.41656494140625, 36.238311767578125, 12.302169799804688, 149.94558715820312, 53.779296875, 2.6412315368652344, 30.2381591796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000530.npy"} +{"epoch": 0.8012093726379441, "step": 531, "batch_size": 64, "mean": 55.08310317993164, "std": 88.43067169189453, "min": -178.7455291748047, "p10": -38.23912658691406, "median": 43.79004669189453, "p90": 174.0630874633789, "max": 236.3192138671875, "pos_frac": 0.6875, "sample": [-58.595489501953125, 123.69308471679688, 199.25833129882812, 109.67585754394531, 90.4478759765625, 73.99667358398438, 1.8199996948242188, 236.3192138671875, 54.99794006347656, -6.132274627685547, 43.07490539550781, 0.10949516296386719, 214.22702026367188, -6.3549957275390625, 141.05645751953125, 159.94979858398438, -122.05994415283203, -37.66200256347656, 21.715171813964844, 165.0902099609375, 74.22291564941406, 206.8015899658203, -80.61251068115234, -19.75273895263672, -35.04432678222656, 44.50518798828125, 69.4264144897461, 53.708984375, 36.03773498535156, 3.7322540283203125, 55.45677947998047, -14.170068740844727, -3.178060531616211, 12.5357666015625, -178.7455291748047, -6.481487274169922, 72.61372375488281, 140.74017333984375, 25.437728881835938, -38.48646545410156, 40.44319152832031, 69.55635833740234, 174.86456298828125, 168.0252685546875, -85.40846252441406, -50.53734588623047, 172.19297790527344, 165.32888793945312, 79.38885498046875, 29.825927734375, -11.441543579101562, 27.509685516357422, 65.48661804199219, 157.2533416748047, 70.98831176757812, -12.951541900634766, 103.81442260742188, -18.536571502685547, 155.01902770996094, 195.28976440429688, -1.6800308227539062, -0.03399848937988281, 190.46270751953125, 17.082847595214844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000531.npy"} +{"epoch": 0.8027210884353742, "step": 532, "batch_size": 64, "mean": 60.55923080444336, "std": 90.5064468383789, "min": -132.42138671875, "p10": -64.29073791503905, "median": 63.67122840881348, "p90": 187.99888610839844, "max": 233.56578063964844, "pos_frac": 0.734375, "sample": [103.80287170410156, 73.193115234375, 188.828857421875, 188.83572387695312, -52.227508544921875, -15.024711608886719, 114.55286407470703, 186.06228637695312, -2.016284942626953, 136.9163360595703, -75.07463836669922, 119.10420227050781, 147.62986755371094, 32.33917236328125, 64.08840942382812, 39.84968566894531, 63.25404739379883, 106.79350280761719, 18.45033073425293, -109.55885314941406, -42.67906188964844, 12.294069290161133, 160.27015686035156, 52.46851348876953, 16.28143310546875, 79.58953857421875, 101.611083984375, 233.56578063964844, 103.47312927246094, 211.92599487304688, 166.8942413330078, 23.99245834350586, -7.405303955078125, 195.53945922851562, 21.480880737304688, 72.51631164550781, 96.45787048339844, -69.460693359375, 19.100448608398438, 16.530168533325195, -75.69408416748047, -32.59474182128906, 22.943767547607422, -28.97812271118164, 190.05526733398438, 53.61846160888672, 176.95208740234375, -51.73839569091797, 53.387359619140625, 133.0032196044922, 114.43232727050781, 101.5550308227539, -15.850440979003906, 192.1630096435547, -132.42138671875, 101.01051330566406, -116.34937286376953, 115.41510009765625, 157.9520721435547, -102.09835052490234, 3.198770523071289, -17.113428115844727, 108.84580993652344, 129.85061645507812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000532.npy"} +{"epoch": 0.8042328042328042, "step": 533, "batch_size": 64, "mean": 60.84646987915039, "std": 88.75458526611328, "min": -174.4671173095703, "p10": -33.995217514038075, "median": 46.62698745727539, "p90": 170.71415863037114, "max": 265.113037109375, "pos_frac": 0.765625, "sample": [71.08069610595703, 152.54637145996094, 27.292274475097656, 52.79322814941406, 97.14797973632812, 80.21031951904297, 10.753089904785156, -15.802677154541016, 158.49147033691406, 114.60816955566406, -45.753570556640625, 3.022136688232422, 0.4594268798828125, -1.7444438934326172, 104.16783142089844, 265.113037109375, 17.06241798400879, 139.00204467773438, -55.82757568359375, -7.822929382324219, 14.405189514160156, 2.471902847290039, 101.47312927246094, 16.866348266601562, -64.57918548583984, 121.9556655883789, 117.71696472167969, 46.781585693359375, 20.335952758789062, -153.94895935058594, -22.518524169921875, -6.840595245361328, 175.95245361328125, 146.50344848632812, -5.687784194946289, 214.57264709472656, 26.965576171875, 253.82485961914062, 45.62165832519531, -37.36281204223633, 38.646240234375, 129.81439208984375, 118.35211181640625, 127.07946014404297, 149.7432098388672, 182.3734130859375, 58.94935607910156, -84.36186218261719, 11.370574951171875, -7.36151123046875, 7.42976188659668, 128.6210174560547, 128.90541076660156, -26.137496948242188, 2.8949527740478516, 46.472389221191406, 150.72886657714844, 93.427490234375, 34.527198791503906, 177.31295776367188, 144.98617553710938, 196.1809539794922, -174.4671173095703, 77.37734985351562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000533.npy"} +{"epoch": 0.8057445200302343, "step": 534, "batch_size": 64, "mean": 56.857086181640625, "std": 98.99298858642578, "min": -182.3823699951172, "p10": -60.18272933959961, "median": 50.15578269958496, "p90": 179.0455062866211, "max": 294.24542236328125, "pos_frac": 0.65625, "sample": [35.25263214111328, -13.548768997192383, 149.57989501953125, 43.07742691040039, -22.318693161010742, 55.795814514160156, -5.5263214111328125, -182.3823699951172, 97.1697998046875, -82.94096374511719, -7.266809463500977, 30.440521240234375, 163.64898681640625, 154.64779663085938, -60.373939514160156, 294.24542236328125, 104.04022979736328, 48.79379653930664, 66.34770202636719, -26.021270751953125, 153.45223999023438, 226.00889587402344, 101.11468505859375, 73.27166748046875, -11.168586730957031, -127.20938110351562, -154.51943969726562, -9.069448471069336, 204.09786987304688, 25.239173889160156, 85.24055480957031, -62.68330001831055, 202.9208221435547, 178.1875, 179.41322326660156, 104.94232177734375, -66.62974548339844, 51.51776885986328, 252.0957794189453, 173.37596130371094, 104.23094177246094, 171.93832397460938, -40.951133728027344, 17.3316650390625, 148.66221618652344, 88.77508544921875, -8.210128784179688, 109.67686462402344, 17.259376525878906, -28.341079711914062, 11.448593139648438, 190.2874298095703, 83.13347625732422, -20.808666229248047, -26.001907348632812, 15.053611755371094, 115.74018096923828, -59.736572265625, 95.43965148925781, -22.215652465820312, 75.07990264892578, 48.66504669189453, 167.49468994140625, -37.35822677612305], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000534.npy"} +{"epoch": 0.8072562358276644, "step": 535, "batch_size": 64, "mean": 48.91130065917969, "std": 92.8858642578125, "min": -191.1544189453125, "p10": -44.19939918518066, "median": 36.85749626159668, "p90": 160.75220031738286, "max": 255.2859649658203, "pos_frac": 0.640625, "sample": [35.19694519042969, -39.81454849243164, 115.85636901855469, 53.561458587646484, 15.637382507324219, 35.37856674194336, -164.13571166992188, -41.771976470947266, -102.86324310302734, 40.887725830078125, 152.68038940429688, -75.01799011230469, 38.507774353027344, 120.8679428100586, -8.800758361816406, -6.848594665527344, -36.8409423828125, 41.96154022216797, -0.5847797393798828, -29.466567993164062, 35.37489318847656, 94.18412780761719, 144.1533966064453, -49.41973876953125, 146.47341918945312, 14.480384826660156, 199.71136474609375, -105.28253173828125, -45.239723205566406, 13.390657424926758, 111.96546936035156, 175.84567260742188, 95.84893798828125, -9.599891662597656, 93.33660888671875, 146.2490997314453, 36.146728515625, 255.2859649658203, -25.3212890625, 121.09380340576172, 53.657325744628906, -20.76866912841797, 240.15231323242188, 116.01626586914062, -11.918502807617188, -191.1544189453125, -2.757568359375, 130.36798095703125, -7.664646148681641, 80.14127349853516, 99.4337387084961, -29.016525268554688, 37.56826400756836, 201.40780639648438, 13.020622253417969, 120.52978515625, 11.955093383789062, 135.9161376953125, 133.7050018310547, -18.91082763671875, 69.30743408203125, -13.669151306152344, 225.72491455078125, 164.2115478515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000535.npy"} +{"epoch": 0.8087679516250945, "step": 536, "batch_size": 64, "mean": 75.20512390136719, "std": 79.35576629638672, "min": -69.44502258300781, "p10": -6.947177696228025, "median": 67.15356063842773, "p90": 190.6714294433594, "max": 256.43212890625, "pos_frac": 0.828125, "sample": [72.20932006835938, 17.204811096191406, -35.93213653564453, 174.43951416015625, 155.5394287109375, 29.884063720703125, -8.850433349609375, -19.515701293945312, 72.63629150390625, 13.918840408325195, -69.44502258300781, 85.05571746826172, 91.03754425048828, 197.33709716796875, 155.94032287597656, 132.12387084960938, 89.60443115234375, 180.46511840820312, 256.43212890625, 73.08130645751953, 21.240102767944336, 8.294282913208008, 174.5284423828125, 142.93606567382812, 32.46440124511719, 193.40609741210938, 113.62467956542969, 4.79881477355957, 113.1567611694336, 87.10162353515625, 197.8033447265625, -5.024921417236328, 2.3847618103027344, 70.70248413085938, -20.878387451171875, 5.939544677734375, 178.093994140625, 12.213729858398438, 90.74967956542969, 4.196317672729492, 188.52255249023438, 181.23631286621094, 68.41571807861328, -4.540491104125977, 20.550800323486328, 34.48155212402344, 14.362022399902344, 60.63738250732422, 65.89140319824219, 214.99227905273438, -3.237516403198242, 161.8914031982422, 51.540008544921875, 191.59237670898438, 106.76612854003906, 43.53173828125, 20.834999084472656, 226.4059600830078, -7.771001815795898, -54.53404235839844, 28.55269432067871, 111.71638488769531, -2.08953857421875, 2.4802398681640625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000536.npy"} +{"epoch": 0.8102796674225246, "step": 537, "batch_size": 64, "mean": 60.637962341308594, "std": 95.52462768554688, "min": -113.46844482421875, "p10": -71.9122589111328, "median": 65.16035079956055, "p90": 181.37796020507812, "max": 276.40350341796875, "pos_frac": 0.671875, "sample": [115.30648803710938, 78.83849334716797, -6.2103271484375, 133.58554077148438, 238.11749267578125, 161.33935546875, 96.83364868164062, -1.055654525756836, 138.21185302734375, 77.82695007324219, 76.61896514892578, 1.2152576446533203, 180.7606964111328, 183.99050903320312, 123.84681701660156, 172.20986938476562, 169.81698608398438, 8.467428207397461, -10.269119262695312, -15.130258560180664, -2.532032012939453, 64.2305908203125, 40.52119445800781, 7.083488464355469, -8.755815505981445, 204.7957763671875, 92.98977661132812, 15.584205627441406, -79.32715606689453, -10.898359298706055, 66.0901107788086, 27.743534088134766, 104.74401092529297, -36.739356994628906, -81.72270965576172, 16.501354217529297, 253.37521362304688, 106.6793212890625, 2.824249267578125, -16.215770721435547, 20.79590606689453, 177.74757385253906, -95.74607849121094, 72.96214294433594, -32.256317138671875, -34.00719451904297, 128.02459716796875, -32.21417236328125, 71.03762817382812, 80.10609436035156, -3.232940673828125, 123.14244079589844, -54.61083221435547, 159.76727294921875, 181.6425018310547, 276.40350341796875, -98.74899291992188, 133.0848846435547, -82.0035629272461, 47.34733581542969, 169.634521484375, 190.98822021484375, -113.46844482421875, -96.85904693603516], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000537.npy"} +{"epoch": 0.8117913832199547, "step": 538, "batch_size": 64, "mean": 66.09611511230469, "std": 86.48246002197266, "min": -165.93386840820312, "p10": -31.06011657714843, "median": 57.271568298339844, "p90": 169.69999389648441, "max": 314.76617431640625, "pos_frac": 0.8125, "sample": [-47.754615783691406, 141.1611328125, 39.08380889892578, 18.73159408569336, 71.78398132324219, -165.93386840820312, 58.48612594604492, -25.614715576171875, 85.19850158691406, 133.9042510986328, 65.65178680419922, 172.6434326171875, 8.45538330078125, 149.27005004882812, 45.90386962890625, 45.270263671875, 144.67042541503906, 162.83197021484375, 20.843284606933594, 56.057010650634766, 54.08978271484375, 2.1194076538085938, 184.770751953125, 127.07846069335938, 29.131515502929688, -36.84695053100586, 136.8670196533203, -12.715309143066406, 214.5799560546875, 21.670372009277344, -20.13653564453125, 135.96658325195312, -24.30414581298828, 10.78997802734375, 4.695655822753906, 46.689537048339844, 46.509674072265625, 80.56640625, 1.7577362060546875, 55.726806640625, 248.8184814453125, -33.39385986328125, 196.74325561523438, 78.91278076171875, -71.3759994506836, 97.47317504882812, -43.96788787841797, 152.34295654296875, 130.64393615722656, 314.76617431640625, 158.3127899169922, 61.122406005859375, 116.97868347167969, -110.71539306640625, 109.13714599609375, 71.17347717285156, 205.951904296875, 0.75531005859375, 110.48587036132812, 12.45941162109375, 30.829811096191406, 74.97344970703125, 94.82384490966797, -16.750499725341797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000538.npy"} +{"epoch": 0.8133030990173847, "step": 539, "batch_size": 64, "mean": 49.074729919433594, "std": 82.52106475830078, "min": -118.71429443359375, "p10": -24.03227996826172, "median": 28.213669776916504, "p90": 173.57068481445316, "max": 265.18292236328125, "pos_frac": 0.75, "sample": [70.45764923095703, 99.97979736328125, 5.616493225097656, 194.26849365234375, 31.428274154663086, -21.802635192871094, 176.49832153320312, 142.19927978515625, 100.77011108398438, 11.059738159179688, 61.68623352050781, 18.343231201171875, 46.25738525390625, 7.4081573486328125, -22.591659545898438, -9.574142456054688, -14.490463256835938, -2.4610366821289062, 194.19534301757812, 83.94219207763672, 11.892427444458008, -44.82741928100586, 49.46641540527344, -99.01370239257812, 7.551109313964844, -118.71429443359375, -6.208028793334961, 113.18417358398438, 239.99725341796875, 49.95538330078125, 23.53533172607422, -4.080841064453125, -25.119110107421875, 16.5750732421875, 221.9241943359375, 51.428733825683594, 11.066749572753906, 29.099212646484375, 166.73953247070312, 17.251718521118164, -20.094802856445312, 48.12591552734375, 66.23599243164062, 16.93437957763672, 107.29623413085938, 50.10249328613281, -100.01287078857422, 127.6805648803711, 13.395927429199219, -24.649688720703125, 157.90647888183594, 42.21916961669922, 18.21927261352539, -17.859947204589844, 141.7816162109375, 71.46844482421875, 4.7476043701171875, 30.407291412353516, -103.08233642578125, 118.9885482788086, 27.328126907348633, 200.51547241210938, 265.18292236328125, 13.051498413085938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000539.npy"} +{"epoch": 0.8148148148148148, "step": 540, "batch_size": 64, "mean": 72.91771697998047, "std": 86.478271484375, "min": -131.7114715576172, "p10": -23.716108131408685, "median": 63.4570255279541, "p90": 181.22172546386722, "max": 283.1352233886719, "pos_frac": 0.8125, "sample": [-16.87933349609375, 0.0274505615234375, 283.1352233886719, 174.890869140625, 5.993513107299805, -131.7114715576172, 106.69642639160156, 104.22709655761719, 70.27849578857422, 5.334598541259766, 56.635555267333984, 145.36605834960938, 174.0540313720703, 37.14159393310547, -76.44994354248047, 38.53993225097656, 161.55596923828125, 109.97493743896484, 12.873546600341797, 99.92913818359375, 37.76861572265625, -73.41175842285156, 83.52230834960938, 43.82713317871094, 222.81024169921875, 146.69732666015625, -26.646154403686523, 99.11337280273438, -61.509033203125, 27.178726196289062, 79.71652221679688, 183.032958984375, 170.0599365234375, 87.38372802734375, 176.99551391601562, -3.683307647705078, -12.665000915527344, 162.3819580078125, -39.44866943359375, 2.442209243774414, -1.0009498596191406, 166.2766876220703, 159.79962158203125, 194.94390869140625, 190.32447814941406, 28.142776489257812, 171.8388671875, 48.80851364135742, 79.64738464355469, -68.89481353759766, 50.163780212402344, 124.17929077148438, 47.74737548828125, 4.353813171386719, 2.6016616821289062, 56.224090576171875, -13.348152160644531, 216.0159454345703, 28.352951049804688, 89.76676940917969, 155.30322265625, 10.93171501159668, 73.28495788574219, 184.0896453857422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000540.npy"} +{"epoch": 0.8163265306122449, "step": 541, "batch_size": 64, "mean": 65.40504455566406, "std": 81.36196899414062, "min": -136.0809326171875, "p10": -25.43951396942138, "median": 57.731651306152344, "p90": 168.80260009765627, "max": 202.23300170898438, "pos_frac": 0.734375, "sample": [155.54342651367188, 50.701812744140625, 103.85636901855469, 176.665283203125, -10.812545776367188, 143.68191528320312, -7.266845703125, 143.85931396484375, 165.7830810546875, 7.461578369140625, -8.990921020507812, -62.145782470703125, 14.2191162109375, 112.54581451416016, -5.8404693603515625, -136.0809326171875, 147.01071166992188, 170.0966796875, 46.49977111816406, 174.50379943847656, -56.200050354003906, 46.70957946777344, 184.43959045410156, 161.31060791015625, 161.238037109375, 96.26234436035156, 160.85812377929688, -15.959732055664062, -63.24092483520508, -4.381893157958984, 109.26667022705078, 27.181154251098633, 180.97637939453125, 202.23300170898438, 11.480857849121094, 124.49403381347656, 111.04806518554688, -27.524322509765625, 111.74028015136719, -1.893686294555664, 2.3120059967041016, -64.38972473144531, 111.73797607421875, 150.86083984375, 42.10747528076172, 96.13005065917969, 135.813232421875, 134.84063720703125, -76.71195983886719, 7.687469482421875, 2.1169185638427734, 146.8883056640625, 70.05931854248047, 55.53224182128906, -16.792922973632812, 3.4752197265625, 59.931060791015625, 66.10252380371094, -20.574960708618164, 31.815574645996094, 115.85533142089844, -9.89592170715332, 184.23255920410156, 55.46027374267578], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000541.npy"} +{"epoch": 0.817838246409675, "step": 542, "batch_size": 64, "mean": 73.235107421875, "std": 96.0574951171875, "min": -181.18199157714844, "p10": -65.97272109985352, "median": 63.180240631103516, "p90": 184.84061279296876, "max": 257.0937194824219, "pos_frac": 0.796875, "sample": [141.50074768066406, 121.51751708984375, 12.668800354003906, 225.28839111328125, 58.60334777832031, 17.10943603515625, 65.62432861328125, 66.44371032714844, 115.04904174804688, 71.1288833618164, 49.40359115600586, -10.251518249511719, -67.45165252685547, 174.73001098632812, 45.528289794921875, 150.71725463867188, 59.41362762451172, 257.0937194824219, -115.16636657714844, 176.50543212890625, 175.83175659179688, 210.74160766601562, 47.1302490234375, 1.0007553100585938, -116.89726257324219, -181.18199157714844, 119.63308715820312, 54.612030029296875, 121.8965072631836, -62.521881103515625, 171.7796630859375, 184.5638427734375, 1.7075252532958984, 182.1256103515625, -77.35761260986328, -9.238239288330078, -1.579742431640625, 99.41780090332031, -1.1910438537597656, 126.95964813232422, 17.7572021484375, 32.49707794189453, 184.959228515625, -69.08363342285156, 83.31803894042969, 4.516578674316406, 175.45413208007812, 31.225791931152344, 53.401161193847656, 210.42791748046875, 143.25930786132812, 201.457763671875, -83.09930419921875, 39.746742248535156, -6.290605545043945, 6.554645538330078, 20.736953735351562, 179.683837890625, 151.38134765625, 60.73615264892578, 88.1256103515625, 212.99530029296875, 102.35588836669922, 182.041015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000542.npy"} +{"epoch": 0.8193499622071051, "step": 543, "batch_size": 64, "mean": 67.49037170410156, "std": 87.02543640136719, "min": -196.59771728515625, "p10": -17.096081924438476, "median": 63.13206481933594, "p90": 178.5245101928711, "max": 219.83261108398438, "pos_frac": 0.796875, "sample": [29.581863403320312, 27.951473236083984, 83.77229309082031, 0.05921745300292969, 96.14213562011719, 26.453075408935547, 124.70220947265625, 163.57455444335938, -156.48313903808594, 195.13800048828125, 67.866455078125, 150.40069580078125, 142.83071899414062, 164.57554626464844, 214.8912353515625, 92.75730895996094, 172.91189575195312, -84.52857971191406, 64.23253631591797, 184.41470336914062, 19.654333114624023, -1.4250259399414062, 5.000041961669922, 48.326812744140625, 9.676280975341797, 168.08978271484375, -196.59771728515625, 1.357147216796875, -4.049571990966797, -57.88911437988281, 34.39427185058594, 166.64035034179688, 185.98532104492188, 29.835453033447266, 159.2401123046875, 90.97142028808594, 180.92991638183594, -1.737588882446289, -34.64366912841797, -15.127761840820312, 88.81666564941406, 95.76213836669922, 149.43069458007812, 36.9808349609375, 167.61798095703125, 37.56867218017578, 104.31151580810547, 219.83261108398438, 8.514324188232422, 68.13256072998047, -17.939647674560547, 62.031593322753906, 61.14996337890625, -1.6339797973632812, 100.25785827636719, 39.977294921875, 94.79682159423828, 19.47163200378418, 12.576507568359375, -38.03646469116211, 141.7409210205078, 215.861328125, -3.939990997314453, 106.22662353515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000543.npy"} +{"epoch": 0.8208616780045351, "step": 544, "batch_size": 64, "mean": 77.56633758544922, "std": 98.59868621826172, "min": -134.3792266845703, "p10": -48.17697677612304, "median": 71.09458923339844, "p90": 195.68131713867191, "max": 276.55072021484375, "pos_frac": 0.796875, "sample": [18.816986083984375, -97.20207214355469, 71.630615234375, 25.121065139770508, 131.75430297851562, 57.860992431640625, -94.09847259521484, 40.760963439941406, 0.60601806640625, 31.25316619873047, 27.9200439453125, 70.55856323242188, -8.24078369140625, 183.58840942382812, 102.87516021728516, 27.657140731811523, -126.16630554199219, 101.35454559326172, 114.1418228149414, 96.7420654296875, 95.28971862792969, 127.89287567138672, 153.31524658203125, 168.7008819580078, 188.48068237304688, 56.14710235595703, 31.4681396484375, -9.968818664550781, 0.17296409606933594, -134.3792266845703, 276.55072021484375, -122.46893310546875, 162.507080078125, -4.923210144042969, 184.6961669921875, 140.00987243652344, 256.529296875, -45.88404846191406, 47.32814025878906, 61.901451110839844, 144.7804412841797, 46.019554138183594, 234.9521484375, 44.37427520751953, 31.56574249267578, 85.18475341796875, 133.72637939453125, 114.40058135986328, 221.4617919921875, -49.56365966796875, 7.173746109008789, 168.108154296875, 245.4593505859375, 257.39874267578125, -49.15966033935547, -19.562515258789062, 198.76730346679688, 22.76605224609375, 184.77999877929688, 155.93804931640625, -1.637176513671875, 81.927734375, 117.07252502441406, 178.010986328125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000544.npy"} +{"epoch": 0.8223733938019653, "step": 545, "batch_size": 64, "mean": 46.31963348388672, "std": 89.90167999267578, "min": -190.4232940673828, "p10": -53.90981521606445, "median": 30.338486671447754, "p90": 173.75733795166016, "max": 240.37318420410156, "pos_frac": 0.65625, "sample": [100.2841567993164, 101.80516815185547, -56.34478759765625, 195.41629028320312, 13.51968002319336, -2.4786148071289062, -33.21929168701172, -45.801246643066406, -23.76200294494629, 39.81295394897461, 104.74591064453125, -2.3897705078125, 174.51844787597656, 28.324068069458008, 42.50647735595703, 34.857383728027344, 46.61381530761719, 171.98141479492188, -55.88824462890625, 91.06561279296875, -13.165107727050781, 128.72152709960938, -15.285942077636719, 131.57553100585938, 112.21334838867188, -6.321647644042969, 42.633323669433594, 26.37290382385254, -15.047378540039062, 6.846067428588867, -4.710659027099609, -49.293479919433594, -102.56622314453125, 112.174560546875, -65.7593994140625, -20.741315841674805, 182.51080322265625, 186.48681640625, 140.53211975097656, -9.545097351074219, -8.38314437866211, 216.51138305664062, 144.2616729736328, 20.823593139648438, 19.06682586669922, 98.73184967041016, -28.23345184326172, 114.92357635498047, 66.73915100097656, -190.4232940673828, 24.33087158203125, 81.1014404296875, 32.3529052734375, 240.37318420410156, 94.884765625, -106.74650573730469, 2.396503448486328, 121.5002212524414, -143.57247924804688, 1.0494403839111328, 88.81189727783203, 167.43052673339844, 199.97491455078125, 13.352668762207031], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000545.npy"} +{"epoch": 0.8238851095993953, "step": 546, "batch_size": 64, "mean": 53.73503494262695, "std": 91.04003143310547, "min": -175.326416015625, "p10": -82.17007904052733, "median": 57.48374366760254, "p90": 173.25964965820313, "max": 205.3402099609375, "pos_frac": 0.796875, "sample": [175.04534912109375, -39.94317626953125, 168.34393310546875, 62.739219665527344, 88.52313232421875, 153.3267059326172, -6.768463134765625, -47.66944885253906, 34.858245849609375, -63.967803955078125, -175.326416015625, 114.83839416503906, 27.05331039428711, 28.95245361328125, -135.6975860595703, 182.31063842773438, 18.764890670776367, 2.9623031616210938, -59.62178039550781, 37.802940368652344, -121.18087768554688, 68.8123779296875, 72.89456176757812, 114.14418029785156, 36.25299072265625, 87.35153198242188, 139.09080505371094, 20.3414306640625, 124.43882751464844, 196.47955322265625, 115.75099182128906, 8.782478332519531, 153.80496215820312, 51.58851623535156, 52.228267669677734, -90.17196655273438, 36.83686065673828, 205.3402099609375, 87.72404479980469, 91.64022827148438, 13.23366928100586, 25.604833602905273, -89.97105407714844, 88.63101959228516, 33.261924743652344, 114.47437286376953, -36.82024383544922, 18.382747650146484, 89.12358856201172, 115.72560119628906, 136.7723846435547, 41.09757995605469, 202.164794921875, -120.78518676757812, 5.349205017089844, 68.72599792480469, 140.88644409179688, 94.70515441894531, 180.8969268798828, 64.05951690673828, 184.73175048828125, -124.21623229980469, 169.093017578125, 5.237714767456055], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000546.npy"} +{"epoch": 0.8253968253968254, "step": 547, "batch_size": 64, "mean": 71.930419921875, "std": 92.11223602294922, "min": -195.16070556640625, "p10": -15.433628082275384, "median": 69.72477340698242, "p90": 183.71318664550782, "max": 288.97247314453125, "pos_frac": 0.828125, "sample": [4.4181060791015625, 11.17718505859375, 19.81781578063965, 13.692672729492188, 199.16339111328125, 70.4417724609375, -76.41246795654297, 234.21780395507812, 89.94671630859375, 144.95742797851562, 137.2547607421875, 121.42900848388672, 44.35987091064453, 81.11532592773438, 62.79573440551758, -5.1706390380859375, 107.34004211425781, 172.6367645263672, 21.29952621459961, 41.79985046386719, 164.5186767578125, 174.5447235107422, 178.23886108398438, 1.817626953125, 195.64822387695312, 123.90552520751953, -7.7090606689453125, 88.2616195678711, 74.83340454101562, 25.73566436767578, 97.12269592285156, -1.4677677154541016, -195.16070556640625, 130.1030731201172, -36.57963562011719, 71.25875854492188, 174.27059936523438, 36.62497329711914, 183.60293579101562, 63.957130432128906, 104.9632797241211, 183.76043701171875, 113.62629699707031, 138.62782287597656, -102.84799194335938, 69.00777435302734, 12.045494079589844, -171.99932861328125, 22.768997192382812, 32.70832824707031, 197.50106811523438, 171.4954071044922, 288.97247314453125, -8.037971496582031, 76.98467254638672, -40.046112060546875, 32.1794319152832, 163.37216186523438, 1.4834041595458984, 44.721092224121094, 46.50250244140625, 13.668975830078125, 190.88375854492188, -18.603195190429688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000547.npy"} +{"epoch": 0.8269085411942555, "step": 548, "batch_size": 64, "mean": 44.76388931274414, "std": 90.05619812011719, "min": -130.04046630859375, "p10": -73.97176208496093, "median": 35.464040756225586, "p90": 179.2696502685547, "max": 224.13467407226562, "pos_frac": 0.640625, "sample": [107.73951721191406, 147.01181030273438, -31.273529052734375, -51.68379211425781, -118.371826171875, 78.74107360839844, -21.336265563964844, 222.6937255859375, 142.26780700683594, 59.304344177246094, -32.91777038574219, 184.65432739257812, 0.7679710388183594, 14.758155822753906, 38.389373779296875, -0.7279567718505859, -101.74235534667969, 40.658058166503906, -6.325691223144531, 106.8193359375, 180.97872924804688, 69.45985412597656, -99.33442687988281, 18.562362670898438, 128.41668701171875, 32.5387077331543, 210.16627502441406, 175.28179931640625, 20.286285400390625, 105.05155944824219, -38.35762405395508, 94.10562133789062, -15.723907470703125, 117.14857482910156, 29.383438110351562, -25.288711547851562, 201.8558807373047, 48.956443786621094, -40.215476989746094, 73.76822662353516, 75.54952239990234, -4.731561660766602, 58.94603729248047, -130.04046630859375, 224.13467407226562, 1.77764892578125, -19.939170837402344, 70.37196350097656, -89.547119140625, 90.92218780517578, 26.252655029296875, -111.40164184570312, 48.12641906738281, 124.16827392578125, 93.61898040771484, -8.091270446777344, 146.14329528808594, -23.838134765625, 29.84710693359375, -61.80793762207031, 190.05841064453125, 147.3430938720703, -79.18482971191406, -0.25576019287109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000548.npy"} +{"epoch": 0.8284202569916855, "step": 549, "batch_size": 64, "mean": 53.36622619628906, "std": 97.95784759521484, "min": -186.38465881347656, "p10": -61.47577056884766, "median": 52.58894729614258, "p90": 183.2603500366211, "max": 278.75177001953125, "pos_frac": 0.6875, "sample": [5.557220458984375, 33.16736602783203, -57.915321350097656, 54.18273162841797, -6.006065368652344, -68.73518371582031, 93.84354400634766, 4.40330696105957, 80.81575775146484, 198.98025512695312, 185.51707458496094, 7.768135070800781, 81.79937744140625, 138.7249755859375, -4.3387451171875, -28.97595977783203, -110.24104309082031, 77.059326171875, 126.08647155761719, 126.53221130371094, 144.43267822265625, 131.8916778564453, 203.65853881835938, -87.05950927734375, 59.544189453125, 12.46136474609375, 24.247386932373047, 186.04244995117188, 132.19500732421875, -58.219139099121094, 177.99465942382812, 140.45651245117188, 278.75177001953125, -21.616044998168945, 131.03001403808594, 227.78768920898438, -8.829465866088867, -116.64511108398438, -38.432342529296875, 141.7054443359375, -175.98611450195312, 31.651748657226562, -16.375473022460938, 44.08462905883789, 70.79798889160156, 123.96977233886719, -60.386688232421875, 118.86099243164062, 190.81524658203125, 50.99516296386719, -5.7204437255859375, 118.25062561035156, 128.82681274414062, 99.25575256347656, 77.7698974609375, 9.101226806640625, 11.481115341186523, -0.9730720520019531, -23.72592544555664, 90.67894744873047, 177.7329864501953, -186.38465881347656, -61.94252014160156, 3.0372772216796875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000549.npy"} +{"epoch": 0.8299319727891157, "step": 550, "batch_size": 64, "mean": 37.31532287597656, "std": 87.05760192871094, "min": -163.85243225097656, "p10": -72.62949066162109, "median": 29.206144332885742, "p90": 159.1249343872071, "max": 227.96054077148438, "pos_frac": 0.71875, "sample": [67.08869934082031, 198.48736572265625, 182.10421752929688, 46.24119567871094, -111.60940551757812, 9.991798400878906, 0.2695331573486328, -21.876632690429688, -4.087532043457031, 57.277099609375, 144.096435546875, 43.95348358154297, 50.26251220703125, 0.9974136352539062, 16.277742385864258, 185.56048583984375, 196.60597229003906, 95.2149887084961, 26.36248779296875, 32.049800872802734, 131.53054809570312, -13.83712387084961, 119.53494262695312, 101.26942443847656, 140.03286743164062, -67.99235534667969, 227.96054077148438, -7.465648651123047, 23.300643920898438, -100.94224548339844, -99.19706726074219, 25.753311157226562, -73.27365112304688, 79.12098693847656, 5.4102783203125, 67.7579345703125, 53.70397186279297, 1.770477294921875, -41.399314880371094, 10.980209350585938, -71.12644958496094, 65.53804016113281, 21.394107818603516, 45.043399810791016, -5.6911163330078125, 95.63180541992188, 18.889495849609375, 19.688417434692383, 40.814697265625, 113.69313049316406, -107.92849731445312, 92.87701416015625, 190.66189575195312, 49.172828674316406, 137.2272186279297, 38.095558166503906, -163.85243225097656, 11.303838729858398, 165.5657196044922, -154.34762573242188, 100.17901611328125, -41.81671905517578, -20.163463592529297, -51.95549392700195], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000550.npy"} +{"epoch": 0.8314436885865457, "step": 551, "batch_size": 64, "mean": 50.47639465332031, "std": 85.26113891601562, "min": -166.97140502929688, "p10": -20.30245609283447, "median": 21.53953456878662, "p90": 159.21590270996094, "max": 421.81878662109375, "pos_frac": 0.765625, "sample": [5.304649353027344, 67.1317138671875, 89.09449768066406, 21.1322021484375, 93.54098510742188, 57.93016815185547, 421.81878662109375, 3.470867156982422, 21.946866989135742, 37.847557067871094, -29.644702911376953, 22.257232666015625, 131.2640380859375, 4.752054214477539, 70.35186767578125, 30.098857879638672, 142.80307006835938, 47.518760681152344, -166.97140502929688, -24.103668212890625, -11.107271194458008, 12.675880432128906, 96.9269790649414, 12.865631103515625, 74.99954223632812, 181.89620971679688, -7.4794464111328125, 79.91507720947266, 48.77000427246094, 155.4246063232422, 30.03293800354004, -36.617103576660156, 0.30391693115234375, -2.437835693359375, 46.20472717285156, 229.1983642578125, 4.01763916015625, 136.92864990234375, -15.747701644897461, 11.390884399414062, 4.589302062988281, 56.90605926513672, -22.254493713378906, 9.891284942626953, 147.15074157714844, 201.55010986328125, 160.8407440185547, 10.942951202392578, 19.619522094726562, 1.2880821228027344, 62.458946228027344, 96.73519134521484, 2.584381103515625, -48.23747634887695, 11.528648376464844, -1.4991912841796875, -11.032825469970703, 186.37156677246094, -2.841705322265625, 10.448719024658203, -51.620025634765625, -3.7616233825683594, 172.9831085205078, 120.14108276367188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000551.npy"} +{"epoch": 0.8329554043839759, "step": 552, "batch_size": 64, "mean": 57.80108642578125, "std": 80.08467102050781, "min": -183.861572265625, "p10": -17.853820037841796, "median": 62.4782657623291, "p90": 151.00320739746095, "max": 234.81822204589844, "pos_frac": 0.84375, "sample": [3.4013233184814453, 28.4815673828125, 43.68811798095703, -18.14385223388672, 117.77447509765625, 62.49763107299805, 2.5360851287841797, 22.819473266601562, 35.85966491699219, 132.3598175048828, 180.29928588867188, 234.81822204589844, 111.94622802734375, 54.71858215332031, -10.469062805175781, -67.59774017333984, 9.176246643066406, 119.93182373046875, 61.758201599121094, -17.177078247070312, 51.071128845214844, 112.96551513671875, 100.58885192871094, 119.22718048095703, 112.28652954101562, 0.9039764404296875, 84.90746307373047, 134.5771942138672, 153.4002227783203, -183.861572265625, 10.849416732788086, 25.534202575683594, 80.80252075195312, -139.77398681640625, 78.8793716430664, -0.5624618530273438, 177.47891235351562, 53.90382385253906, 1.1601486206054688, 0.29279327392578125, 168.57843017578125, 28.288055419921875, -52.80976104736328, 112.19017028808594, 96.87533569335938, 14.97882080078125, 86.06288146972656, 53.90167236328125, -173.30227661132812, 165.00547790527344, 184.73170471191406, 91.64698028564453, 15.342267990112305, -60.149436950683594, 105.75193786621094, 67.8429946899414, 62.458900451660156, 59.142127990722656, 140.2447967529297, 78.16658020019531, 79.17720794677734, 74.98828887939453, 145.41017150878906, 71.43576049804688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000552.npy"} +{"epoch": 0.8344671201814059, "step": 553, "batch_size": 64, "mean": 53.45932388305664, "std": 101.73280334472656, "min": -189.21560668945312, "p10": -52.26652183532715, "median": 44.556766510009766, "p90": 202.51326751708987, "max": 301.9083251953125, "pos_frac": 0.640625, "sample": [235.60980224609375, -33.27466583251953, -6.2210235595703125, 91.58758544921875, 6.265510559082031, -2.550577163696289, 155.18569946289062, 195.61981201171875, -19.67987823486328, -15.961357116699219, 45.238807678222656, 113.07061767578125, 205.4676055908203, 234.13059997558594, -50.546546936035156, 107.81005859375, -1.8004894256591797, 58.975074768066406, 62.581024169921875, -189.21560668945312, -8.041501998901367, 126.03276062011719, -19.45404815673828, 120.88018798828125, 150.13404846191406, 37.571083068847656, 14.941566467285156, 47.150421142578125, -3.93475341796875, -56.73486328125, 248.07763671875, 165.12940979003906, 80.02404022216797, 301.9083251953125, 43.874725341796875, 91.82820892333984, 178.3253936767578, 122.35606384277344, 95.53353881835938, 76.69852447509766, 11.708885192871094, 52.91132736206055, 21.697751998901367, -16.076030731201172, -60.06834411621094, 40.784400939941406, -6.095149993896484, 215.01666259765625, -169.99151611328125, -109.52143859863281, 68.20419311523438, 140.36602783203125, 121.70938110351562, -52.257301330566406, -48.78215789794922, 31.391830444335938, -28.244274139404297, -124.61430358886719, 104.75370788574219, 74.10718536376953, -36.573143005371094, -52.27047348022461, 224.62689208984375, 14.019607543945312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000553.npy"} +{"epoch": 0.8359788359788359, "step": 554, "batch_size": 64, "mean": 65.028076171875, "std": 90.00746154785156, "min": -181.77752685546875, "p10": -25.8632640838623, "median": 53.620208740234375, "p90": 181.38377685546877, "max": 244.85707092285156, "pos_frac": 0.765625, "sample": [59.085113525390625, 208.47166442871094, 186.62074279785156, 203.35595703125, -1.960968017578125, 77.34759521484375, 23.189775466918945, 24.876598358154297, 59.35447692871094, 140.9326171875, -3.291595458984375, -9.674507141113281, -8.348617553710938, 118.52474212646484, -181.77752685546875, 28.072174072265625, 106.39384460449219, -20.996490478515625, 109.49315643310547, 17.761022567749023, -7.056526184082031, 146.02139282226562, 48.155303955078125, -64.87425231933594, 160.2665557861328, 137.897705078125, 183.39532470703125, 25.660167694091797, -11.996654510498047, 38.542381286621094, 182.39857482910156, 0.5015869140625, 145.05958557128906, 37.80862808227539, 4.861053466796875, -60.64769744873047, 153.68185424804688, 15.28575325012207, 121.53357696533203, 13.225433349609375, -177.1716766357422, 149.2118682861328, 66.01791381835938, 87.53077697753906, -29.617019653320312, 104.33244323730469, 16.38582420349121, 101.986328125, 42.86810302734375, 6.94635009765625, 150.42886352539062, -0.6561050415039062, -27.949024200439453, 157.5692138671875, 196.4160919189453, 25.511619567871094, 130.84710693359375, 139.85186767578125, 102.46512603759766, 179.0159149169922, 244.85707092285156, -103.31763458251953, 169.72085571289062, 21.395431518554688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000554.npy"} +{"epoch": 0.8374905517762661, "step": 555, "batch_size": 64, "mean": 54.15822219848633, "std": 99.3387451171875, "min": -201.78121948242188, "p10": -74.97238464355468, "median": 59.711524963378906, "p90": 177.49309539794925, "max": 213.0677947998047, "pos_frac": 0.765625, "sample": [2.849546432495117, -200.04537963867188, 49.59040832519531, 49.95953369140625, 164.7777099609375, 9.055961608886719, -179.7958526611328, -9.439834594726562, -85.17402648925781, 103.61216735839844, 192.91766357421875, -56.94670104980469, 94.3104248046875, 21.960773468017578, 134.360107421875, 203.91513061523438, 40.64762878417969, 8.83367919921875, 16.245315551757812, 182.12799072265625, 96.54166412353516, -0.8538665771484375, 197.46633911132812, 58.6285400390625, 169.10940551757812, 60.79450988769531, 83.46839904785156, 164.74803161621094, 83.39411926269531, 181.51834106445312, 145.85159301757812, 136.43133544921875, 93.6842269897461, 141.99822998046875, -98.67913055419922, 181.0861053466797, -201.78121948242188, 116.95531463623047, -56.57019805908203, 47.14522171020508, 76.61761474609375, 79.84341430664062, -23.291221618652344, 29.17029571533203, -61.17195129394531, 15.18503189086914, 63.66545104980469, 86.42426300048828, 155.45457458496094, -24.36400604248047, 110.04714965820312, 27.26323699951172, -178.0905303955078, -2.0098342895507812, 152.9514617919922, 39.77320861816406, 86.8323974609375, 42.6175537109375, 98.47562408447266, -80.88685607910156, 213.0677947998047, 45.678749084472656, 161.96624755859375, 6.207235336303711], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000555.npy"} +{"epoch": 0.8390022675736961, "step": 556, "batch_size": 64, "mean": 49.503414154052734, "std": 98.27352142333984, "min": -166.09555053710938, "p10": -74.32548522949219, "median": 33.1645450592041, "p90": 178.51851806640624, "max": 300.2833251953125, "pos_frac": 0.703125, "sample": [135.91973876953125, 32.37109375, 42.70451354980469, -12.490909576416016, 1.0477752685546875, 156.17916870117188, 195.937255859375, 77.46295166015625, -17.155275344848633, -66.49542236328125, 15.836809158325195, 7.9191436767578125, 92.84090423583984, 167.48065185546875, 23.089641571044922, -35.92909240722656, 45.423919677734375, -5.577445983886719, 100.02120971679688, 158.79541015625, -23.067062377929688, 139.6702423095703, 162.65084838867188, 34.12158966064453, -59.19799041748047, 27.56751251220703, -164.3530731201172, 42.43743896484375, 125.64405059814453, -91.9473876953125, -1.925954818725586, -166.09555053710938, 94.03630065917969, 28.419883728027344, 31.730117797851562, 5.039220809936523, 122.99247741699219, 153.35946655273438, 9.378463745117188, 6.343839645385742, 179.18112182617188, 300.2833251953125, 33.9579963684082, 40.23466491699219, 215.58567810058594, 183.00726318359375, -50.6519775390625, 30.643157958984375, -116.65650177001953, -7.0553131103515625, 196.72262573242188, -77.07559204101562, -34.39546203613281, 164.8375244140625, 21.55270767211914, -81.10348510742188, 55.13763427734375, -83.8442153930664, 67.65370178222656, 171.19802856445312, 185.6966552734375, 176.97244262695312, 72.05843353271484, -67.9085693359375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000556.npy"} +{"epoch": 0.8405139833711263, "step": 557, "batch_size": 64, "mean": 69.40608978271484, "std": 81.32310485839844, "min": -61.11590576171875, "p10": -25.631427383422846, "median": 61.068748474121094, "p90": 186.46854400634766, "max": 210.65048217773438, "pos_frac": 0.71875, "sample": [193.0998077392578, 113.80485534667969, 87.10069274902344, 30.152923583984375, 7.875522613525391, -37.77655029296875, 186.77293395996094, 32.93182373046875, 173.11703491210938, 100.40634155273438, 2.1799468994140625, -12.527725219726562, -4.1946563720703125, 92.20055389404297, -7.307964324951172, 67.43551635742188, 70.23631286621094, 6.818550109863281, 146.0931396484375, 87.6594467163086, 7.553722381591797, -5.722137451171875, 167.34799194335938, -4.2940673828125, -51.01029968261719, -61.11590576171875, 172.65274047851562, 206.85641479492188, 28.693477630615234, -52.97657012939453, 210.65048217773438, 93.49432373046875, 143.37850952148438, -19.77212905883789, -11.354354858398438, 185.75830078125, 89.84073638916016, 130.59194946289062, 54.78016662597656, 204.1939697265625, -5.5553131103515625, 30.408815383911133, -28.142555236816406, -12.782135009765625, -0.5504093170166016, -35.150665283203125, 195.6757049560547, 179.5572509765625, 158.27755737304688, 17.95378875732422, 10.48028564453125, 73.85515594482422, 33.83576965332031, 135.3500213623047, 140.3539581298828, 81.29595947265625, 180.4962921142578, 67.35733032226562, 42.204708099365234, 53.49143981933594, -42.422332763671875, -15.194747924804688, 204.6149444580078, 150.9530792236328], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000557.npy"} +{"epoch": 0.8420256991685563, "step": 558, "batch_size": 64, "mean": 78.43830108642578, "std": 90.20142364501953, "min": -119.37128448486328, "p10": -24.615619659423825, "median": 74.90170288085938, "p90": 192.97844390869142, "max": 299.3053894042969, "pos_frac": 0.796875, "sample": [144.88156127929688, 198.6608428955078, 195.5675048828125, -0.9697341918945312, 174.94154357910156, 10.06787109375, 178.34600830078125, -37.00859451293945, 4.0466461181640625, 137.89830017089844, -20.821327209472656, 144.74874877929688, -26.241744995117188, 29.541465759277344, 2.237701416015625, 138.52777099609375, 167.37925720214844, 7.82275390625, 84.095947265625, 78.67050170898438, 299.3053894042969, 136.79615783691406, 24.166141510009766, 177.2530517578125, 128.59938049316406, -54.27171325683594, 192.76504516601562, 27.910667419433594, 152.3284912109375, 75.39928436279297, 164.99264526367188, 33.18278503417969, 82.3497314453125, 214.1902618408203, 7.7978668212890625, 4.642080307006836, 98.03860473632812, 12.975875854492188, 45.97023010253906, 241.0589599609375, 133.47450256347656, -37.09088134765625, 253.06875610351562, -1.4111785888671875, 181.17782592773438, 180.38430786132812, -14.57122802734375, -30.70685577392578, 193.0699005126953, 18.479812622070312, 99.30474853515625, -119.37128448486328, 74.6050796508789, -42.930572509765625, 48.85064697265625, -6.138130187988281, 118.30757141113281, 14.587722778320312, -20.301788330078125, 3.99945068359375, 166.0840606689453, 49.99779510498047, 75.19832611083984, 4.138916015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000558.npy"} +{"epoch": 0.8435374149659864, "step": 559, "batch_size": 64, "mean": 66.95707702636719, "std": 103.83827209472656, "min": -148.71705627441406, "p10": -35.81832580566406, "median": 37.6202278137207, "p90": 193.14001922607423, "max": 416.86944580078125, "pos_frac": 0.71875, "sample": [4.7645416259765625, -35.956932067871094, 3.913921356201172, -15.715896606445312, 109.2823715209961, 416.86944580078125, 218.76846313476562, 259.98626708984375, 34.58039093017578, -5.271968841552734, -137.04364013671875, 169.35092163085938, 61.956565856933594, 122.41868591308594, 10.598478317260742, 181.33804321289062, 120.01371002197266, 49.57941436767578, 145.96250915527344, 112.89891052246094, 184.4163818359375, 34.32438659667969, -23.194229125976562, 127.64523315429688, 0.7141036987304688, 14.830329895019531, -87.50950622558594, 171.11087036132812, 55.61552429199219, 185.30038452148438, 40.660064697265625, 72.11662292480469, -9.9326171875, 211.84683227539062, 193.5740203857422, -37.546424865722656, 101.50907897949219, 7.603742599487305, -20.512611389160156, -19.789512634277344, -8.568321228027344, -17.67182159423828, -21.563594818115234, 30.989349365234375, 117.59626770019531, 192.12734985351562, 119.73717498779297, -35.494911193847656, 147.6353759765625, -11.566146850585938, 25.75361442565918, 202.40003967285156, -116.86103820800781, 12.564468383789062, 147.3325653076172, 212.30088806152344, 17.304088592529297, 130.20184326171875, 5.593208312988281, 13.06132698059082, 114.005615234375, 166.75827026367188, -40.742271423339844, -148.71705627441406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000559.npy"} +{"epoch": 0.8450491307634165, "step": 560, "batch_size": 64, "mean": 60.21735382080078, "std": 84.18445587158203, "min": -87.56587219238281, "p10": -57.596253204345686, "median": 44.381317138671875, "p90": 179.11573791503906, "max": 217.53390502929688, "pos_frac": 0.734375, "sample": [77.5218734741211, 56.517242431640625, 177.50132751464844, 40.69861602783203, -66.41470336914062, -65.67765045166016, 186.98666381835938, 35.16984558105469, 217.53390502929688, 1.9676685333251953, 88.94371032714844, 4.944648742675781, 64.38175964355469, 48.10572814941406, 9.118743896484375, -25.84136962890625, -0.7256927490234375, -1.7166423797607422, 23.741886138916016, 111.09428405761719, -71.35572814941406, 141.58767700195312, 54.488670349121094, 5.0445098876953125, 177.35816955566406, 123.72293090820312, -15.470924377441406, 169.77120971679688, 182.4981231689453, 16.751874923706055, 30.99481201171875, -15.756538391113281, -36.70165252685547, 200.49017333984375, 134.54835510253906, -74.71505737304688, 36.117652893066406, -64.63275146484375, 179.3291473388672, -41.177757263183594, 187.05328369140625, 131.63877868652344, 48.06401824951172, 103.14279174804688, 4.384864807128906, 104.36856842041016, 2.5741348266601562, 178.61778259277344, 33.305171966552734, -16.014083862304688, -4.316802978515625, 180.09417724609375, -73.46501922607422, -1.1217498779296875, 153.10052490234375, 145.11907958984375, -87.56587219238281, 34.32138442993164, 157.62353515625, 53.12527847290039, 178.29623413085938, 104.80488586425781, 33.95424270629883, 86.0609130859375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000560.npy"} +{"epoch": 0.8465608465608465, "step": 561, "batch_size": 64, "mean": 62.07233428955078, "std": 90.30623626708984, "min": -88.96372985839844, "p10": -42.036244964599604, "median": 39.04734802246094, "p90": 188.44662475585943, "max": 265.60626220703125, "pos_frac": 0.734375, "sample": [5.1785888671875, 15.171981811523438, -2.5316162109375, -3.8797245025634766, 52.86866760253906, 140.2818603515625, 77.75320434570312, -19.71966552734375, 170.44363403320312, 37.12834167480469, 53.070587158203125, 122.63407897949219, 3.803516387939453, 106.09477233886719, 13.5113525390625, -88.19563293457031, 29.288345336914062, 155.54867553710938, 195.12850952148438, -6.3863677978515625, -38.62962341308594, 153.70913696289062, 120.68049621582031, -43.0175666809082, 99.24220275878906, -36.061683654785156, 132.64071655273438, -39.74649429321289, -88.96372985839844, 244.24600219726562, -20.91989517211914, 40.17530822753906, 177.69781494140625, 201.59950256347656, 37.91938781738281, 33.565643310546875, 51.716529846191406, 46.71589660644531, 12.705221176147461, 253.98193359375, 265.60626220703125, 213.4507598876953, 155.0071563720703, 192.9607696533203, 129.87030029296875, -82.49678802490234, -65.05219268798828, 37.24775695800781, 93.48591613769531, 10.79969596862793, -29.412826538085938, 64.7883529663086, 5.154945373535156, 0.28808021545410156, 104.96371459960938, 177.9136199951172, 8.10316276550293, 113.36973571777344, 103.11740112304688, -72.88931274414062, -2.831541061401367, 29.430627822875977, 167.12144470214844, -43.817596435546875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000561.npy"} +{"epoch": 0.8480725623582767, "step": 562, "batch_size": 64, "mean": 73.26075744628906, "std": 92.98955535888672, "min": -96.48112487792969, "p10": -40.60835800170898, "median": 68.90968322753906, "p90": 182.49549865722656, "max": 311.862548828125, "pos_frac": 0.75, "sample": [15.484931945800781, 172.79457092285156, -71.44908142089844, 185.62020874023438, 180.41249084472656, 167.49591064453125, 30.04576873779297, 306.524169921875, 162.406005859375, -32.432411193847656, 92.052001953125, 64.05081176757812, -69.07331848144531, 5.173839569091797, 98.88555908203125, -2.3449363708496094, 39.02577209472656, 68.9808349609375, 111.82330322265625, -57.52198791503906, 122.17394256591797, 175.10763549804688, -47.239959716796875, -18.160682678222656, -5.5246124267578125, 178.0199432373047, -3.379110336303711, 4.321403503417969, 62.123199462890625, 16.983585357666016, 156.94989013671875, -44.112335205078125, 162.136474609375, 189.52392578125, 70.72181701660156, 311.862548828125, -17.901371002197266, -13.732925415039062, 1.2237510681152344, 211.16455078125, 10.52435302734375, 10.163383483886719, 73.51494598388672, 111.27558898925781, 131.30328369140625, 182.72891235351562, 181.95086669921875, 93.4921875, 131.83160400390625, -14.5125732421875, 170.68927001953125, 68.83853149414062, -17.665193557739258, 54.26036834716797, 118.95181274414062, 78.46485900878906, 162.14881896972656, 202.47352600097656, 78.65522003173828, -96.48112487792969, 2.957183837890625, -70.71650695800781, 3.6235885620117188, 39.99989318847656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000562.npy"} +{"epoch": 0.8495842781557067, "step": 563, "batch_size": 64, "mean": 62.966552734375, "std": 94.71707153320312, "min": -184.56765747070312, "p10": -54.67888031005858, "median": 63.889190673828125, "p90": 184.91433105468752, "max": 224.0692901611328, "pos_frac": 0.765625, "sample": [83.88408660888672, 135.5221710205078, 48.746517181396484, 0.53314208984375, 178.9399871826172, 138.88568115234375, -184.56765747070312, 189.62017822265625, 116.88697814941406, -6.808631896972656, 18.61190414428711, 127.163818359375, 14.9947509765625, -43.729705810546875, 169.2190399169922, 45.75274658203125, -124.42413330078125, 85.07015228271484, -26.848350524902344, 224.0692901611328, 41.358001708984375, 213.49310302734375, -42.66943359375, 180.45663452148438, 149.08685302734375, 85.15392303466797, 106.84036254882812, 10.912467956542969, 74.96783447265625, -103.94649505615234, 2.4842071533203125, -30.412654876708984, 4.5391998291015625, 29.314300537109375, -15.458881378173828, 131.51438903808594, 57.24832534790039, -90.5826416015625, 100.09146118164062, 37.09663772583008, 186.20416259765625, 191.17013549804688, 168.8748016357422, -25.933547973632812, -109.777587890625, 68.72578430175781, 53.44795227050781, -34.05724334716797, 181.90472412109375, 102.41976165771484, -103.00875854492188, 88.79067993164062, 46.77834701538086, 135.46075439453125, 113.99723815917969, 59.05259704589844, 201.67462158203125, 220.45895385742188, 42.31126403808594, 150.8091583251953, 89.18912506103516, -59.37138366699219, 122.97988891601562, 4.748260498046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000563.npy"} +{"epoch": 0.8510959939531368, "step": 564, "batch_size": 64, "mean": 80.27366638183594, "std": 97.75011444091797, "min": -176.3113555908203, "p10": -53.25345230102539, "median": 78.03952407836914, "p90": 205.91575927734377, "max": 232.98683166503906, "pos_frac": 0.8125, "sample": [179.81689453125, 8.941780090332031, 204.16409301757812, 173.97772216796875, 94.47205352783203, 230.10394287109375, 124.02717590332031, -153.9894256591797, -20.31121826171875, 7.268707275390625, 196.839599609375, 157.8795166015625, 58.07380294799805, -51.14421844482422, 11.184967041015625, 21.061248779296875, -18.45160675048828, 120.23011779785156, 135.47662353515625, 72.91718292236328, 71.03739929199219, 0.5629596710205078, 104.67668151855469, 112.29269409179688, 166.9676055908203, 152.91104125976562, 223.877685546875, -72.33265686035156, -0.4419536590576172, 102.70237731933594, 220.68426513671875, 232.98683166503906, 206.66647338867188, 97.91111755371094, 54.483154296875, -112.7216567993164, 152.96551513671875, 53.5074577331543, 61.28947448730469, 12.132286071777344, 170.5474090576172, 70.15031433105469, 72.60392761230469, -6.836137771606445, -68.74858093261719, 60.33258056640625, 59.147438049316406, 199.6099853515625, 67.6528091430664, -70.24391174316406, 83.161865234375, 105.34420013427734, 209.98635864257812, 0.7543659210205078, 168.57244873046875, 33.92610168457031, 172.0556182861328, 207.14724731445312, -176.3113555908203, 186.16143798828125, -54.15740966796875, 19.702655792236328, 86.35736083984375, 145.8999481201172], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000564.npy"} +{"epoch": 0.8526077097505669, "step": 565, "batch_size": 64, "mean": 57.372161865234375, "std": 85.69770050048828, "min": -135.7086181640625, "p10": -52.86337242126465, "median": 51.063072204589844, "p90": 166.18914489746095, "max": 280.68829345703125, "pos_frac": 0.765625, "sample": [20.54736328125, 2.0911598205566406, -11.076667785644531, 33.387359619140625, 46.625953674316406, 43.283355712890625, 114.86862182617188, 55.41313934326172, 10.958831787109375, 27.56061553955078, 46.71300506591797, 104.66429138183594, 227.68734741210938, -135.7086181640625, -20.354095458984375, 135.2602996826172, 76.28504943847656, 93.43521118164062, 280.68829345703125, 203.82211303710938, 146.63528442382812, -78.39646911621094, 5.912117004394531, 16.20783233642578, 66.86466979980469, 126.4630126953125, 67.38429260253906, 43.29999542236328, 77.77710723876953, 98.63871002197266, 171.12216186523438, 11.942453384399414, -52.816009521484375, -68.76925659179688, 107.80087280273438, -52.883670806884766, 17.387895584106445, 135.70501708984375, -127.49296569824219, 78.0968017578125, 113.93051147460938, -16.384647369384766, -48.68843078613281, 104.94793701171875, -58.454681396484375, 110.11741638183594, 22.4422607421875, 160.21022033691406, 215.62596130371094, 26.45063018798828, 131.72689819335938, -14.563018798828125, -99.8111572265625, -0.3138160705566406, 33.663272857666016, 27.280948638916016, -19.173858642578125, 133.36227416992188, 58.36498260498047, 84.39190673828125, 184.3886260986328, 116.98197937011719, 89.53838348388672, 168.7515411376953], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000565.npy"} +{"epoch": 0.854119425547997, "step": 566, "batch_size": 64, "mean": 55.465171813964844, "std": 107.20050811767578, "min": -249.45286560058594, "p10": -64.65326538085937, "median": 60.77851867675781, "p90": 182.52509002685548, "max": 278.3076171875, "pos_frac": 0.703125, "sample": [75.27398681640625, 39.57343292236328, -56.80113220214844, 103.66758728027344, 1.202056884765625, 47.986331939697266, 184.2384033203125, 175.60214233398438, 3.5152454376220703, 122.6220932006836, 65.58528137207031, 97.90238952636719, 62.8466796875, 61.96281051635742, 19.87773895263672, 278.3076171875, -249.45286560058594, 105.95938873291016, 178.52735900878906, 133.2261962890625, 199.0205535888672, -16.529754638671875, -38.711246490478516, 103.70801544189453, 3.1866092681884766, -66.57167053222656, 99.56480407714844, 161.52816772460938, 176.9589385986328, 0.2192535400390625, 166.9158477783203, 139.1503143310547, 150.43942260742188, 35.657562255859375, -6.48919677734375, -177.19906616210938, -57.043479919433594, 30.074153900146484, 254.26527404785156, -54.62517547607422, 37.0775146484375, -60.17698669433594, 269.4388427734375, -44.025360107421875, 173.52920532226562, 10.582084655761719, -80.65066528320312, -122.42729949951172, 74.59180450439453, -8.835441589355469, -44.65095901489258, 4.215171813964844, -34.31956481933594, 172.6148681640625, -20.420215606689453, 59.5942268371582, -67.24663543701172, 189.88125610351562, 63.268516540527344, -112.02044677734375, 138.83303833007812, 99.91655731201172, 102.2259521484375, 193.6334228515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000566.npy"} +{"epoch": 0.8556311413454271, "step": 567, "batch_size": 64, "mean": 65.55530548095703, "std": 85.54998779296875, "min": -103.7050552368164, "p10": -59.652650451660136, "median": 64.82452011108398, "p90": 173.63448181152344, "max": 245.84243774414062, "pos_frac": 0.796875, "sample": [118.73670959472656, 0.8373603820800781, -2.7930221557617188, 172.47491455078125, -43.32594299316406, 118.97384643554688, 192.83926391601562, 148.90460205078125, 174.13143920898438, 29.26445770263672, 162.3140869140625, 58.20082092285156, 84.52437591552734, -42.37162780761719, 90.9150161743164, -14.066291809082031, -8.586143493652344, 41.615692138671875, 19.38105010986328, 58.01518630981445, 137.02676391601562, 9.867912292480469, 2.5549755096435547, 161.42758178710938, -74.12601470947266, 0.22711753845214844, -103.7050552368164, -81.10228729248047, 112.36859893798828, -89.02388763427734, 156.3463592529297, 62.23851013183594, 179.265625, 245.84243774414062, 193.61367797851562, 0.6851310729980469, 89.86495208740234, 32.42132568359375, 109.27815246582031, 193.642822265625, -78.31999206542969, 104.12346649169922, 57.956695556640625, 70.29753112792969, 151.45574951171875, 123.69978332519531, -0.186798095703125, 3.4991302490234375, 157.53598022460938, 120.94673156738281, 81.03547668457031, 25.275585174560547, 166.77499389648438, 4.182891845703125, 11.706527709960938, -94.44425201416016, -66.64981079101562, 89.40377807617188, 201.97073364257812, 10.18572998046875, 121.37882995605469, 67.41053009033203, 57.81395721435547, 109.78575897216797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000567.npy"} +{"epoch": 0.8571428571428571, "step": 568, "batch_size": 64, "mean": 78.94135284423828, "std": 92.60421752929688, "min": -78.63829040527344, "p10": -38.039559936523425, "median": 62.813608169555664, "p90": 194.56463317871095, "max": 360.39227294921875, "pos_frac": 0.796875, "sample": [120.7938003540039, 51.171417236328125, 60.992740631103516, 31.0692138671875, 94.69021606445312, 126.64389038085938, 126.45028686523438, -78.63829040527344, 25.121417999267578, -25.192291259765625, -66.45677185058594, 164.85968017578125, 42.19233703613281, 218.55780029296875, -13.764625549316406, -60.58229064941406, 51.265113830566406, -5.322914123535156, 66.1465072631836, 108.334716796875, -73.36283874511719, 1.72198486328125, 40.38065719604492, 168.3603515625, 196.31935119628906, 172.218017578125, 141.09243774414062, 244.66055297851562, -67.33625793457031, 35.366546630859375, 127.77680969238281, 64.63447570800781, 80.46276092529297, -19.392845153808594, 135.1734161376953, 20.262346267700195, -4.5875244140625, 113.50067901611328, -1.7189807891845703, 149.44363403320312, 23.27031707763672, 166.51837158203125, 97.59341430664062, 91.87295532226562, 151.947998046875, 42.769142150878906, 42.17353820800781, 2.45843505859375, 15.075912475585938, 48.43019104003906, 82.14376831054688, 142.81979370117188, -44.6168212890625, 119.5949935913086, 177.84329223632812, 44.54206848144531, 1.6954574584960938, 304.5372619628906, 199.65423583984375, 216.7015838623047, -43.5455322265625, 54.595924377441406, 190.4702911376953, 360.39227294921875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000568.npy"} +{"epoch": 0.8586545729402872, "step": 569, "batch_size": 64, "mean": 45.525840759277344, "std": 90.35174560546875, "min": -171.46102905273438, "p10": -51.374136352539054, "median": 38.39813232421875, "p90": 174.76989746093753, "max": 247.16937255859375, "pos_frac": 0.71875, "sample": [161.236328125, -55.85166931152344, 10.258123397827148, 161.10545349121094, 45.20808410644531, 178.0460205078125, 14.160049438476562, 247.16937255859375, 69.308349609375, 180.31088256835938, 78.4073486328125, -32.33623504638672, 15.26718521118164, 48.86415100097656, -171.46102905273438, 40.02821350097656, 15.936199188232422, 241.1403045654297, -7.530988693237305, 73.86674499511719, 158.06097412109375, 141.83663940429688, 42.904232025146484, 203.2689208984375, -28.65899658203125, 161.89328002929688, 92.64591979980469, 21.95175552368164, 36.919647216796875, -115.17877960205078, -111.81620025634766, 47.84214401245117, 0.8424072265625, 16.666759490966797, -20.34008026123047, -25.001708984375, 191.20516967773438, 7.23210334777832, 43.389991760253906, 20.497262954711914, 55.75990295410156, -40.92655944824219, -99.45368957519531, -16.471397399902344, 89.39042663574219, -112.17610931396484, 37.34562683105469, -27.388992309570312, 34.5921745300293, 86.27348327636719, 58.79560470581055, 81.72096252441406, 162.2361602783203, -34.077903747558594, -35.93244171142578, 32.794212341308594, 97.17593383789062, 39.45063781738281, 180.36917114257812, -27.11370849609375, -87.5198745727539, 30.28697967529297, 167.1256103515625, 42.103233337402344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000569.npy"} +{"epoch": 0.8601662887377173, "step": 570, "batch_size": 64, "mean": 81.95825958251953, "std": 93.59471893310547, "min": -129.00865173339844, "p10": -26.019437599182126, "median": 71.0296745300293, "p90": 196.2804962158203, "max": 389.5987854003906, "pos_frac": 0.78125, "sample": [177.91412353515625, -87.95014190673828, 130.663818359375, 63.31338119506836, 112.80390167236328, 46.157920837402344, -36.09918212890625, -4.069671630859375, 48.65464782714844, -23.578170776367188, 67.43885040283203, 61.6514892578125, 18.31537437438965, 131.05465698242188, -7.990715026855469, 142.30677795410156, -1.9540119171142578, 2.3489646911621094, 65.74537658691406, 97.47837829589844, 104.37664794921875, -104.58465576171875, 26.395347595214844, 164.25372314453125, 196.38760375976562, 3.885465621948242, 58.52347946166992, 119.25703430175781, 205.93276977539062, -22.809837341308594, 25.437477111816406, 121.16080474853516, 160.81700134277344, -79.70011901855469, 26.292728424072266, 106.86710357666016, 166.48861694335938, 74.62049865722656, 181.7410125732422, 65.7886734008789, 215.23736572265625, 146.52276611328125, 228.50701904296875, -27.06569480895996, 35.53472137451172, 116.85711669921875, 165.86895751953125, 205.8676300048828, 117.74075317382812, -129.00865173339844, 162.505859375, -28.056053161621094, 54.98301696777344, 156.76124572753906, 197.3191375732422, 37.21257019042969, 89.6199951171875, -5.08460807800293, 124.75656127929688, 158.91171264648438, 389.5987854003906, 40.16072463989258, 196.03057861328125, -10.790176391601562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000570.npy"} +{"epoch": 0.8616780045351474, "step": 571, "batch_size": 64, "mean": 44.822479248046875, "std": 88.22185516357422, "min": -163.2166290283203, "p10": -79.41457214355468, "median": 58.02311897277832, "p90": 144.30182342529298, "max": 250.333251953125, "pos_frac": 0.71875, "sample": [102.68368530273438, 77.65213775634766, 53.11183166503906, 23.66401481628418, -0.4382171630859375, 103.12745666503906, 83.03939819335938, 84.81963348388672, 123.5997543334961, 250.333251953125, 76.6393814086914, 59.307701110839844, -90.5406723022461, 6.558872222900391, -4.049552917480469, 103.34422302246094, 30.843490600585938, 144.32608032226562, 14.996871948242188, 104.18163299560547, 147.3665771484375, 14.844734191894531, 91.22019958496094, 62.13395690917969, 166.126953125, 94.001708984375, 86.79658508300781, 106.39971160888672, -154.94342041015625, 26.85076141357422, 6.215478897094727, -84.66380310058594, -5.206398010253906, -102.10065460205078, 94.31175231933594, -1.1247386932373047, -54.003662109375, 0.4569816589355469, -67.16636657714844, -30.980926513671875, 65.93285369873047, 73.53195190429688, 144.24522399902344, 121.3329086303711, 56.7385368347168, 176.58737182617188, 167.68814086914062, -163.2166290283203, 38.399192810058594, -25.04615020751953, -58.64289855957031, -133.16029357910156, 95.28784942626953, 48.74352264404297, 112.21635437011719, -37.13878631591797, 114.15925598144531, 132.7831573486328, 56.628379821777344, 135.52308654785156, -41.2927360534668, 8.612930297851562, -149.8901824951172, 184.87918090820312], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000571.npy"} +{"epoch": 0.8631897203325775, "step": 572, "batch_size": 64, "mean": 55.10819625854492, "std": 81.37066650390625, "min": -114.9002685546875, "p10": -51.52134552001952, "median": 48.92620086669922, "p90": 165.68453063964844, "max": 202.38958740234375, "pos_frac": 0.734375, "sample": [8.591102600097656, -70.29795837402344, 5.759925842285156, 88.98072052001953, 149.25538635253906, 47.20207214355469, 163.28594970703125, 54.36119079589844, -11.279956817626953, 190.75521850585938, -16.039077758789062, 106.60930633544922, 161.56082153320312, 172.70849609375, -25.46187973022461, 166.71249389648438, -55.690093994140625, 17.343820571899414, 26.415143966674805, 118.45314025878906, 82.71836853027344, 16.576629638671875, 77.49473571777344, 161.29891967773438, 158.55862426757812, 60.940185546875, -23.374984741210938, 86.59319305419922, -9.641380310058594, 19.059127807617188, 202.38958740234375, 167.33909606933594, 170.11883544921875, -114.9002685546875, 114.98116302490234, 54.046390533447266, 50.65032958984375, -58.21441650390625, 8.421161651611328, 91.70503997802734, 106.90050506591797, -0.31288719177246094, 122.5787124633789, 134.51632690429688, 35.32476806640625, 125.05989837646484, 27.600830078125, -92.34452819824219, 196.39767456054688, 15.215408325195312, 80.30387878417969, 135.96197509765625, -24.245590209960938, 29.435630798339844, -93.79434204101562, -41.79426574707031, 33.091712951660156, 76.98747253417969, -18.611679077148438, -101.33670043945312, 132.6220703125, -0.7972812652587891, 14.610509872436523, 17.568246841430664], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000572.npy"} +{"epoch": 0.8647014361300076, "step": 573, "batch_size": 64, "mean": 59.32253646850586, "std": 108.12000274658203, "min": -199.74087524414062, "p10": -54.765569305419916, "median": 55.876712799072266, "p90": 215.2652008056641, "max": 326.71478271484375, "pos_frac": 0.71875, "sample": [45.94602966308594, 98.6260757446289, -162.9140167236328, 165.7021026611328, -49.450035095214844, 52.3592529296875, -6.612482070922852, 29.85968780517578, 72.61538696289062, -57.04365539550781, -169.2751007080078, -135.0889892578125, -16.158864974975586, -4.2398681640625, -26.052703857421875, 148.85443115234375, -25.587875366210938, 17.164459228515625, 186.65744018554688, -199.74087524414062, 59.39417266845703, 59.56029510498047, 205.28253173828125, 69.93134307861328, -16.942901611328125, 17.271503448486328, 326.71478271484375, 7.571300506591797, 144.6983642578125, 69.11260223388672, 25.924392700195312, 32.067626953125, 85.20372009277344, 42.49952697753906, 160.5478515625, 25.48110580444336, 110.33291625976562, 63.28603744506836, 36.294227600097656, 254.96826171875, 156.14886474609375, 144.6143035888672, 140.9949188232422, -4.199235916137695, -42.93254089355469, 79.9343490600586, 233.49021911621094, 31.337692260742188, 28.623313903808594, 74.48827362060547, 221.59375, 244.804931640625, 60.095367431640625, 115.52539825439453, -5.122337341308594, -100.92799377441406, 292.36676025390625, -44.33849334716797, 62.14211654663086, 87.28418731689453, 111.00125122070312, 35.347389221191406, -89.99360656738281, 219.54348754882812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000573.npy"} +{"epoch": 0.8662131519274376, "step": 574, "batch_size": 64, "mean": 73.88447570800781, "std": 79.74378204345703, "min": -108.61060333251953, "p10": -11.155338287353514, "median": 68.01949310302734, "p90": 182.58799133300784, "max": 347.0589904785156, "pos_frac": 0.8125, "sample": [56.35466766357422, -31.10118865966797, -14.183204650878906, -108.61060333251953, 98.79153442382812, 110.41837310791016, 32.92462158203125, 22.614044189453125, 9.252557754516602, -20.64354705810547, -9.447555541992188, 102.10307312011719, 10.959518432617188, 25.150346755981445, -8.686515808105469, 3.5128936767578125, -2.435710906982422, 71.77827453613281, 52.967323303222656, 101.90774536132812, 155.99606323242188, 42.452598571777344, 64.26071166992188, 129.88555908203125, -7.522621154785156, 201.15492248535156, 59.205665588378906, 155.0089874267578, 0.2588214874267578, 185.11199951171875, 116.94879150390625, -0.2818450927734375, 72.49588012695312, 40.01164245605469, 136.14407348632812, 119.4793701171875, -73.23355865478516, 120.12315368652344, 186.25537109375, 5.218446731567383, 94.44520568847656, 30.722900390625, 176.69863891601562, 149.95278930664062, 127.50457763671875, 187.110595703125, 104.38853454589844, 111.985595703125, 79.56669616699219, 22.60411834716797, -14.648834228515625, 189.13514709472656, 11.79888916015625, 103.18360137939453, 96.84136199951172, 15.893577575683594, 54.47390365600586, 170.80474853515625, 151.43521118164062, 194.96311950683594, -11.887245178222656, 117.98902893066406, 347.0589904785156, 3.9847869873046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000574.npy"} +{"epoch": 0.8677248677248677, "step": 575, "batch_size": 64, "mean": 50.93318557739258, "std": 102.96333312988281, "min": -167.50735473632812, "p10": -81.42034912109375, "median": 34.214393615722656, "p90": 187.0608627319336, "max": 297.74029541015625, "pos_frac": 0.703125, "sample": [66.69805145263672, -121.76756286621094, -152.5753173828125, -9.22252082824707, 297.74029541015625, 90.796875, -18.94019317626953, 100.56305694580078, 14.528121948242188, -23.79343032836914, 108.16703796386719, -69.13530731201172, 204.93788146972656, -37.01237106323242, -112.08491516113281, 105.47630310058594, -94.77974700927734, 109.751953125, 3.5571517944335938, 13.934303283691406, 44.64954376220703, 183.0802001953125, 126.58898162841797, 19.357452392578125, -1.4555892944335938, 20.273147583007812, -120.49240112304688, 116.3652572631836, 181.90872192382812, 6.133445739746094, 15.79438591003418, 53.526222229003906, 188.76686096191406, 258.71893310546875, 156.7594451904297, -82.9161376953125, 214.56890869140625, 0.4359283447265625, 225.837158203125, 145.5880126953125, -7.6589813232421875, 34.317291259765625, 61.212806701660156, 36.88153076171875, 12.863784790039062, -11.754463195800781, 34.11149597167969, -167.50735473632812, 69.59979248046875, 275.0831604003906, 177.5114288330078, 85.34913635253906, 33.20841979980469, 43.15444564819336, -77.93017578125, 28.795494079589844, 70.49397277832031, -14.316661834716797, 25.0457706451416, 118.77542114257812, -29.42058563232422, 144.23196411132812, 113.11508178710938, -25.767017364501953], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000575.npy"} +{"epoch": 0.8692365835222978, "step": 576, "batch_size": 64, "mean": 75.7958984375, "std": 94.43069458007812, "min": -187.0516815185547, "p10": -30.875739479064936, "median": 54.21706771850586, "p90": 193.55815734863282, "max": 286.74749755859375, "pos_frac": 0.75, "sample": [41.334747314453125, 160.2567901611328, -10.934829711914062, 52.827911376953125, 170.16680908203125, 53.69795227050781, 186.32533264160156, 31.2084903717041, 81.48919677734375, 115.55235290527344, -25.94991111755371, -67.01657104492188, 173.57252502441406, -43.811737060546875, 91.21392059326172, -100.79072570800781, -39.625267028808594, 157.1886749267578, 286.74749755859375, 136.85223388671875, 173.07322692871094, 210.4500732421875, 103.05079650878906, 4.458127975463867, 122.44602966308594, 85.2952880859375, 33.12433624267578, -46.333534240722656, 245.20343017578125, -32.98680877685547, 38.61750793457031, 22.06623077392578, 51.0743408203125, 176.33612060546875, 67.06716918945312, 42.317901611328125, 236.04808044433594, -14.633285522460938, -5.1962890625, 18.436439514160156, 171.5641326904297, -13.012706756591797, 165.4590301513672, 16.834394454956055, 191.01303100585938, -8.800582885742188, 197.1878204345703, 150.91676330566406, -4.701261520385742, 194.64892578125, 179.7576141357422, -187.0516815185547, 203.5562286376953, 133.98670959472656, 54.736183166503906, 143.65501403808594, -18.53629493713379, -4.583831787109375, 44.99683380126953, 88.90483093261719, 1.6134777069091797, 34.990196228027344, 24.39763641357422, 109.18424987792969], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000576.npy"} +{"epoch": 0.8707482993197279, "step": 577, "batch_size": 64, "mean": 52.36536407470703, "std": 92.2142105102539, "min": -184.07467651367188, "p10": -41.241367721557616, "median": 44.80608558654785, "p90": 176.9465515136719, "max": 249.907958984375, "pos_frac": 0.75, "sample": [47.01167297363281, 10.2457275390625, 16.436927795410156, 50.64338684082031, 1.6721343994140625, 84.82460021972656, 15.876636505126953, -23.95457649230957, 209.31671142578125, -10.019248962402344, -31.803382873535156, 168.00799560546875, 134.05514526367188, -37.3448486328125, -77.52044677734375, 190.99691772460938, 179.6883544921875, 170.54901123046875, -151.23208618164062, 102.22087097167969, 188.5010223388672, 88.43091583251953, 15.70211410522461, 153.0684814453125, 18.004806518554688, -80.67881774902344, -119.45729064941406, 125.89053344726562, 127.7752914428711, 89.39584350585938, -1.4202880859375, 152.03750610351562, -27.952117919921875, 50.16877746582031, 40.868988037109375, -7.947898864746094, 69.78964233398438, 30.395050048828125, 47.042259216308594, 2.756397247314453, 37.11577606201172, 41.3525390625, 170.0208740234375, 6.120145797729492, 185.26718139648438, 249.907958984375, -172.9246826171875, 71.67512512207031, 57.05744934082031, 76.47186279296875, -4.1479644775390625, 102.85067749023438, 180.7421875, 166.18719482421875, 33.74592590332031, 42.60049819946289, -184.07467651367188, -10.493776321411133, -42.91130447387695, 119.76811981201172, 17.353309631347656, 86.63514709472656, 83.33126831054688, 25.689712524414062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000577.npy"} +{"epoch": 0.872260015117158, "step": 578, "batch_size": 64, "mean": 48.02423095703125, "std": 95.07792663574219, "min": -170.6879119873047, "p10": -58.12692756652831, "median": 31.183334350585938, "p90": 171.16403350830078, "max": 315.28448486328125, "pos_frac": 0.640625, "sample": [83.48878479003906, -42.398162841796875, 74.99797058105469, 48.480499267578125, 74.27190399169922, -36.0191650390625, 81.73860168457031, 18.964004516601562, 127.45893859863281, 1.9197101593017578, -0.1507568359375, 315.28448486328125, -12.364242553710938, 99.97750854492188, 160.64964294433594, -170.6879119873047, 149.30821228027344, 167.7663116455078, 117.7454605102539, 113.84133911132812, 156.77923583984375, 83.96942138671875, 11.557046890258789, 6.567371368408203, 2.302328109741211, 74.92874908447266, 171.7069091796875, -4.472755432128906, 78.74098205566406, -7.276237487792969, 203.10354614257812, 143.35223388671875, 179.94342041015625, -91.15914916992188, -33.97840118408203, 29.570297241210938, 1.8224620819091797, 100.27369689941406, 53.563499450683594, 69.50875091552734, 150.29859924316406, -120.35751342773438, 32.79637145996094, -47.098854064941406, -13.057998657226562, -0.583709716796875, -28.90929412841797, 169.89732360839844, -62.85324478149414, 194.706787109375, 85.8904800415039, -80.40308380126953, 233.29527282714844, -6.05180549621582, -42.415191650390625, -82.98307800292969, 20.340499877929688, 48.045310974121094, -23.626487731933594, 2.7871837615966797, -31.955318450927734, -5.418037414550781, -113.19219207763672, 189.32223510742188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000578.npy"} +{"epoch": 0.873771730914588, "step": 579, "batch_size": 64, "mean": 74.7949447631836, "std": 81.45682525634766, "min": -143.1686248779297, "p10": -19.149705505371088, "median": 68.56473541259766, "p90": 182.01701965332032, "max": 240.75050354003906, "pos_frac": 0.796875, "sample": [97.82750701904297, 73.27081298828125, 61.66138458251953, 44.43390655517578, 39.054527282714844, -111.62014770507812, 183.54002380371094, 51.90840148925781, 117.27774047851562, 240.75050354003906, 119.91201782226562, 172.77877807617188, 115.19696044921875, 191.88485717773438, 109.777587890625, 24.90058135986328, 170.63656616210938, -33.05686950683594, -11.638648986816406, 129.79759216308594, 218.44580078125, -55.74998092651367, 175.0727081298828, -4.61982536315918, 68.24436950683594, 113.47109985351562, 191.42465209960938, 22.31451416015625, 179.80931091308594, 147.35768127441406, -41.677772521972656, 50.340614318847656, 128.9044189453125, 9.250070571899414, 112.93280792236328, 116.83001708984375, 56.22119140625, -2.212186813354492, -3.4300689697265625, 175.99803161621094, -11.88232421875, 55.615455627441406, -10.669876098632812, 1.1902694702148438, 68.88510131835938, 6.273042678833008, -22.264297485351562, -143.1686248779297, 188.55059814453125, 139.06039428710938, 83.22772216796875, 114.99256896972656, 51.73785400390625, 182.9631805419922, 100.34515380859375, 11.215017318725586, 128.78135681152344, 141.10617065429688, 39.312110900878906, 67.84825134277344, -51.70005798339844, 23.95113754272461, 121.5469741821289, 52.73768997192383], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000579.npy"} +{"epoch": 0.8752834467120182, "step": 580, "batch_size": 64, "mean": 59.434383392333984, "std": 104.31442260742188, "min": -168.576904296875, "p10": -56.67549667358398, "median": 54.91040802001953, "p90": 210.58298950195316, "max": 278.81817626953125, "pos_frac": 0.671875, "sample": [-92.79853820800781, -64.48309326171875, -13.482086181640625, 16.531415939331055, -36.40582275390625, 56.18389892578125, 170.42259216308594, 86.08111572265625, 69.45242309570312, 23.98535919189453, 194.9797821044922, 82.1347885131836, 24.08245849609375, -2.340618133544922, -54.00824737548828, 59.7723388671875, 141.47264099121094, 103.82575225830078, 1.4906139373779297, 36.16984558105469, -4.278728485107422, 104.01823425292969, 231.7744140625, 59.41095733642578, 89.7790756225586, -29.620635986328125, 244.34576416015625, -8.202392578125, -3.5065059661865234, 217.361083984375, 202.353759765625, 186.8109893798828, -0.6776504516601562, 118.26378631591797, -29.758438110351562, 183.87835693359375, -40.60319137573242, -168.576904296875, 17.38198471069336, 278.81817626953125, -158.58094787597656, 33.53509521484375, -57.818603515625, 125.1544189453125, 246.98509216308594, -33.47528076171875, 42.31633758544922, 53.63691711425781, 214.10980224609375, 111.24799346923828, 105.58905029296875, 140.19869995117188, -40.896812438964844, -128.99034118652344, 22.70969009399414, -31.996301651000977, 85.37617492675781, 120.3430404663086, 94.86163330078125, 269.3338317871094, 43.929901123046875, -116.04393005371094, 88.57508850097656, 121.66130065917969], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000580.npy"} +{"epoch": 0.8767951625094482, "step": 581, "batch_size": 64, "mean": 56.961395263671875, "std": 95.27515411376953, "min": -124.76156616210938, "p10": -66.37806396484375, "median": 48.950246810913086, "p90": 177.14951934814457, "max": 316.6584167480469, "pos_frac": 0.703125, "sample": [139.26693725585938, 169.8446044921875, 26.084129333496094, 6.818164825439453, 80.59159851074219, 15.3214111328125, -9.100433349609375, -64.92837524414062, 90.67218017578125, 90.9645767211914, -95.5440673828125, 18.094158172607422, 24.214895248413086, 44.381797790527344, 128.70980834960938, -67.4905014038086, 137.93191528320312, 53.02082061767578, 119.2425537109375, 18.851133346557617, 146.6810760498047, 23.115020751953125, 184.75857543945312, -20.446044921875, 221.4171600341797, 193.08444213867188, 144.34976196289062, -27.26690673828125, 45.27936553955078, 81.9932861328125, -35.6514892578125, 122.40003204345703, 35.57639694213867, 140.86474609375, 77.90933990478516, 117.90447998046875, 58.05839538574219, -120.18283081054688, 246.91859436035156, 186.015625, -27.678863525390625, -124.76156616210938, 96.02323913574219, 14.500869750976562, 91.591064453125, -88.50811767578125, 316.6584167480469, -12.565399169921875, -12.160877227783203, -118.62611389160156, 145.79656982421875, -30.47003936767578, 99.19471740722656, 131.57672119140625, 21.051166534423828, 137.59971618652344, -2.3610687255859375, -66.99935913085938, -63.629638671875, 52.62112808227539, 28.55230712890625, 165.05624389648438, 180.2801971435547, -36.938323974609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000581.npy"} +{"epoch": 0.8783068783068783, "step": 582, "batch_size": 64, "mean": 57.9677734375, "std": 89.7421875, "min": -137.7101593017578, "p10": -35.69066467285156, "median": 41.66208076477051, "p90": 175.07067871093753, "max": 300.4955749511719, "pos_frac": 0.734375, "sample": [114.2527847290039, 179.70928955078125, 23.16071319580078, 117.72378540039062, 11.275527954101562, 27.273967742919922, 196.3385772705078, 56.38821792602539, 136.3436737060547, 148.6827392578125, 71.75762939453125, 56.050193786621094, 159.8744354248047, 300.4955749511719, -42.717987060546875, 177.5403594970703, -35.552215576171875, -3.9433135986328125, 71.82221984863281, 137.56900024414062, -3.1334762573242188, 121.0391616821289, 12.648242950439453, 203.93978881835938, 151.76611328125, 191.5835418701172, 8.998422622680664, 7.268487930297852, -97.07925415039062, -137.7101593017578, -5.958913803100586, 20.3623046875, 111.6482162475586, -29.293807983398438, -28.178564071655273, 118.13922119140625, 133.3840789794922, 71.51689147949219, 188.7635498046875, 7.786388397216797, 104.77105712890625, 83.17240905761719, 73.77703094482422, 12.00920295715332, -3.138124465942383, -10.896102905273438, -60.74317169189453, 117.0507583618164, 9.518241882324219, -137.144775390625, 3.0849170684814453, 19.98126983642578, 0.6819114685058594, 0.9609527587890625, -68.0859603881836, 67.32081604003906, 153.10223388671875, -30.40802764892578, 167.7394256591797, -30.034378051757812, -35.75, 11.238441467285156, 140.88577270507812, 169.30809020996094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000582.npy"} +{"epoch": 0.8798185941043084, "step": 583, "batch_size": 64, "mean": 67.69149780273438, "std": 102.54582977294922, "min": -188.1800994873047, "p10": -45.87504272460937, "median": 67.52604675292969, "p90": 195.49888000488284, "max": 246.28421020507812, "pos_frac": 0.6875, "sample": [68.46258544921875, -18.855995178222656, -21.45349884033203, -13.062664031982422, 175.9453887939453, 82.10255432128906, -48.54906463623047, -50.17753601074219, -115.2999496459961, -8.853103637695312, 183.2462615966797, -28.894100189208984, -30.280635833740234, 137.92185974121094, 57.70815658569336, -39.635658264160156, 67.36058044433594, -3.490537643432617, 196.54678344726562, 159.1982879638672, 56.18208312988281, -127.96295928955078, 134.2206268310547, 8.471702575683594, 120.90534973144531, 114.38203430175781, 246.28421020507812, -164.9547576904297, 30.42813491821289, 166.78070068359375, 67.69151306152344, 43.61204528808594, -10.946884155273438, 38.82121276855469, 188.50534057617188, 213.5225067138672, -29.885971069335938, -29.707374572753906, 171.8638916015625, 175.78260803222656, 57.608760833740234, 214.64755249023438, -188.1800994873047, 240.54278564453125, 2.086282730102539, 130.92822265625, 133.48257446289062, 84.44292449951172, 113.2177963256836, -14.320426940917969, 214.32757568359375, 101.3508071899414, 176.99143981933594, 12.20408821105957, 97.89356994628906, 164.03900146484375, -67.4123306274414, 103.50992584228516, -2.40777587890625, 165.1239776611328, 202.04212951660156, 193.05377197265625, 29.905929565429688, 3.2416534423828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000583.npy"} +{"epoch": 0.8813303099017384, "step": 584, "batch_size": 64, "mean": 58.68948745727539, "std": 104.4764633178711, "min": -163.03944396972656, "p10": -70.8064971923828, "median": 44.013824462890625, "p90": 195.89686279296876, "max": 264.44061279296875, "pos_frac": 0.671875, "sample": [198.32723999023438, 190.22598266601562, 69.1429443359375, -10.315238952636719, 53.04212951660156, -9.557489395141602, 228.5467529296875, 189.28128051757812, 126.03057098388672, 132.94664001464844, 99.47085571289062, -12.78758430480957, -10.453325271606445, -58.80120086669922, -107.3924560546875, 90.30493927001953, 93.6561050415039, 187.7429656982422, 164.2783203125, -14.98055648803711, 148.02252197265625, 219.86427307128906, -6.129203796386719, 146.3571014404297, 223.78738403320312, 163.84872436523438, 73.06769561767578, 22.304054260253906, 32.210487365722656, 18.83001708984375, 179.76873779296875, -59.28208923339844, 115.51831817626953, 33.533172607421875, -98.8551025390625, 180.17868041992188, -36.94804382324219, -32.9571533203125, -11.120643615722656, -30.362638473510742, 12.024242401123047, 91.56754302978516, -75.74552917480469, 53.478721618652344, 81.2549819946289, 234.47967529296875, 2.070650100708008, 55.50233459472656, 94.35652923583984, -85.62688446044922, -162.1383056640625, 32.32034683227539, -41.37110137939453, 171.894287109375, -0.3062744140625, 264.44061279296875, 236.40890502929688, 8.396211624145508, 8.429258346557617, 34.98551940917969, 21.074607849121094, 116.4656982421875, -115.14045715332031, -163.03944396972656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000584.npy"} +{"epoch": 0.8828420256991686, "step": 585, "batch_size": 64, "mean": 45.5220832824707, "std": 89.0029067993164, "min": -224.0035400390625, "p10": -24.43485488891601, "median": 32.2180290222168, "p90": 171.85222473144535, "max": 290.7920837402344, "pos_frac": 0.765625, "sample": [31.946308135986328, 122.26298522949219, 37.6114501953125, -3.5464630126953125, 65.3324966430664, 65.01435852050781, 56.60221862792969, 163.25494384765625, -9.347335815429688, 7.141624450683594, -168.36761474609375, 20.708248138427734, 135.350830078125, 20.549530029296875, 0.6683540344238281, 290.7920837402344, -117.03363037109375, -6.376792907714844, 59.40779113769531, 102.32528686523438, 105.61105346679688, 16.113088607788086, -7.55006217956543, -99.41322326660156, 8.246744155883789, 35.868675231933594, -18.159461975097656, 10.073753356933594, 141.4281463623047, 112.54068756103516, 4.857242584228516, 6.761627197265625, 43.15205764770508, -6.175395965576172, -132.2924041748047, 11.970222473144531, 12.59295654296875, 132.22003173828125, 179.39471435546875, 105.96139526367188, 33.08479690551758, 133.63711547851562, 73.44943237304688, -53.70146942138672, -224.0035400390625, 192.29556274414062, 196.17153930664062, 180.96273803710938, -26.95452117919922, -17.85155487060547, 32.03749084472656, 30.45685577392578, -18.555633544921875, 14.14512825012207, 32.39856719970703, 79.2975082397461, 89.19534301757812, 175.53677368164062, 181.78529357910156, 91.15768432617188, 70.08863067626953, 25.471099853515625, 70.8445053100586, 14.965293884277344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000585.npy"} +{"epoch": 0.8843537414965986, "step": 586, "batch_size": 64, "mean": 60.64173889160156, "std": 72.92900085449219, "min": -80.532470703125, "p10": -16.27133445739746, "median": 39.170833587646484, "p90": 175.26744689941407, "max": 222.08702087402344, "pos_frac": 0.765625, "sample": [100.05020141601562, 19.45587921142578, 131.55523681640625, 52.39727020263672, 36.173797607421875, 142.9855499267578, 36.83638000488281, 11.216575622558594, -1.1809005737304688, -16.13526725769043, 100.2231674194336, -18.482620239257812, 9.089706420898438, 215.79293823242188, 183.27903747558594, -16.329648971557617, 100.7628173828125, 107.14372253417969, 55.956153869628906, 115.69132232666016, 18.581249237060547, 85.02706146240234, 25.750919342041016, 174.589599609375, 23.122886657714844, -2.8612117767333984, -5.311790466308594, 17.830291748046875, 137.33541870117188, 59.753841400146484, 142.86825561523438, 112.64108276367188, 52.503990173339844, 55.55668258666992, 184.66590881347656, 6.7771148681640625, -80.532470703125, 215.23904418945312, -2.7733726501464844, 8.271276473999023, 7.304948806762695, 21.310577392578125, -21.274444580078125, 118.58065795898438, 79.72148132324219, -10.666988372802734, -0.7939834594726562, 62.73828125, -4.667877197265625, 102.20269775390625, 222.08702087402344, -37.46965026855469, 15.214187622070312, 38.28074645996094, 175.83193969726562, 40.06092071533203, -76.8640365600586, 175.55795288085938, 15.013076782226562, -18.176376342773438, 166.310302734375, 28.866130828857422, 112.70027923583984, 73.68626403808594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000586.npy"} +{"epoch": 0.8858654572940288, "step": 587, "batch_size": 64, "mean": 60.2142219543457, "std": 115.20861053466797, "min": -426.6921081542969, "p10": -58.092468643188475, "median": 71.50548553466797, "p90": 184.1443801879883, "max": 281.0702819824219, "pos_frac": 0.734375, "sample": [39.79544448852539, -133.07545471191406, -3.2683486938476562, 113.77531433105469, 151.64468383789062, -84.45625305175781, 62.2809944152832, -42.727783203125, 159.86788940429688, 103.71937561035156, 16.788227081298828, 92.08368682861328, -58.551025390625, -2.8558807373046875, -1.3138427734375, 65.45210266113281, 133.84727478027344, -5.356605529785156, -17.676742553710938, 208.63499450683594, 166.26976013183594, 117.30076599121094, -0.5020980834960938, 187.7748260498047, 97.16485595703125, 54.08112335205078, 201.44757080078125, 15.386703491210938, -426.6921081542969, 1.7226066589355469, 83.02690887451172, 87.73780822753906, 104.44746398925781, 117.34727478027344, 27.164867401123047, 87.6724853515625, 100.29447937011719, -249.4022674560547, -68.03521728515625, 268.9059753417969, 161.19644165039062, -17.57320785522461, 154.44281005859375, 105.35768127441406, 4.256315231323242, 144.91806030273438, 12.819725036621094, 172.06649780273438, 152.70452880859375, 94.32228088378906, 207.2003631591797, -95.9324722290039, 128.84649658203125, 11.635139465332031, 63.141845703125, 220.9785614013672, 23.055015563964844, -12.211372375488281, -57.02250289916992, 68.58319854736328, 74.42777252197266, 281.0702819824219, 175.67333984375, 8.031425476074219], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000587.npy"} +{"epoch": 0.8873771730914588, "step": 588, "batch_size": 64, "mean": 64.5030517578125, "std": 100.4663314819336, "min": -141.32427978515625, "p10": -58.49918327331542, "median": 65.21704864501953, "p90": 186.06985015869142, "max": 303.35186767578125, "pos_frac": 0.78125, "sample": [76.37406921386719, -66.77299499511719, -38.53748321533203, 136.76547241210938, 1.2954864501953125, 141.05984497070312, 166.19503784179688, 44.18266296386719, 161.38485717773438, 131.7276611328125, 274.36669921875, 41.98704528808594, 34.398345947265625, 96.60790252685547, 42.632362365722656, 111.18560791015625, 203.15335083007812, 296.3914489746094, 27.318693161010742, 303.35186767578125, 73.98172760009766, 131.26510620117188, -47.55466842651367, 181.21432495117188, 4.742303848266602, 84.26730346679688, 49.34501647949219, -28.24066925048828, 4.0578155517578125, -113.35769653320312, 5.836694717407227, 90.8129653930664, -124.25725555419922, 103.94941711425781, 110.91747283935547, 201.9605712890625, 6.486391067504883, 98.84201049804688, 72.57882690429688, -30.492530822753906, -40.34258270263672, -41.004058837890625, 68.7143325805664, 187.22850036621094, 126.87055206298828, 63.73976135253906, 157.48757934570312, -3.3829307556152344, 26.473770141601562, 132.1253204345703, 26.905059814453125, -130.27432250976562, 30.623748779296875, 46.35022735595703, 75.45643615722656, 66.6943359375, -63.18968963623047, 23.124717712402344, 48.107269287109375, -133.849365234375, 151.36915588378906, 205.50244140625, 183.3663330078125, -141.32427978515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000588.npy"} +{"epoch": 0.8888888888888888, "step": 589, "batch_size": 64, "mean": 67.54927825927734, "std": 79.1126937866211, "min": -113.11709594726562, "p10": -26.826406478881832, "median": 69.63813781738281, "p90": 167.88420410156252, "max": 284.55145263671875, "pos_frac": 0.78125, "sample": [34.323486328125, 48.723594665527344, -110.11119079589844, 184.2237548828125, 76.78083038330078, 2.0011138916015625, -39.631072998046875, -10.168670654296875, 15.985206604003906, -1.392791748046875, -36.24055480957031, 36.79844665527344, 284.55145263671875, 5.440723419189453, 143.3730926513672, 69.23277282714844, 90.44831085205078, 129.82505798339844, 133.6206817626953, 118.25934600830078, 70.04350280761719, 103.98611450195312, 158.45680236816406, -72.61058044433594, 187.2169952392578, 105.17071533203125, -31.282997131347656, 118.0873031616211, 130.072509765625, 117.01553344726562, 65.38893127441406, -8.25997543334961, 165.9566192626953, 48.50856018066406, -23.754013061523438, 78.19303894042969, 52.33220672607422, 28.97838592529297, 70.72063446044922, 182.5858917236328, 40.303131103515625, 103.89485168457031, 171.66311645507812, 93.36104583740234, 74.65850830078125, -3.860992431640625, 113.55420684814453, -28.143146514892578, -18.66231918334961, 27.091934204101562, -113.11709594726562, 122.4347915649414, 163.49432373046875, -8.048301696777344, 57.332618713378906, 168.71031188964844, 120.88327026367188, 113.40408325195312, 18.50902557373047, 28.63080596923828, 72.349609375, 40.1777229309082, 236.366455078125, 5.315958023071289], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000589.npy"} +{"epoch": 0.890400604686319, "step": 590, "batch_size": 64, "mean": 65.18154907226562, "std": 87.85477447509766, "min": -165.67462158203125, "p10": -34.40607528686523, "median": 59.382362365722656, "p90": 180.65586395263674, "max": 233.45663452148438, "pos_frac": 0.78125, "sample": [95.1212387084961, 38.68561553955078, 99.82801055908203, 6.512260437011719, 147.59063720703125, 164.1497802734375, 93.77264404296875, -137.87188720703125, 35.1345329284668, -12.164482116699219, 39.896697998046875, 2.4379920959472656, 9.0389404296875, 41.33625030517578, -165.67462158203125, 139.64340209960938, 150.99815368652344, 84.71768188476562, -22.211284637451172, 0.7546234130859375, -39.33599853515625, 136.21774291992188, 4.946510314941406, 183.14920043945312, 190.1086883544922, -15.930030822753906, -28.682846069335938, 60.14991760253906, 225.2613525390625, 62.9588623046875, -29.009300231933594, 170.69674682617188, 18.776304244995117, 12.9534912109375, 137.6346893310547, 84.31352233886719, 78.96500396728516, 12.911056518554688, 58.61480712890625, 14.953536987304688, 197.46585083007812, 103.2491683959961, 233.45663452148438, 157.20040893554688, 173.41259765625, 94.87373352050781, 91.1920166015625, 160.22262573242188, -36.71897888183594, 56.76057434082031, -39.63116455078125, 186.60394287109375, 119.29141235351562, -25.946365356445312, 2.3349456787109375, 172.3592529296875, 39.157989501953125, 66.0348129272461, 181.61529541015625, -5.144664764404297, 47.13357925415039, -39.36204528808594, 178.4171905517578, -93.70852661132812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000590.npy"} +{"epoch": 0.891912320483749, "step": 591, "batch_size": 64, "mean": 79.55722045898438, "std": 110.15702819824219, "min": -151.52456665039062, "p10": -77.2550811767578, "median": 78.5546646118164, "p90": 201.29747314453127, "max": 368.02069091796875, "pos_frac": 0.796875, "sample": [1.7173595428466797, 190.61163330078125, 129.4009246826172, 152.2986602783203, 145.70523071289062, 64.198974609375, 183.27117919921875, 85.76152038574219, 81.02687072753906, 104.01948547363281, 50.52601623535156, -103.13616943359375, 164.59661865234375, -93.73145294189453, 110.73539733886719, -20.528594970703125, 50.715850830078125, 60.37872314453125, 107.76828002929688, 18.686939239501953, 150.36788940429688, 76.08245849609375, 278.2812194824219, -106.25743103027344, 175.7799072265625, -150.86473083496094, 146.82754516601562, 108.14860534667969, 3.83294677734375, 29.66064453125, -151.52456665039062, -130.2066192626953, 245.03173828125, 218.81114196777344, 5.6897430419921875, 193.9374542236328, -13.999271392822266, 50.905120849609375, 178.75692749023438, 14.439517974853516, 4.679145812988281, -14.681411743164062, 60.53302001953125, 161.3001251220703, 0.7029819488525391, 234.64138793945312, -18.107088088989258, -81.088623046875, -14.723762512207031, 368.02069091796875, -68.31015014648438, 13.181190490722656, 231.35525512695312, 41.29674530029297, 34.40653610229492, 191.16006469726562, 183.12930297851562, 116.33961486816406, 158.5496063232422, 100.14585876464844, 204.45176696777344, 185.58607482910156, 11.084707260131836, 180.2852783203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000591.npy"} +{"epoch": 0.8934240362811792, "step": 592, "batch_size": 64, "mean": 61.694923400878906, "std": 91.75536346435547, "min": -89.83296203613281, "p10": -44.313880538940424, "median": 31.85818099975586, "p90": 184.3554214477539, "max": 332.5138854980469, "pos_frac": 0.796875, "sample": [81.28099060058594, 210.24850463867188, 176.96554565429688, 34.195350646972656, 168.29071044921875, 181.21620178222656, 211.48699951171875, 43.446834564208984, 6.80792236328125, 26.145484924316406, -48.196388244628906, 102.63605499267578, 52.43070983886719, 17.044296264648438, -57.63104248046875, 83.71288299560547, 184.11512756347656, 113.61004638671875, 3.4468002319335938, 22.893108367919922, -66.63960266113281, 151.624755859375, 79.72743225097656, 239.1866455078125, 16.202152252197266, 100.87452697753906, 100.14824676513672, 184.45840454101562, 155.6942138671875, 13.911514282226562, -83.27315521240234, 118.89117431640625, -13.648414611816406, 130.86141967773438, 30.154335021972656, 59.32284164428711, -89.83296203613281, 107.77716064453125, -79.07308197021484, -35.23612976074219, -5.835788726806641, 8.65922737121582, 26.278541564941406, 0.3892364501953125, -67.30192565917969, 13.84442138671875, 33.56202697753906, 269.2490234375, 221.2254638671875, 12.287139892578125, 332.5138854980469, -1.0526199340820312, 15.373050689697266, 0.8466339111328125, 29.0799560546875, 5.945013046264648, -21.05352783203125, 5.154762268066406, -35.254695892333984, 38.15645980834961, 72.45790100097656, 22.66893768310547, 103.2386474609375, 132.765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000592.npy"} +{"epoch": 0.8949357520786092, "step": 593, "batch_size": 64, "mean": 63.08100891113281, "std": 96.3347396850586, "min": -191.31942749023438, "p10": -57.63460617065425, "median": 65.56657791137695, "p90": 189.01837463378908, "max": 225.96041870117188, "pos_frac": 0.765625, "sample": [130.28831481933594, 27.17245101928711, 174.1657257080078, 1.10186767578125, 153.40652465820312, -11.1737060546875, 80.40015411376953, -191.31942749023438, 203.66810607910156, 48.28114318847656, 186.54498291015625, 25.138202667236328, 222.83360290527344, 160.9732666015625, 45.75250244140625, 4.396091461181641, 102.71056365966797, 101.31283569335938, 167.48089599609375, 115.74108123779297, 17.227712631225586, 84.21238708496094, 217.97979736328125, 190.07839965820312, -13.071441650390625, -1.1203460693359375, -5.154561996459961, 157.87220764160156, 110.5822525024414, -111.7020263671875, 84.77427673339844, -75.46123504638672, 2.972076416015625, 85.1313247680664, 104.61395263671875, 158.677001953125, 8.11956787109375, -12.4002685546875, 127.34843444824219, -89.32246398925781, -127.1646728515625, -16.039138793945312, 205.19798278808594, -135.05889892578125, 165.52859497070312, 136.3370361328125, 160.07151794433594, 30.782377243041992, -14.956539154052734, 225.96041870117188, 66.84982299804688, -8.767385482788086, 115.2612075805664, 82.62950134277344, 64.28333282470703, -112.9104995727539, 29.987459182739258, 193.12583923339844, 1.1076240539550781, 3.2275466918945312, 25.47662353515625, 40.83551025390625, 13.9639892578125, 101.22283172607422], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000593.npy"} +{"epoch": 0.8964474678760394, "step": 594, "batch_size": 64, "mean": 56.433143615722656, "std": 82.87394714355469, "min": -192.44593811035156, "p10": -47.089403533935545, "median": 58.161712646484375, "p90": 161.3094741821289, "max": 217.72994995117188, "pos_frac": 0.75, "sample": [45.77418899536133, 130.8422088623047, -59.606449127197266, 5.925605773925781, 84.90312194824219, 119.49178314208984, 29.272605895996094, 53.56915283203125, 81.30570983886719, 2.0350112915039062, -46.79754638671875, 7.936412811279297, -19.969070434570312, 114.29722595214844, 20.100244522094727, 1.8191719055175781, -55.054473876953125, -1.3457145690917969, 78.44171142578125, 13.358291625976562, 159.7427520751953, 71.07550048828125, 2.2059078216552734, 142.76205444335938, 191.25994873046875, 114.72286987304688, 161.37644958496094, -47.21448516845703, 157.259765625, -2.1433658599853516, 145.95376586914062, 143.72500610351562, 217.3736572265625, 144.15867614746094, 47.509033203125, -34.89845275878906, -60.37384796142578, 87.65533447265625, 128.07635498046875, -63.59532165527344, 161.1531982421875, 7.524309158325195, 76.26158142089844, 170.50534057617188, 4.243019104003906, 26.91426658630371, 62.1578369140625, 179.40907287597656, -2.926816940307617, 167.420166015625, 70.82110595703125, -192.44593811035156, 97.5087890625, 217.72994995117188, 54.16558837890625, 106.49362182617188, 7.075965881347656, 65.27001953125, 80.29446411132812, -37.70722198486328, 91.17488098144531, -55.00657653808594, -24.47942352294922, -34.7667236328125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000594.npy"} +{"epoch": 0.8979591836734694, "step": 595, "batch_size": 64, "mean": 74.60322570800781, "std": 104.30529022216797, "min": -184.7678985595703, "p10": -41.0871124267578, "median": 67.74566268920898, "p90": 191.9880630493164, "max": 332.3894348144531, "pos_frac": 0.84375, "sample": [-6.299507141113281, 78.48632049560547, 332.3894348144531, 92.0068359375, 0.5850143432617188, 14.274431228637695, 80.62284088134766, 30.963123321533203, 19.661483764648438, 180.7786865234375, 209.29507446289062, 33.17713165283203, 67.89723205566406, -113.18902587890625, 186.41238403320312, 21.674407958984375, 2.595663070678711, 5.516845703125, 186.6677703857422, 31.25272560119629, 38.624961853027344, 86.91322326660156, 219.9769744873047, 26.803916931152344, 255.8966064453125, 45.05127716064453, 96.78710174560547, 90.19317626953125, 166.3977813720703, 134.6415557861328, -4.089744567871094, -88.90428161621094, 67.5940933227539, -48.372650146484375, 168.0777587890625, 173.9966278076172, 225.7961883544922, -128.446044921875, -184.7678985595703, 210.40850830078125, 192.00559997558594, 184.2423553466797, 112.29974365234375, 67.12680053710938, -92.36428833007812, 189.12815856933594, 80.7711181640625, 113.69474792480469, -24.0875244140625, 25.780841827392578, 2.2390689849853516, 191.9471435546875, 105.5738525390625, 26.903907775878906, 2.9493560791015625, 43.21900939941406, 184.65721130371094, 144.2724609375, 44.340423583984375, 6.520111083984375, 2.4644832611083984, -169.9630584716797, 169.94740295410156, 163.58958435058594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000595.npy"} +{"epoch": 0.8994708994708994, "step": 596, "batch_size": 64, "mean": 34.332279205322266, "std": 85.6504135131836, "min": -170.12046813964844, "p10": -54.37115707397461, "median": 20.612533569335938, "p90": 175.1317886352539, "max": 233.6710968017578, "pos_frac": 0.59375, "sample": [-78.9764404296875, 29.67815399169922, 200.6404571533203, 33.459022521972656, 47.75141143798828, -57.68846893310547, -13.025394439697266, 15.867149353027344, -39.39167022705078, 183.78436279296875, -88.99168395996094, 44.23491287231445, -87.92892456054688, -24.845733642578125, 233.6710968017578, 174.3127899169922, 147.97906494140625, 52.66814041137695, -102.5416259765625, 37.00574493408203, -31.08319091796875, 175.4827880859375, 45.13360595703125, 99.1265869140625, 189.0868682861328, 162.23216247558594, 75.32262420654297, -27.450963973999023, 54.13286590576172, -56.098480224609375, -33.54581069946289, 64.83132934570312, 28.252761840820312, 7.903802871704102, 70.59293365478516, -0.6516532897949219, 41.98950958251953, 225.46607971191406, 9.26772689819336, -28.741905212402344, 22.644561767578125, -0.47988128662109375, 5.776561737060547, -170.12046813964844, -18.335006713867188, -3.292400360107422, 6.31268310546875, -16.500301361083984, 195.09017944335938, 87.47369384765625, 110.56642150878906, -9.431121826171875, -26.095703125, -8.537132263183594, -50.340736389160156, 162.0747528076172, 18.58050537109375, 88.38817596435547, -27.615327835083008, 44.91426086425781, 25.152843475341797, 33.83436584472656, -7.7418365478515625, -43.96540069580078], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000596.npy"} +{"epoch": 0.9009826152683296, "step": 597, "batch_size": 64, "mean": 56.015464782714844, "std": 84.86450958251953, "min": -113.19489288330078, "p10": -46.161081314086914, "median": 37.060434341430664, "p90": 183.11654205322267, "max": 230.1363067626953, "pos_frac": 0.71875, "sample": [-5.628437042236328, -48.488258361816406, -46.42618942260742, -13.316940307617188, 198.27145385742188, -15.3955078125, 34.653629302978516, -84.1038589477539, -38.566001892089844, 190.26205444335938, 0.4821586608886719, 101.74054718017578, 4.318849563598633, 140.31202697753906, -45.54249572753906, 12.034215927124023, 184.00186157226562, 181.05079650878906, 165.43267822265625, -28.547494888305664, 80.85408782958984, 16.394866943359375, -74.453857421875, 29.088302612304688, 136.53924560546875, 135.01300048828125, 11.416837692260742, -49.13786315917969, 140.36370849609375, 8.152856826782227, 120.23420715332031, 39.46723937988281, 191.43817138671875, 49.83570098876953, 73.4519271850586, 52.967342376708984, -18.274581909179688, 93.71200561523438, 43.47019958496094, 145.9130859375, 3.3196678161621094, -79.84487915039062, 10.611137390136719, -8.663434982299805, -3.9112186431884766, -5.853239059448242, 4.614992141723633, 33.09809875488281, 118.30236053466797, 71.78839874267578, 190.52987670898438, 6.820728302001953, 125.88855743408203, -11.434951782226562, -113.19489288330078, 118.71890258789062, 6.074214935302734, 93.98056030273438, 230.1363067626953, 217.97872924804688, 46.25584411621094, 157.47621154785156, 116.06583404541016, 143.240478515625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000597.npy"} +{"epoch": 0.9024943310657596, "step": 598, "batch_size": 64, "mean": 37.18084716796875, "std": 89.4239501953125, "min": -174.1839141845703, "p10": -64.3572006225586, "median": 28.287996292114258, "p90": 162.37207031250003, "max": 273.8683166503906, "pos_frac": 0.65625, "sample": [-6.616472244262695, -82.99446105957031, 23.03166961669922, 32.14366912841797, 73.9437484741211, 3.806377410888672, 12.433128356933594, 183.5967559814453, 149.56666564941406, -174.1839141845703, 45.709129333496094, 53.08543395996094, 26.864429473876953, -49.479766845703125, 146.5118408203125, -34.22290802001953, 220.95867919921875, -66.540771484375, 142.4738311767578, 47.83101272583008, -19.35466957092285, -165.32421875, -49.12870788574219, 99.16290283203125, 29.711563110351562, 36.12348175048828, 45.26359939575195, 70.03741455078125, -2.8541336059570312, -28.312610626220703, -55.542564392089844, -65.67462158203125, 36.04235076904297, 107.9312744140625, 164.27536010742188, -1.1622657775878906, 11.991592407226562, 7.421688079833984, 74.87611389160156, 64.3475341796875, 152.28469848632812, 25.725830078125, -3.251558303833008, 184.21041870117188, 0.674072265625, 114.36915588378906, 44.70027160644531, -2.1491470336914062, 124.04236602783203, 37.72130584716797, -59.110260009765625, -88.56964874267578, 10.202812194824219, 19.9952392578125, 40.11079406738281, -61.28321838378906, 157.93106079101562, 99.59736633300781, -21.92034912109375, -27.19536590576172, 273.8683166503906, 175.41683959960938, -94.0134048461914, 168.46759033203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000598.npy"} +{"epoch": 0.9040060468631897, "step": 599, "batch_size": 64, "mean": 45.02214050292969, "std": 91.29261016845703, "min": -161.39700317382812, "p10": -69.45747680664061, "median": 45.4052619934082, "p90": 172.92162322998047, "max": 270.83258056640625, "pos_frac": 0.625, "sample": [-59.47908020019531, -43.65887451171875, 49.32245635986328, 65.25395965576172, -34.95441436767578, 80.46503448486328, 25.957019805908203, 215.51434326171875, -87.47854614257812, -103.71661376953125, -11.638862609863281, -35.414268493652344, 7.9500579833984375, 76.13005065917969, 129.75711059570312, -19.67053985595703, -119.68589782714844, -3.0420188903808594, 2.327648162841797, -45.4969482421875, 172.9045867919922, 105.14804077148438, 53.936676025390625, -161.39700317382812, 3.0655899047851562, -2.116302490234375, -5.4564056396484375, 177.68231201171875, -73.73393249511719, 43.37165832519531, 210.58204650878906, 161.175537109375, -86.10443878173828, -35.29125213623047, 47.67231369018555, 30.50146484375, 68.80577087402344, -20.21954345703125, 78.67245483398438, 107.24920654296875, 130.9324188232422, -26.030471801757812, 31.984594345092773, -53.615753173828125, 164.96475219726562, 84.96673583984375, 173.35952758789062, -5.2143402099609375, -80.19552612304688, 27.134166717529297, 172.92892456054688, 191.38015747070312, 73.9580078125, 127.92918395996094, 142.4852752685547, 47.438865661621094, 270.83258056640625, 113.90567779541016, 69.05622863769531, -3.803071975708008, -18.085739135742188, 98.97557830810547, 113.49708557128906, 67.74173736572266], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000599.npy"} +{"epoch": 0.9055177626606198, "step": 600, "batch_size": 64, "mean": 53.64229965209961, "std": 92.67742919921875, "min": -150.92849731445312, "p10": -66.19792938232422, "median": 41.089576721191406, "p90": 193.2425918579102, "max": 271.7278137207031, "pos_frac": 0.75, "sample": [125.24447631835938, 54.885032653808594, 3.902467727661133, 14.276779174804688, 199.23297119140625, 24.511199951171875, 40.23220443725586, -97.92882537841797, 164.36473083496094, 207.74012756347656, -12.662910461425781, 11.569324493408203, 100.0833969116211, 126.93214416503906, 7.812530517578125, 8.875795364379883, -36.705108642578125, -72.11466217041016, -74.09603881835938, 167.3065948486328, 20.433490753173828, 63.61918640136719, 139.1930694580078, 109.59373474121094, -36.41960906982422, 221.0832061767578, 96.59139251708984, 177.11032104492188, -18.56475067138672, 161.42446899414062, 199.91079711914062, 24.97608184814453, -150.92849731445312, -17.18647003173828, 76.01852416992188, -95.81935119628906, -60.79833984375, 105.0394515991211, 1.1312217712402344, 271.7278137207031, -5.2577667236328125, 114.69168090820312, 31.274192810058594, 179.65493774414062, -9.174962997436523, 23.003353118896484, -68.51203918457031, -26.91092872619629, -124.0752944946289, 65.89773559570312, 2.05615234375, 90.82746887207031, 47.56446838378906, 33.48590087890625, 88.5751953125, 12.15301513671875, 53.49580383300781, 41.94694900512695, 86.55162048339844, 199.0658721923828, 5.973213195800781, 42.805747985839844, 56.126007080078125, 240.29092407226562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000600.npy"} +{"epoch": 0.9070294784580499, "step": 601, "batch_size": 64, "mean": 71.37797546386719, "std": 101.33892822265625, "min": -156.41090393066406, "p10": -56.87186279296874, "median": 78.63334655761719, "p90": 188.707958984375, "max": 308.283203125, "pos_frac": 0.734375, "sample": [145.76614379882812, 37.98711395263672, 168.84912109375, -70.53857421875, 187.2366943359375, 116.756103515625, 308.283203125, -77.00082397460938, 69.42024230957031, -9.337535858154297, 208.16212463378906, -155.3133087158203, 177.33627319335938, 48.612815856933594, -22.814294815063477, 94.10254669189453, 153.54127502441406, 220.37521362304688, -59.626304626464844, 134.2042236328125, 189.3385009765625, 5.399543762207031, 1.2717742919921875, 168.28076171875, 192.54367065429688, 94.06520080566406, -4.288251876831055, -5.120830535888672, 132.55810546875, 14.700057983398438, 29.34412384033203, 124.45048522949219, 135.26663208007812, -17.36621856689453, -3.6252880096435547, 125.76164245605469, -3.2602310180664062, 99.5211181640625, 55.05134582519531, 21.605886459350586, -85.25923156738281, 87.84645080566406, 12.391033172607422, 167.56268310546875, 90.13140869140625, 102.7230224609375, 47.50887680053711, -50.44483184814453, -22.06296730041504, 36.85554504394531, 0.04965972900390625, 246.80252075195312, -4.182474136352539, 4.050861358642578, 149.64657592773438, 169.83932495117188, 276.71405029296875, 113.32177734375, 169.92340087890625, 0.9631576538085938, -107.00279235839844, 156.05831909179688, 129.6644744873047, -156.41090393066406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000601.npy"} +{"epoch": 0.90854119425548, "step": 602, "batch_size": 64, "mean": 67.2848892211914, "std": 85.53854370117188, "min": -152.57958984375, "p10": -7.2495109558105435, "median": 53.56044960021973, "p90": 179.8467269897461, "max": 285.0884704589844, "pos_frac": 0.84375, "sample": [-15.41998291015625, 131.95361328125, 183.7576904296875, 285.0884704589844, 65.98204040527344, 34.7269287109375, 72.7919921875, 3.9355907440185547, 38.972808837890625, 5.854145050048828, 212.67935180664062, -2.3113670349121094, 179.70484924316406, 162.56979370117188, -88.3228759765625, 179.90753173828125, -134.33709716796875, 208.31881713867188, 134.1066436767578, -4.014659881591797, 6.5112762451171875, -2.5247955322265625, 12.588859558105469, -8.635875701904297, 28.66448974609375, 147.00546264648438, 65.26669311523438, 120.62572479248047, 35.72694778442383, 76.32990264892578, 14.631046295166016, 140.07704162597656, 97.58931732177734, 53.41640853881836, 51.05879592895508, 22.386783599853516, 14.751712799072266, 53.704490661621094, 172.010009765625, 58.979881286621094, 13.78548812866211, 134.55413818359375, 157.73104858398438, 159.33424377441406, 5.800994873046875, -152.57958984375, 90.62230682373047, 60.493072509765625, 12.260963439941406, 13.7353515625, -11.520626068115234, 7.3021697998046875, 133.296875, 15.767341613769531, 16.36267852783203, 179.53695678710938, 57.50841522216797, 61.251216888427734, 205.50888061523438, 198.7472686767578, -64.1720199584961, 141.6753692626953, 22.61304473876953, 30.508926391601562], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000602.npy"} +{"epoch": 0.91005291005291, "step": 603, "batch_size": 64, "mean": 65.18978881835938, "std": 91.08055877685547, "min": -158.646240234375, "p10": -51.36760311126707, "median": 61.03635597229004, "p90": 171.15, "max": 302.0792541503906, "pos_frac": 0.78125, "sample": [161.50857543945312, 136.0839385986328, 112.9197998046875, -27.349159240722656, -61.13237762451172, 67.77033996582031, 58.797401428222656, 78.47750854492188, -4.797370910644531, 62.83299255371094, 173.39549255371094, 71.19309997558594, 15.778007507324219, -71.70247650146484, 22.072486877441406, 197.50555419921875, -88.19447326660156, 45.58287811279297, 17.549537658691406, 302.0792541503906, 72.63953399658203, 19.537933349609375, 163.98028564453125, 55.010040283203125, -8.564884185791016, 58.200164794921875, 145.77601623535156, -59.72222900390625, 133.22793579101562, -139.64784240722656, 6.3661956787109375, 23.122344970703125, 122.75727844238281, 111.81446838378906, -73.32268524169922, 145.07025146484375, 76.4100341796875, 32.46004867553711, -3.133939743041992, 180.96279907226562, 98.73796081542969, 138.03744506835938, 71.82673645019531, 71.6704330444336, 123.6383285522461, 163.02947998046875, 40.18116760253906, -31.873476028442383, 59.23971939086914, 14.877779006958008, 10.671646118164062, 48.65702819824219, 142.25086975097656, 167.1822509765625, 95.12679290771484, -13.789535522460938, 19.553203582763672, -158.646240234375, 172.8504638671875, 165.76451110839844, 182.77171325683594, 3.306978225708008, 285.58819580078125, -31.8221435546875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000603.npy"} +{"epoch": 0.9115646258503401, "step": 604, "batch_size": 64, "mean": 56.56141662597656, "std": 99.43761444091797, "min": -218.3047637939453, "p10": -62.77535018920897, "median": 51.58176231384277, "p90": 182.0372283935547, "max": 341.66705322265625, "pos_frac": 0.71875, "sample": [103.00277709960938, 150.82662963867188, -7.288234710693359, -79.57127380371094, 23.490276336669922, 124.94229125976562, -6.581371307373047, 9.560144424438477, 182.22850036621094, -29.61859130859375, 14.54833984375, -15.087013244628906, 2.1170101165771484, 145.60427856445312, -50.971923828125, -21.255722045898438, 159.79750061035156, 54.13970947265625, 55.49785614013672, 163.1419677734375, -147.49725341796875, -47.44110107421875, 21.164474487304688, -73.14273071289062, 79.7474136352539, 5.889375686645508, 12.846376419067383, 53.22051239013672, 65.71739196777344, -218.3047637939453, 49.94301223754883, -67.8339614868164, 59.63957977294922, -72.05990600585938, 175.48834228515625, -9.984565734863281, 67.11215209960938, -14.82049560546875, 192.10488891601562, 137.32962036132812, 92.58811950683594, 191.10110473632812, 341.66705322265625, 30.40868377685547, 155.2012939453125, 113.39974975585938, 31.56493377685547, 176.3460693359375, 203.7714385986328, -48.85980224609375, 203.63894653320312, 4.1847381591796875, 75.16950225830078, 37.972938537597656, 115.14030456542969, 63.13421630859375, 137.91827392578125, 26.099557876586914, 3.7099132537841797, 216.58853149414062, 133.56341552734375, -37.20799255371094, -76.40249633789062, 181.59092712402344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000604.npy"} +{"epoch": 0.9130763416477702, "step": 605, "batch_size": 64, "mean": 57.59455490112305, "std": 95.11749267578125, "min": -153.78756713867188, "p10": -62.85916595458984, "median": 55.01337432861328, "p90": 173.3579010009766, "max": 275.00579833984375, "pos_frac": 0.75, "sample": [82.21553039550781, 74.01849365234375, -122.55622863769531, 275.00579833984375, 5.356163024902344, 184.11029052734375, 48.66697692871094, 160.09445190429688, 111.92790985107422, -60.46766662597656, 137.04638671875, -23.802413940429688, 30.56829071044922, -15.347633361816406, 13.149951934814453, -102.93418884277344, 80.87083435058594, 145.47262573242188, 132.8148956298828, 81.7293701171875, -27.228439331054688, 0.391876220703125, 111.95757293701172, -150.3321075439453, 5.276390075683594, 106.15672302246094, 175.76991271972656, 146.72003173828125, 50.35917663574219, 45.435394287109375, 142.88766479492188, 39.924072265625, -149.79676818847656, 153.90582275390625, 0.770538330078125, 181.14846801757812, 167.72987365722656, 119.58746337890625, 33.96241760253906, 106.22332763671875, -73.11732482910156, -7.539005279541016, 145.91790771484375, 59.667572021484375, 189.81939697265625, 32.66584014892578, 180.99868774414062, 164.34237670898438, 145.35922241210938, -43.676025390625, 220.95712280273438, 62.16184997558594, 91.25949096679688, -9.544532775878906, -63.88409423828125, 10.224588394165039, 31.32890510559082, -153.78756713867188, 37.41667175292969, -44.88911819458008, 9.187189102172852, 114.91697692871094, -12.78668212890625, 100.26246643066406], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000605.npy"} +{"epoch": 0.9145880574452003, "step": 606, "batch_size": 64, "mean": 68.04817199707031, "std": 94.27259063720703, "min": -111.92444610595703, "p10": -47.70610084533691, "median": 65.4781608581543, "p90": 187.52032928466798, "max": 305.2881774902344, "pos_frac": 0.703125, "sample": [-42.645973205566406, 204.7880859375, 33.03895568847656, 216.28485107421875, -59.22632598876953, 20.70331573486328, 168.79925537109375, 32.75764465332031, -0.4159526824951172, 144.4591827392578, 177.40518188476562, -20.956405639648438, 107.4637451171875, 157.101806640625, 146.94064331054688, -111.92444610595703, 105.90299987792969, 59.30078125, -3.430513381958008, 99.52777099609375, 305.2881774902344, 31.893463134765625, 44.800106048583984, 134.30718994140625, -70.90198516845703, -48.526771545410156, 187.61087036132812, -34.50157928466797, 83.64926147460938, 143.20111083984375, 99.45672607421875, -3.6792755126953125, -103.69771575927734, 171.07582092285156, 73.01417541503906, 6.437036514282227, 61.82237243652344, -5.03178596496582, 139.41900634765625, 9.200004577636719, 187.30906677246094, 223.5885009765625, 69.13394927978516, 121.2581787109375, 14.686065673828125, 248.9403839111328, -17.305130004882812, 60.79222106933594, -71.87088775634766, -45.791202545166016, 172.5499267578125, 31.00751495361328, -102.28446197509766, 69.15591430664062, -16.352615356445312, 113.23872375488281, 70.44640350341797, -11.68404769897461, 80.06105041503906, 225.51145935058594, 107.71218872070312, 123.21976470947266, 42.489715576171875, -1.440603256225586], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000606.npy"} +{"epoch": 0.9160997732426304, "step": 607, "batch_size": 64, "mean": 61.957489013671875, "std": 93.12088775634766, "min": -155.2122802734375, "p10": -43.568932342529294, "median": 40.81106376647949, "p90": 184.9141342163086, "max": 274.8736572265625, "pos_frac": 0.734375, "sample": [6.629020690917969, 29.823486328125, -81.50525665283203, 60.077728271484375, 102.91494750976562, 26.57007598876953, 127.4000473022461, 87.5611343383789, -155.2122802734375, -40.248573303222656, -1.7119026184082031, -39.45716094970703, 128.43869018554688, 179.97291564941406, 36.052093505859375, -44.991943359375, -25.488563537597656, 7.426717758178711, 40.377723693847656, 196.87522888183594, 31.350860595703125, 199.5829315185547, 136.0479278564453, 125.19038391113281, 101.52333068847656, 35.112648010253906, -26.245277404785156, 129.04629516601562, -17.153907775878906, -17.636009216308594, 199.68719482421875, 90.42343139648438, 108.16366577148438, 113.90840911865234, -57.323028564453125, 194.77499389648438, 274.8736572265625, -7.684490203857422, 150.96104431152344, 11.654281616210938, -65.65430450439453, 12.767707824707031, 5.520242691040039, 140.5693817138672, 102.51091003417969, -19.708480834960938, -28.41434669494629, 133.86585998535156, 269.70050048828125, 163.0191650390625, 6.273693084716797, 2.773406982421875, 99.00472259521484, 187.03179931640625, 41.24440383911133, 175.9540557861328, 0.5573921203613281, 61.5498046875, 99.14128112792969, 176.86495971679688, 40.30702209472656, -126.64713287353516, -67.99303436279297, 137.27780151367188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000607.npy"} +{"epoch": 0.9176114890400605, "step": 608, "batch_size": 64, "mean": 61.9776725769043, "std": 86.64298248291016, "min": -135.2193603515625, "p10": -40.62619857788086, "median": 34.95741271972656, "p90": 178.39167327880864, "max": 293.01361083984375, "pos_frac": 0.71875, "sample": [125.31742858886719, -42.064361572265625, -0.44890594482421875, 169.2418670654297, -0.0074329376220703125, -43.040374755859375, 139.00424194335938, -1.469635009765625, 29.488544464111328, -69.57911682128906, 100.7298583984375, 83.10559844970703, 139.68934631347656, 147.9245147705078, 55.952423095703125, 105.66156005859375, 231.49452209472656, -135.2193603515625, -5.017488479614258, 13.871997833251953, 26.604354858398438, -26.80234146118164, -0.7240009307861328, 207.28646850585938, 163.03866577148438, 19.69277572631836, -4.868949890136719, 75.8309326171875, 12.481689453125, 186.75567626953125, 203.83892822265625, -47.931861877441406, 58.912017822265625, 98.93855285644531, 33.466583251953125, 86.60740661621094, 137.89346313476562, -18.685096740722656, -47.07220458984375, 8.92022705078125, -6.363624572753906, 21.47821044921875, 49.73365783691406, 24.18347930908203, 19.864639282226562, 128.2341766357422, -11.649871826171875, 167.2228546142578, 293.01361083984375, 150.0214080810547, 66.13504028320312, 29.134201049804688, 42.29883575439453, 135.50958251953125, 3.376178741455078, 138.22760009765625, -86.65940856933594, 182.31301879882812, 36.4482421875, -37.270484924316406, 16.87804412841797, 160.20941162109375, 32.98097229003906, 192.432861328125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000608.npy"} +{"epoch": 0.9191232048374905, "step": 609, "batch_size": 64, "mean": 71.04292297363281, "std": 85.47116088867188, "min": -204.66079711914062, "p10": -45.498244476318355, "median": 82.69647216796875, "p90": 174.2399871826172, "max": 308.03546142578125, "pos_frac": 0.796875, "sample": [188.8091278076172, 119.61784362792969, 126.11199188232422, 11.733467102050781, 60.457000732421875, 25.669342041015625, 163.2808837890625, 106.53558349609375, -15.899856567382812, -5.405693054199219, -52.05224609375, 100.37266540527344, -18.782821655273438, 24.53207778930664, 308.03546142578125, 152.90219116210938, 188.4905242919922, 103.30856323242188, 73.94955444335938, 197.58010864257812, -48.62183380126953, 88.12432861328125, 96.28883361816406, 88.44313049316406, -69.09286499023438, 185.26907348632812, 147.12896728515625, 86.19304656982422, -72.70205688476562, 119.69007110595703, 67.2809829711914, -3.047914505004883, 175.90914916992188, 99.15115356445312, -1.132537841796875, 111.32645416259766, 73.24751281738281, 0.009790420532226562, 157.65948486328125, 82.91133117675781, 44.022621154785156, -72.07536315917969, 50.207550048828125, 183.94625854492188, 170.34527587890625, -204.66079711914062, 18.78103256225586, 82.48161315917969, 105.9825439453125, 16.929792404174805, 38.36153030395508, 106.53134155273438, 91.9873046875, 73.83982849121094, 6.745260238647461, 10.78366470336914, 143.3123321533203, 110.50041961669922, 151.308837890625, -50.678321838378906, 148.97384643554688, 80.40447998046875, 33.64378356933594, -38.209869384765625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000609.npy"} +{"epoch": 0.9206349206349206, "step": 610, "batch_size": 64, "mean": 67.1641616821289, "std": 97.79708099365234, "min": -157.6158447265625, "p10": -51.21981811523437, "median": 51.80974578857422, "p90": 205.96836547851564, "max": 298.1676330566406, "pos_frac": 0.734375, "sample": [53.42212677001953, 240.8368682861328, 192.47802734375, 141.22190856933594, 56.168617248535156, 162.46218872070312, 29.317672729492188, 7.888948440551758, -104.39036560058594, 18.198440551757812, 48.80718231201172, -89.8851089477539, 74.33634948730469, 45.36933898925781, -12.624465942382812, 59.81640625, 175.1226348876953, -32.40092468261719, -83.25747680664062, -20.18732452392578, 44.61638641357422, -64.82698059082031, 15.220558166503906, 105.54905700683594, -46.02354431152344, -53.44679260253906, 8.496414184570312, 184.30653381347656, 77.50725555419922, 210.656982421875, 50.197364807128906, 298.1676330566406, 200.99197387695312, 180.25399780273438, 5.2891998291015625, 148.73068237304688, 173.7307891845703, -0.19928932189941406, 147.30307006835938, 17.493988037109375, 19.09759521484375, 121.90118408203125, 63.99054718017578, -157.6158447265625, 208.10110473632812, -1.7952003479003906, 13.438209533691406, -20.313953399658203, 172.4797821044922, 211.1900634765625, 75.34556579589844, 72.42943572998047, 42.23301696777344, -5.070695877075195, -1.460092544555664, -17.430809020996094, -79.20271301269531, 135.04739379882812, 221.3730010986328, 97.026611328125, 107.87214660644531, 14.014816284179688, 229.12289428710938, 110.01609802246094], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000610.npy"} +{"epoch": 0.9221466364323507, "step": 611, "batch_size": 64, "mean": 51.49308776855469, "std": 78.34378814697266, "min": -150.2391357421875, "p10": -53.00970001220703, "median": 53.79818344116211, "p90": 158.9636245727539, "max": 226.40133666992188, "pos_frac": 0.734375, "sample": [95.824462890625, 86.0633773803711, 33.245330810546875, 69.65817260742188, 145.42843627929688, -3.0576248168945312, -1.498992919921875, 50.46380615234375, -6.692935943603516, 66.58406066894531, -4.102008819580078, 146.78347778320312, 69.33746337890625, 106.14065551757812, -4.595062255859375, 2.8097305297851562, -76.69403076171875, 168.3637237548828, -55.76375961303711, 226.40133666992188, 124.783447265625, 96.16971588134766, 97.35319519042969, -66.00738525390625, -46.583560943603516, -5.732002258300781, 157.10816955566406, 63.281455993652344, 72.27654266357422, 169.0489501953125, 1.1284103393554688, -66.40225982666016, 22.021392822265625, 187.0482177734375, -24.62872314453125, 12.94891357421875, -150.2391357421875, 180.7404327392578, 57.13256072998047, 46.0667724609375, 118.71647644042969, 78.049072265625, -119.75261688232422, 65.36627197265625, 32.577720642089844, 42.939613342285156, 66.52951049804688, 40.221221923828125, 115.89620971679688, 129.18704223632812, 80.63713073730469, 159.75881958007812, 14.786481857299805, 59.937217712402344, 6.97564697265625, 37.99070739746094, 176.4087371826172, -76.3936538696289, 147.12530517578125, 34.192604064941406, -29.30072593688965, 6.013092041015625, -5.251575469970703, 70.73257446289062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000611.npy"} +{"epoch": 0.9236583522297808, "step": 612, "batch_size": 64, "mean": 74.64623260498047, "std": 92.07027435302734, "min": -203.64393615722656, "p10": -22.72258510589599, "median": 67.61286163330078, "p90": 198.75167236328127, "max": 254.5653076171875, "pos_frac": 0.78125, "sample": [-2.8474273681640625, -37.655670166015625, 118.90493774414062, 17.97180938720703, -14.675674438476562, 6.851982116699219, 155.99681091308594, 131.138916015625, -9.0694580078125, 29.42926788330078, 127.25519561767578, 76.53950500488281, 62.866127014160156, 76.11155700683594, 92.3574447631836, 50.42127990722656, 47.16514587402344, 2.6650619506835938, 67.4239501953125, 127.41968536376953, 145.51998901367188, -62.68981170654297, 141.76519775390625, 32.59385681152344, 67.80177307128906, 31.55953598022461, 227.7115020751953, -24.854236602783203, -29.259639739990234, 19.79613494873047, 63.011634826660156, 185.52247619628906, 3.030231475830078, -3.462564468383789, -16.62061309814453, 194.21893310546875, 44.89441680908203, 140.56793212890625, 254.5653076171875, -134.98207092285156, 225.5837860107422, 55.93478012084961, 169.7606658935547, -74.22508239746094, 232.04193115234375, 131.57984924316406, 117.27789306640625, -17.74873161315918, 166.44520568847656, 223.8772430419922, 57.41260528564453, -5.123039245605469, 252.91232299804688, 84.64649963378906, 40.285919189453125, 200.69427490234375, 102.6352310180664, 55.967552185058594, 87.13104248046875, -203.64393615722656, 76.9029769897461, 112.2383804321289, 127.49854278564453, 150.31224060058594], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000612.npy"} +{"epoch": 0.9251700680272109, "step": 613, "batch_size": 64, "mean": 71.52304077148438, "std": 90.58146667480469, "min": -191.77133178710938, "p10": -27.762617301940907, "median": 63.56983184814453, "p90": 186.7332992553711, "max": 228.74887084960938, "pos_frac": 0.765625, "sample": [-11.744316101074219, 51.183685302734375, -10.763565063476562, 46.63615417480469, 117.45183563232422, 137.05282592773438, 129.55911254882812, 77.56257629394531, -51.769065856933594, -4.275331497192383, 59.84081268310547, 61.3325080871582, -152.47393798828125, 125.78216552734375, 139.33645629882812, 66.47029113769531, -15.303903579711914, 18.637113571166992, 228.74887084960938, 129.21725463867188, 7.8572540283203125, -35.06843566894531, -191.77133178710938, 14.343095779418945, 172.88577270507812, 80.90277099609375, 141.3593292236328, 32.63984680175781, 18.582618713378906, 28.342514038085938, 227.78158569335938, 56.55531692504883, 102.04718017578125, -3.443492889404297, -6.825736999511719, 61.15968704223633, -59.174278259277344, 123.03251647949219, 101.8191909790039, 212.10137939453125, 166.28115844726562, 186.81324768066406, 63.036277770996094, 157.4810791015625, 212.4331817626953, 17.004608154296875, 224.89950561523438, 5.679143905639648, -4.6502838134765625, 179.87710571289062, -13.238998413085938, -33.10206604003906, 148.33058166503906, 225.9139862060547, 77.01225280761719, 115.36846923828125, 16.436466217041016, 186.5467529296875, 107.08279418945312, 183.34609985351562, 39.186058044433594, 82.65325927734375, 64.10338592529297, -58.62744140625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000613.npy"} +{"epoch": 0.926681783824641, "step": 614, "batch_size": 64, "mean": 63.72178649902344, "std": 84.00623321533203, "min": -153.648193359375, "p10": -37.404155731201165, "median": 71.69585418701172, "p90": 157.29050750732424, "max": 293.789306640625, "pos_frac": 0.78125, "sample": [153.62855529785156, 116.08448028564453, 30.17337417602539, 125.38065338134766, 76.63495635986328, 126.55571746826172, 14.656444549560547, 0.33228302001953125, 74.87699890136719, 58.66713333129883, 164.9708251953125, 104.61612701416016, 168.0921173095703, 155.82237243652344, 127.69058227539062, 128.9432830810547, 109.10612487792969, 84.17469024658203, 121.5287094116211, 121.40834045410156, -90.57599639892578, 4.6238250732421875, -26.57128143310547, -153.648193359375, 293.789306640625, -16.65552520751953, -20.182592391967773, -19.967041015625, 144.558349609375, -40.57438659667969, -54.797508239746094, 12.058818817138672, 3.395336151123047, 154.98590087890625, 39.68392562866211, 27.567293167114258, 128.28675842285156, 119.738037109375, -143.56805419921875, 121.70348358154297, -16.06549835205078, 170.87881469726562, 120.88690948486328, 125.30388641357422, 83.57831573486328, 115.44326782226562, 27.25548553466797, 59.243377685546875, 123.54324340820312, 33.58949279785156, 31.178192138671875, 52.782928466796875, -56.39067077636719, -24.363937377929688, 13.28372573852539, 177.215087890625, 86.90638732910156, -30.00695037841797, 157.91970825195312, 40.326019287109375, 68.51470947265625, 54.55156326293945, -58.75917053222656, 174.18539428710938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000614.npy"} +{"epoch": 0.9281934996220711, "step": 615, "batch_size": 64, "mean": 71.7379150390625, "std": 107.89363098144531, "min": -207.72262573242188, "p10": -37.560049438476554, "median": 55.259403228759766, "p90": 206.70268554687505, "max": 301.400390625, "pos_frac": 0.78125, "sample": [66.66881561279297, 98.85844421386719, 163.8079376220703, 53.921722412109375, 68.00201416015625, 166.28634643554688, 90.58475494384766, -153.9378204345703, 179.18141174316406, 55.51110076904297, -83.2730941772461, 75.43628692626953, -106.60049438476562, 133.49171447753906, 61.19844055175781, -86.51638793945312, 115.7644271850586, 226.4576416015625, 131.44906616210938, 2.3380279541015625, 172.8935546875, -28.639183044433594, 216.37521362304688, -5.054206848144531, 152.20025634765625, 44.603607177734375, -41.383277893066406, 54.99568176269531, 18.774261474609375, 195.61740112304688, 174.8375701904297, 55.00770568847656, -7.776390075683594, 28.272663116455078, 27.323707580566406, 178.003173828125, 232.86941528320312, -26.284454345703125, 12.370651245117188, 177.98818969726562, 211.45352172851562, 219.11984252929688, 173.9212188720703, 15.388961791992188, 145.64027404785156, 17.024280548095703, 37.11945343017578, -26.9130859375, 53.56425476074219, 192.89837646484375, -25.70452880859375, 293.50579833984375, 4.4918975830078125, 84.15794372558594, -16.240890502929688, 301.400390625, 49.74629211425781, 108.9339599609375, 181.26995849609375, 11.410308837890625, 28.477699279785156, 26.77093505859375, -180.11349487304688, -207.72262573242188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000615.npy"} +{"epoch": 0.9297052154195011, "step": 616, "batch_size": 64, "mean": 56.88996124267578, "std": 88.16746520996094, "min": -141.19644165039062, "p10": -29.232291603088377, "median": 50.211734771728516, "p90": 187.4200164794922, "max": 238.60488891601562, "pos_frac": 0.71875, "sample": [206.56451416015625, 16.589385986328125, 5.39251708984375, -10.39630126953125, 160.7779083251953, -8.831037521362305, 238.60488891601562, 100.92646789550781, 3.3623390197753906, 79.69857025146484, 54.36219024658203, 8.385276794433594, 63.31316375732422, -141.19644165039062, 22.86440658569336, -60.83757019042969, 53.837799072265625, -30.386783599853516, -9.383621215820312, 210.96194458007812, 53.790000915527344, 188.61773681640625, -15.751787185668945, -20.67247200012207, 190.32598876953125, -2.669252395629883, -12.794126510620117, 1.2699050903320312, -26.538476943969727, 177.78529357910156, 137.16754150390625, 11.989837646484375, 79.7332763671875, 153.1219024658203, 224.65235900878906, 129.53334045410156, -16.613033294677734, 76.99729919433594, 3.92279052734375, 168.48973083496094, 154.56735229492188, 75.8349609375, 29.095678329467773, 77.10926818847656, 147.63345336914062, 189.87734985351562, -39.008872985839844, 13.924198150634766, -139.2957763671875, 12.837226867675781, -14.94705581665039, -84.82913208007812, 62.70380401611328, 46.63346862792969, 32.96131134033203, 184.62533569335938, 59.03278350830078, 1.6111183166503906, 99.07733154296875, -19.149658203125, 157.8360595703125, 122.5478286743164, 57.30517578125, -53.993080139160156], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000616.npy"} +{"epoch": 0.9312169312169312, "step": 617, "batch_size": 64, "mean": 54.271026611328125, "std": 87.56635284423828, "min": -147.90130615234375, "p10": -39.506790924072256, "median": 43.76641082763672, "p90": 176.21254272460942, "max": 296.7300109863281, "pos_frac": 0.765625, "sample": [38.40532684326172, 21.87588119506836, -12.022476196289062, 52.912818908691406, 212.96302795410156, 103.66401672363281, 180.53628540039062, 160.24705505371094, 14.577342987060547, -71.36833953857422, 46.81745910644531, 32.055381774902344, -19.917434692382812, 9.984014511108398, 3.568462371826172, 142.6305694580078, -27.387718200683594, 182.08450317382812, 24.933135986328125, 8.490814208984375, 296.7300109863281, -10.406864166259766, 4.527645111083984, 163.14932250976562, 81.70729064941406, -1.2775077819824219, -1.6922035217285156, 106.53663635253906, 50.69029235839844, 31.225276947021484, 52.816097259521484, 7.693805694580078, 39.06913757324219, 180.88418579101562, 98.11610412597656, 216.7237548828125, 47.889808654785156, -96.57611846923828, -59.47447967529297, 144.0258026123047, 145.27786254882812, 41.20137023925781, -43.58112335205078, -3.275165557861328, 186.84475708007812, 161.5801544189453, -127.95690155029297, -147.90130615234375, -127.15823364257812, 44.98088073730469, 85.53860473632812, 122.0731201171875, 72.76799011230469, 11.713659286499023, 166.12380981445312, 95.31666564941406, 39.839996337890625, 11.565223693847656, 71.65166473388672, 42.55194091796875, 45.237953186035156, 60.998756408691406, 90.54598999023438, -30.000015258789062], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000617.npy"} +{"epoch": 0.9327286470143613, "step": 618, "batch_size": 64, "mean": 63.29845428466797, "std": 88.1844482421875, "min": -99.32154846191406, "p10": -33.25025787353514, "median": 44.719993591308594, "p90": 190.05862731933595, "max": 306.3784484863281, "pos_frac": 0.8125, "sample": [246.5646514892578, 183.12908935546875, 30.776020050048828, 139.80831909179688, -2.7494125366210938, -1.7411365509033203, -44.9556770324707, 12.892967224121094, 232.2044677734375, 0.681060791015625, 7.2724151611328125, 231.77764892578125, 151.7239532470703, 51.91160583496094, 187.18511962890625, 6.4297027587890625, 40.89354705810547, 2.6774215698242188, 306.3784484863281, 104.97698974609375, 49.35413360595703, 232.9175567626953, 3.4509449005126953, 42.872802734375, 9.151283264160156, 191.383544921875, 64.75090026855469, 59.54875946044922, 98.34395599365234, 62.798484802246094, 20.985702514648438, 26.07769012451172, 191.29013061523438, 7.620304107666016, 55.27439880371094, -16.237884521484375, 67.07113647460938, -60.272789001464844, 119.13375854492188, 43.84235382080078, -85.06597900390625, 0.09801864624023438, 0.4053001403808594, -91.67333984375, 99.30915069580078, -40.54127502441406, 29.789907455444336, -99.32154846191406, 112.45586395263672, 175.20852661132812, 62.255043029785156, 120.14013671875, 12.19256591796875, 2.808624267578125, 58.16705322265625, 44.53358459472656, -12.437301635742188, 90.34899139404297, 118.3056640625, 162.66549682617188, -12.004959106445312, 148.05322265625, -46.6925048828125, 44.906402587890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000618.npy"} +{"epoch": 0.9342403628117913, "step": 619, "batch_size": 64, "mean": 65.36746215820312, "std": 90.3155746459961, "min": -203.3489990234375, "p10": -31.935312461853027, "median": 62.24262237548828, "p90": 190.5901794433594, "max": 251.94384765625, "pos_frac": 0.765625, "sample": [102.29620361328125, 7.5632171630859375, 3.6866512298583984, 19.510467529296875, 176.91659545898438, 193.03944396972656, 197.675048828125, -49.45728302001953, -116.2034912109375, 242.94004821777344, 175.22366333007812, 68.36412048339844, 126.59733581542969, 7.154485702514648, 85.02655029296875, -10.554443359375, 77.75780487060547, 91.44287109375, -3.999551773071289, 0.148193359375, -86.55640411376953, 227.69464111328125, 10.591278076171875, -44.109344482421875, -29.809412002563477, 140.99008178710938, 130.18154907226562, 128.0567169189453, 6.000417709350586, -25.637908935546875, 12.159080505371094, -203.3489990234375, -32.846412658691406, 166.47879028320312, 133.213623046875, 128.68948364257812, 19.358638763427734, 184.87522888183594, 203.04852294921875, -57.54795837402344, 99.12161254882812, 195.34133911132812, 67.57145690917969, -1.298238754272461, 146.4854278564453, 112.18701171875, 103.11814880371094, 128.45501708984375, 124.88877868652344, 39.7272834777832, 30.16710662841797, 87.62362670898438, 54.99988555908203, 36.18540954589844, 251.94384765625, 17.682777404785156, 56.913787841796875, 90.16936492919922, -7.889837265014648, 41.05768585205078, -7.669342041015625, 85.9955062866211, 26.052169799804688, -1.9218711853027344], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000619.npy"} +{"epoch": 0.9357520786092215, "step": 620, "batch_size": 64, "mean": 53.78406524658203, "std": 87.40689086914062, "min": -111.04483032226562, "p10": -45.171803283691396, "median": 39.419708251953125, "p90": 174.12273559570312, "max": 236.5060272216797, "pos_frac": 0.703125, "sample": [29.81494903564453, -111.04483032226562, -22.830886840820312, 150.5875244140625, -100.28356170654297, 1.619659423828125, 54.88557434082031, 186.97984313964844, 2.1759872436523438, 82.3257064819336, 158.36936950683594, 141.3672637939453, 92.40066528320312, 89.69912719726562, -2.7712173461914062, 214.0986328125, 100.60443115234375, 51.65185546875, -37.03822326660156, 2.8302459716796875, -90.16342163085938, 25.732891082763672, -73.622314453125, 225.16848754882812, -48.657623291015625, 153.7033233642578, -8.425804138183594, -18.5584716796875, 196.52279663085938, -23.10192108154297, 151.90924072265625, 173.65481567382812, -24.456165313720703, -16.699918746948242, -25.324337005615234, 25.326904296875, 8.59726333618164, 39.51243591308594, 160.68760681152344, 3.4616928100585938, 126.47431182861328, 39.32698059082031, 86.31774139404297, 56.63380432128906, 47.545536041259766, -77.0262451171875, 236.5060272216797, 194.8607177734375, -28.152799606323242, 119.25995635986328, 1.8070735931396484, 174.32327270507812, -29.332733154296875, -1.9024181365966797, -88.949462890625, 22.6877498626709, 142.91091918945312, 31.613815307617188, 62.923343658447266, 35.86505126953125, 118.77590942382812, 92.8977279663086, 103.2591323852539, 52.845298767089844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000620.npy"} +{"epoch": 0.9372637944066515, "step": 621, "batch_size": 64, "mean": 58.7945556640625, "std": 94.47795867919922, "min": -145.63436889648438, "p10": -53.99521255493163, "median": 58.36963081359863, "p90": 176.43409423828126, "max": 341.402587890625, "pos_frac": 0.71875, "sample": [-2.2429275512695312, 23.981903076171875, 24.30413055419922, -29.939952850341797, -56.4207763671875, -145.63436889648438, 67.72438049316406, 103.17985534667969, -48.33556365966797, 17.11252784729004, 77.66058349609375, 111.25048828125, 169.0834503173828, -2.1524829864501953, 177.88819885253906, 47.93778991699219, 54.20996856689453, 110.90774536132812, 69.6920166015625, 165.87982177734375, 80.58305358886719, 50.910980224609375, 225.91917419433594, -127.14388275146484, 205.59747314453125, 137.87725830078125, 75.60479736328125, -138.98849487304688, 130.03839111328125, -58.15324783325195, 255.41799926757812, 81.73963165283203, 97.18685913085938, 179.137451171875, 152.71734619140625, -5.6618804931640625, 62.529293060302734, 10.273080825805664, 75.49563598632812, -28.66058349609375, -60.24717712402344, 21.646772384643555, 181.5521697998047, 63.715972900390625, 26.372732162475586, -9.882587432861328, 32.57512664794922, -6.8667755126953125, -6.5130462646484375, 27.764873504638672, 4.479337692260742, 122.28551483154297, 77.89097595214844, 22.027124404907227, 114.56045532226562, -10.059818267822266, -17.733360290527344, 341.402587890625, -126.4903793334961, 89.31396484375, 121.35238647460938, 25.157913208007812, 173.0411834716797, 156.9986572265625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000621.npy"} +{"epoch": 0.9387755102040817, "step": 622, "batch_size": 64, "mean": 60.921173095703125, "std": 86.27738189697266, "min": -117.19181823730469, "p10": -42.21318359374999, "median": 44.36030578613281, "p90": 178.30812988281252, "max": 229.09872436523438, "pos_frac": 0.765625, "sample": [136.98623657226562, 28.081600189208984, 8.062217712402344, -117.19181823730469, 19.06316375732422, 43.01349639892578, -22.518280029296875, 45.707115173339844, -61.32847595214844, -4.1459808349609375, 214.24533081054688, 101.8748779296875, -0.3163776397705078, -46.08768081665039, 169.51995849609375, 64.0948715209961, 162.91285705566406, 149.8607635498047, 108.12290954589844, 176.14126586914062, 131.82846069335938, 161.93601989746094, -9.184545516967773, -13.349699020385742, 229.09872436523438, 54.78882598876953, 52.95829772949219, 123.17046356201172, 2.312976837158203, 82.15837097167969, 179.23678588867188, -104.42727661132812, 56.888343811035156, 18.407756805419922, 5.662727355957031, 2.663644790649414, 180.35653686523438, 120.2143783569336, 95.212890625, 15.647743225097656, 157.08309936523438, 32.96070098876953, 152.2630157470703, -34.709716796875, 100.32366943359375, 147.89060974121094, 210.98419189453125, -87.48302459716797, 5.671939849853516, 16.24395751953125, 179.249755859375, 23.582618713378906, 0.5007400512695312, -45.428955078125, -4.72691535949707, -32.84577941894531, 208.636962890625, 33.221107482910156, -72.69268798828125, 14.688316345214844, 96.57960510253906, 10.292570114135742, 170.49624633789062, 54.493927001953125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000622.npy"} +{"epoch": 0.9402872260015117, "step": 623, "batch_size": 64, "mean": 64.34942626953125, "std": 90.96340942382812, "min": -150.51190185546875, "p10": -34.17392578125, "median": 70.79263687133789, "p90": 174.69265441894532, "max": 297.4390869140625, "pos_frac": 0.734375, "sample": [142.97869873046875, 38.511863708496094, -20.415210723876953, -118.57589721679688, 70.1060791015625, 221.491455078125, 113.46411895751953, 141.998291015625, 145.68270874023438, 78.61327362060547, -81.44750213623047, 54.45281219482422, 193.407958984375, 75.90750885009766, -34.68278503417969, 225.48104858398438, -28.085651397705078, 141.37371826171875, 71.47919464111328, 83.2125473022461, 43.331268310546875, 25.684526443481445, 155.15744018554688, -13.862052917480469, -21.084434509277344, 104.46554565429688, 131.6743927001953, 176.82635498046875, -150.51190185546875, 23.03955078125, 112.40341186523438, 112.65390014648438, 79.04324340820312, 155.48324584960938, -30.79754638671875, -99.34728240966797, 158.47750854492188, -9.029052734375, 137.37765502929688, 169.71401977539062, 196.95950317382812, 194.30062866210938, 73.27256774902344, 6.087835311889648, -23.41326904296875, -11.224760055541992, -51.44422149658203, 30.50684928894043, 10.091625213623047, 129.05499267578125, 111.8673095703125, 297.4390869140625, 88.31819152832031, 107.28495788574219, 5.65948486328125, 23.54035186767578, -32.98658752441406, 5.8057098388671875, 68.1513671875, 3.788602828979492, 139.2405548095703, -4.883491516113281, 48.495025634765625, -73.20291900634766], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000623.npy"} +{"epoch": 0.9417989417989417, "step": 624, "batch_size": 64, "mean": 67.76050567626953, "std": 96.67943572998047, "min": -174.25546264648438, "p10": -30.416848754882807, "median": 36.63667678833008, "p90": 189.26238403320315, "max": 272.9964904785156, "pos_frac": 0.71875, "sample": [-64.07504272460938, -22.294601440429688, 159.73092651367188, 108.10215759277344, 185.07528686523438, 170.57518005371094, -4.592002868652344, 26.512863159179688, -24.053680419921875, -33.1439208984375, 71.75997161865234, 33.75456237792969, 89.96713256835938, 106.96379852294922, 158.5593719482422, 122.2969970703125, 35.86626434326172, 182.37158203125, 224.8751220703125, 19.165077209472656, -13.332965850830078, -58.37297439575195, -19.26201057434082, 185.04034423828125, 7.878818511962891, 133.9991912841797, 29.499900817871094, -23.67809295654297, 28.90472412109375, 37.40708923339844, 254.78872680664062, 200.27279663085938, 105.47634887695312, 272.9964904785156, 16.321430206298828, -46.65579605102539, 191.05685424804688, 155.4578857421875, 259.70172119140625, 133.76162719726562, 70.37560272216797, 162.56982421875, 94.85779571533203, 33.170501708984375, -50.94013977050781, -7.8887176513671875, 226.40928649902344, -1.8018722534179688, -16.33226203918457, 145.60406494140625, 99.06379699707031, 3.5927906036376953, 3.4374313354492188, 10.048818588256836, -174.25546264648438, 110.40833282470703, 25.344345092773438, -21.12419891357422, 162.99343872070312, -16.947460174560547, -114.38099670410156, 0.15044784545898438, 47.03954315185547, 146.59817504882812], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000624.npy"} +{"epoch": 0.9433106575963719, "step": 625, "batch_size": 64, "mean": 51.40007781982422, "std": 97.94137573242188, "min": -158.6927947998047, "p10": -57.895315551757804, "median": 35.48957824707031, "p90": 204.68834686279297, "max": 276.0272216796875, "pos_frac": 0.6875, "sample": [50.22395324707031, 119.5161361694336, 55.71623229980469, 14.298126220703125, -1.323648452758789, 118.180908203125, 69.87899780273438, 72.21688079833984, 6.407842636108398, 258.7120666503906, 91.37420654296875, -49.816097259521484, 168.46640014648438, -13.042713165283203, 236.92022705078125, 36.46376037597656, 224.45643615722656, 34.51539611816406, -61.35783767700195, -15.461250305175781, 103.03507995605469, 144.5450439453125, 21.45409393310547, -89.38818359375, -8.148788452148438, 48.026123046875, 29.839157104492188, 59.163597106933594, 20.786701202392578, 32.416534423828125, -2.957263946533203, 204.0458221435547, 257.04095458984375, -16.71881103515625, 121.70025634765625, -5.015342712402344, -6.42735481262207, 276.0272216796875, -3.1824569702148438, 15.821548461914062, 103.22528076171875, 155.29058837890625, 208.0706787109375, 99.6153335571289, 60.061683654785156, -23.619308471679688, -155.27981567382812, -96.17205810546875, -110.2799072265625, 119.53532409667969, 17.944320678710938, -116.68826293945312, -158.6927947998047, 204.96371459960938, 109.573486328125, 1.6284523010253906, 127.75161743164062, 21.953689575195312, 63.16913604736328, -38.319725036621094, 46.632598876953125, 42.063350677490234, 10.693525314331055, -21.925621032714844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000625.npy"} +{"epoch": 0.9448223733938019, "step": 626, "batch_size": 64, "mean": 70.99238586425781, "std": 107.41842651367188, "min": -119.14131927490234, "p10": -57.644606018066405, "median": 67.87577819824219, "p90": 191.0095443725586, "max": 387.7861022949219, "pos_frac": 0.765625, "sample": [183.13473510742188, 26.094131469726562, 166.83074951171875, -48.954864501953125, 341.67535400390625, 181.5498504638672, 193.75262451171875, -36.044090270996094, 88.70645904541016, 179.45706176757812, -49.50135803222656, 19.561302185058594, 66.38326263427734, 3.3655128479003906, -57.279502868652344, 174.16236877441406, 115.76688385009766, -93.15644836425781, 228.02780151367188, 30.718286514282227, -119.14131927490234, 17.262664794921875, 82.01268768310547, 173.25425720214844, 14.411582946777344, 12.99473762512207, 109.16297149658203, 89.33816528320312, -45.49879455566406, 387.7861022949219, 69.36829376220703, -43.539154052734375, 205.77420043945312, 151.33250427246094, 52.72727966308594, -110.01126098632812, -4.575531005859375, 91.67431640625, 0.06755256652832031, 104.94953155517578, 19.88684844970703, 34.19572448730469, 191.2757568359375, 31.03213119506836, -46.027069091796875, 9.82042121887207, 61.14268493652344, 168.4134063720703, 74.59512329101562, 144.96922302246094, 143.23883056640625, 17.880840301513672, -110.68415832519531, 139.1746826171875, -98.66941833496094, 118.11529541015625, 25.668743133544922, 190.3883819580078, 152.76576232910156, 110.18275451660156, 238.20399475097656, -63.65568542480469, 95.79828643798828, -57.80107879638672], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000626.npy"} +{"epoch": 0.9463340891912321, "step": 627, "batch_size": 64, "mean": 75.57084655761719, "std": 95.22844696044922, "min": -170.98678588867188, "p10": -14.593892288208004, "median": 78.9903564453125, "p90": 195.2136184692383, "max": 266.67938232421875, "pos_frac": 0.78125, "sample": [78.76823425292969, 10.564861297607422, 79.21247863769531, 141.47393798828125, 89.93157958984375, 100.8060302734375, 161.1002197265625, 248.16615295410156, 260.14617919921875, 101.55471801757812, -5.087554931640625, 204.64898681640625, 181.64764404296875, 139.89207458496094, 40.905975341796875, 54.7452392578125, 2.7523193359375, 33.53636932373047, 204.02410888671875, 97.53166198730469, 154.5493621826172, 116.74028778076172, 36.521888732910156, 23.64666748046875, 15.608688354492188, -99.83224487304688, 188.20233154296875, -53.68302917480469, 140.70753479003906, -16.31650161743164, 5.218767166137695, 192.49034118652344, 147.63491821289062, -6.166419982910156, 82.65078735351562, -5.5836181640625, -10.574470520019531, 88.52220153808594, -50.54957580566406, 200.58558654785156, 266.67938232421875, 68.65699005126953, -105.15878295898438, -7.826927185058594, 28.13690948486328, -5.0438995361328125, -0.74871826171875, 122.27059173583984, 42.396881103515625, 192.22962951660156, 67.41885375976562, -170.98678588867188, 19.50826644897461, 98.03175354003906, 181.93548583984375, 110.51864624023438, 15.297996520996094, -164.51071166992188, 69.85600280761719, 56.32929229736328, 110.7720718383789, 156.3573455810547, 111.33802032470703, 196.3807373046875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000627.npy"} +{"epoch": 0.9478458049886621, "step": 628, "batch_size": 64, "mean": 74.21304321289062, "std": 105.95182800292969, "min": -242.4909210205078, "p10": -71.9027145385742, "median": 77.42618560791016, "p90": 192.0174591064453, "max": 261.89013671875, "pos_frac": 0.796875, "sample": [199.8806915283203, 80.94271850585938, 78.107666015625, 117.37151336669922, -30.48967742919922, -129.83392333984375, 191.8170166015625, 13.9703369140625, 159.77285766601562, 137.14892578125, 202.0025634765625, 222.44525146484375, 108.69548034667969, 41.49673080444336, 36.694801330566406, 123.25550079345703, -242.4909210205078, -154.2095489501953, 189.8396453857422, 63.7066764831543, 187.01821899414062, 71.99476623535156, 25.123781204223633, -82.40023803710938, 172.5125274658203, 151.01141357421875, 59.329833984375, 105.76251220703125, 70.27693176269531, 184.10296630859375, 162.2257537841797, 205.04220581054688, 31.704864501953125, 192.10336303710938, 18.15401840209961, 223.33987426757812, -21.539199829101562, 4.760993957519531, 170.74533081054688, -93.19224548339844, 118.96482849121094, 100.7330093383789, 48.79054260253906, 148.8935089111328, 70.00267791748047, 71.70271301269531, 170.67347717285156, 73.1317138671875, 159.31130981445312, 174.86831665039062, 10.823354721069336, -51.14176940917969, 11.983497619628906, -176.68128967285156, 76.74470520019531, 261.89013671875, 9.588836669921875, 158.11557006835938, -26.291793823242188, 79.29547119140625, -33.472991943359375, 127.6091079711914, -3.3020668029785156, -80.80026245117188], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000628.npy"} +{"epoch": 0.9493575207860923, "step": 629, "batch_size": 64, "mean": 58.17967224121094, "std": 81.78675842285156, "min": -117.2402572631836, "p10": -23.047154235839844, "median": 41.93867492675781, "p90": 182.86548004150396, "max": 236.61314392089844, "pos_frac": 0.765625, "sample": [-40.65093231201172, 83.95706939697266, -117.2402572631836, 85.8772201538086, 80.30030822753906, 44.572845458984375, 3.7358551025390625, 70.24337768554688, -95.391845703125, 50.29689025878906, -1.385986328125, 30.024757385253906, 9.48747444152832, 199.18788146972656, 6.388849258422852, -36.3677864074707, 8.468412399291992, 0.94219970703125, 6.928619384765625, 67.52243041992188, 19.829620361328125, -5.700370788574219, -6.037714004516602, 54.89936447143555, -39.32221603393555, 42.434669494628906, 236.61314392089844, 171.5662841796875, -1.832723617553711, 171.33621215820312, 133.7413330078125, -22.555564880371094, 79.10945129394531, 80.57801055908203, 4.275775909423828, 109.11062622070312, 111.23014831542969, 21.15032958984375, 5.693561553955078, -1.2575931549072266, 2.627899169921875, 52.7051887512207, 219.0819091796875, 2.1336936950683594, -13.826438903808594, 5.705230712890625, 41.44268035888672, 130.41444396972656, 117.36461639404297, 148.81166076660156, -7.7722625732421875, 52.758914947509766, 216.83245849609375, 18.749345779418945, 121.69467163085938, 232.00437927246094, -23.257835388183594, 224.42987060546875, 162.4751739501953, 187.70799255371094, 32.96142578125, 148.68214416503906, -36.14418029785156, 64.15616607666016], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000629.npy"} +{"epoch": 0.9508692365835223, "step": 630, "batch_size": 64, "mean": 71.28953552246094, "std": 92.35899353027344, "min": -129.77093505859375, "p10": -41.01967391967772, "median": 59.210222244262695, "p90": 193.06827239990238, "max": 296.11810302734375, "pos_frac": 0.75, "sample": [-70.36285400390625, 129.6300048828125, -3.6572837829589844, 12.038642883300781, 147.46224975585938, 199.61915588378906, 119.29813385009766, -1.0554389953613281, 227.63919067382812, 155.954833984375, -2.5254440307617188, 151.9229736328125, -13.274711608886719, 175.42092895507812, 15.859489440917969, 140.07675170898438, -84.19232940673828, 60.436912536621094, 143.44241333007812, -127.6051025390625, 39.2332763671875, -4.413719177246094, 64.36263275146484, 174.90859985351562, 210.50634765625, 26.99718475341797, -46.30583953857422, 57.9835319519043, -129.77093505859375, 127.27709197998047, -0.8428421020507812, 46.58366394042969, 4.667140960693359, 220.78431701660156, 128.56991577148438, 35.403228759765625, 196.84010314941406, 24.72100830078125, 51.11749267578125, 108.07035064697266, 296.11810302734375, 34.781593322753906, 171.34335327148438, -72.37503051757812, 184.267333984375, 119.95536041259766, 106.90505981445312, 53.74139404296875, 88.64518737792969, -46.85279846191406, 54.19440460205078, -28.685287475585938, -16.495098114013672, 204.02740478515625, 135.40695190429688, 4.092390060424805, 82.1166000366211, 12.08359146118164, 160.16629028320312, 172.4522705078125, -19.94647216796875, 74.66018676757812, 70.77325439453125, 8.332775115966797], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000630.npy"} +{"epoch": 0.9523809523809523, "step": 631, "batch_size": 64, "mean": 83.69660949707031, "std": 105.84396362304688, "min": -146.87594604492188, "p10": -31.01373443603515, "median": 67.0564079284668, "p90": 209.27559051513674, "max": 327.7633056640625, "pos_frac": 0.71875, "sample": [165.47018432617188, 66.17300415039062, -14.201019287109375, 200.80859375, 123.02606201171875, 176.97015380859375, 190.19345092773438, 140.062744140625, 23.77480697631836, -14.138900756835938, 37.635711669921875, -23.269824981689453, 123.48452758789062, -10.011215209960938, -2.499797821044922, 45.974952697753906, -27.25196075439453, 33.21213150024414, 67.93981170654297, 256.0794982910156, 260.341552734375, -51.62799072265625, 203.50204467773438, 207.08506774902344, 158.57168579101562, 71.01988220214844, 20.822906494140625, 265.1206359863281, -12.978483200073242, 112.53072357177734, 38.5970573425293, 36.17604064941406, -130.68638610839844, 97.4559326171875, 85.76579284667969, 258.46484375, 171.10951232910156, 3.8387451171875, 327.7633056640625, 183.7769317626953, 53.59778594970703, -63.125579833984375, -89.13182067871094, 135.9285888671875, -17.358612060546875, -146.87594604492188, -4.331441879272461, 23.92142677307129, -58.02686309814453, 151.52691650390625, -32.62592315673828, 132.02865600585938, -10.0689697265625, 201.17840576171875, -12.582042694091797, 165.43331909179688, 28.623310089111328, 210.21438598632812, 64.34246826171875, 241.97955322265625, 114.0487060546875, 180.97918701171875, 41.388179779052734, 179.4368896484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000631.npy"} +{"epoch": 0.9538926681783825, "step": 632, "batch_size": 64, "mean": 78.01876831054688, "std": 86.14340209960938, "min": -112.94473266601562, "p10": -27.132029342651364, "median": 72.01583862304688, "p90": 182.65112915039063, "max": 248.49053955078125, "pos_frac": 0.828125, "sample": [99.04402160644531, 171.73126220703125, 83.90412902832031, 4.765331268310547, 65.05760192871094, 181.84841918945312, 4.461742401123047, 107.20995330810547, -24.457653045654297, 182.99514770507812, 72.9696044921875, -58.7169189453125, 74.8876953125, -13.35525894165039, -60.27894592285156, 174.9753875732422, 196.04129028320312, 8.053703308105469, 173.0835723876953, -73.04821014404297, 57.472015380859375, 30.879535675048828, -100.69522094726562, 25.766006469726562, 54.66161346435547, 138.00143432617188, 67.0279541015625, 139.67889404296875, 55.180721282958984, 28.201770782470703, 152.47970581054688, 248.49053955078125, 75.68170166015625, -28.27819061279297, 168.69180297851562, 25.104875564575195, 176.96450805664062, 52.277183532714844, 101.03083038330078, 107.12889862060547, 178.45428466796875, 171.52801513671875, 14.176055908203125, -11.529167175292969, 10.100261688232422, 192.65115356445312, 143.17355346679688, 95.95701599121094, 190.36563110351562, 168.07394409179688, 186.55908203125, -112.94473266601562, 71.06207275390625, 115.23492431640625, -7.0566558837890625, 0.8071060180664062, 199.04661560058594, 170.39169311523438, 165.84107971191406, 27.490800857543945, 58.507667541503906, 45.338199615478516, -82.88438415527344, 55.93851852416992], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000632.npy"} +{"epoch": 0.9554043839758125, "step": 633, "batch_size": 64, "mean": 59.944671630859375, "std": 90.98613739013672, "min": -117.03594207763672, "p10": -47.536891937255845, "median": 47.36437225341797, "p90": 185.00756225585937, "max": 263.4246826171875, "pos_frac": 0.71875, "sample": [-3.132863998413086, 45.47142791748047, 32.00751495361328, 87.867431640625, 156.4042205810547, -4.978363037109375, 84.2333984375, 116.06430053710938, 39.91168212890625, 72.59210968017578, -3.1199493408203125, 11.271440505981445, 252.0298309326172, 48.70481491088867, -61.22562026977539, 119.67613983154297, 9.058670043945312, 72.40614318847656, 62.75153350830078, -25.06218719482422, 9.388992309570312, -22.10430145263672, 86.1229476928711, 51.049964904785156, 137.6221160888672, 75.64456939697266, -20.542484283447266, -20.82024383544922, 122.73011016845703, 95.35485076904297, 118.9173583984375, -2.8707351684570312, 184.78829956054688, 18.327285766601562, -20.003543853759766, 21.406726837158203, -52.94883728027344, -24.912582397460938, -75.09335327148438, -34.909019470214844, -94.4956283569336, 30.810001373291016, 2.966358184814453, 244.78622436523438, 56.181556701660156, 47.59644317626953, 47.132301330566406, -81.24834442138672, 61.10694885253906, 185.4114990234375, 185.10153198242188, 163.07769775390625, 170.5692138671875, 176.75164794921875, 10.599746704101562, -69.49260711669922, 5.054904937744141, 26.211421966552734, 174.665771484375, 208.1275177001953, 263.4246826171875, -117.03594207763672, 240.77427673339844, 138.30209350585938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000633.npy"} +{"epoch": 0.9569160997732427, "step": 634, "batch_size": 64, "mean": 25.048431396484375, "std": 92.54147338867188, "min": -160.02662658691406, "p10": -95.36680908203125, "median": 3.164113998413086, "p90": 166.77040710449222, "max": 253.8483123779297, "pos_frac": 0.53125, "sample": [-5.601558685302734, -96.10214233398438, -2.6111068725585938, 180.39004516601562, 29.525543212890625, -10.205587387084961, -15.99685287475586, -13.327634811401367, 36.284141540527344, 18.809494018554688, 21.1326847076416, 5.403892517089844, -1.9075279235839844, -34.414146423339844, -20.442901611328125, 42.25282287597656, 91.70018005371094, 66.33261108398438, -67.00811004638672, -45.381858825683594, -35.98954772949219, -1.3808174133300781, 139.8213348388672, -141.9139404296875, 189.97596740722656, 2.5592803955078125, 178.58123779296875, 141.20193481445312, 253.8483123779297, -111.12959289550781, -0.341522216796875, 19.439355850219727, -3.2879066467285156, -30.479320526123047, 170.6630096435547, -15.988748550415039, -76.66346740722656, -128.91368103027344, 206.74879455566406, 157.6876678466797, 112.13185119628906, -93.65103149414062, -104.0098876953125, 51.070194244384766, -116.79681396484375, -160.02662658691406, 0.6318092346191406, 3.7689476013183594, 177.95108032226562, 56.95157241821289, -40.80169677734375, -37.77732849121094, 94.6865463256836, 40.62946319580078, 8.297525405883789, -3.866230010986328, 155.2831268310547, 118.16818237304688, 50.207054138183594, 74.9222640991211, -6.966606140136719, 6.755598068237305, -31.336036682128906, 153.6063232421875], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000634.npy"} +{"epoch": 0.9584278155706727, "step": 635, "batch_size": 64, "mean": 48.86872100830078, "std": 99.0593032836914, "min": -166.50241088867188, "p10": -75.80367584228516, "median": 25.937240600585938, "p90": 174.8298538208008, "max": 238.0272979736328, "pos_frac": 0.6875, "sample": [-72.67144775390625, 157.156005859375, -107.99352264404297, 6.744159698486328, 76.37667846679688, 17.63634490966797, -77.06033325195312, -137.36734008789062, -94.50387573242188, 176.34408569335938, 1.7545242309570312, 149.83816528320312, 0.9311065673828125, -10.151954650878906, 156.4358673095703, 199.945068359375, 137.16275024414062, 13.353225708007812, 186.08065795898438, 142.6732635498047, -72.87147521972656, 21.83990478515625, -49.603858947753906, 221.03997802734375, 30.034576416015625, -68.05442810058594, 136.7782440185547, -1.7604808807373047, -20.31869125366211, 85.12228393554688, 81.93792724609375, -58.21552276611328, 169.0525360107422, 12.981834411621094, 47.540199279785156, 15.224918365478516, 161.68577575683594, 5.491016387939453, 171.29664611816406, -139.48318481445312, 103.29060363769531, 224.44110107421875, -29.628772735595703, 198.65269470214844, -19.521820068359375, -39.34834289550781, 86.29769897460938, 101.64801788330078, 108.98472595214844, 17.179672241210938, 88.71688079833984, 238.0272979736328, -5.658843994140625, 69.24954986572266, -166.50241088867188, 101.77007293701172, 145.81712341308594, 19.469528198242188, 6.490570068359375, 119.85911560058594, -93.35115051269531, 102.20164489746094, 77.2933120727539, -0.18204498291015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000635.npy"} +{"epoch": 0.9599395313681028, "step": 636, "batch_size": 64, "mean": 67.705322265625, "std": 88.60031127929688, "min": -161.98947143554688, "p10": -19.68649673461914, "median": 58.75937080383301, "p90": 167.42059173583985, "max": 285.61639404296875, "pos_frac": 0.828125, "sample": [163.7978057861328, 7.729606628417969, 13.794408798217773, 39.71227264404297, 94.34607696533203, 23.19361114501953, 79.46649169921875, 9.025917053222656, -24.73230743408203, 166.6595916748047, 111.15158081054688, -9.883012771606445, 144.96827697753906, 129.9292755126953, 51.169342041015625, 26.354721069335938, -37.38264465332031, 152.92832946777344, 56.43376922607422, 132.67523193359375, 119.7812271118164, 21.229454040527344, 3.0432872772216797, 149.36480712890625, 6.83880615234375, 82.63086700439453, 247.36166381835938, 4.060819625854492, -6.774557113647461, 94.09142303466797, 60.80727767944336, 56.711463928222656, 228.78904724121094, 81.261962890625, -18.518325805664062, 150.95773315429688, 69.53874206542969, 67.84284210205078, -20.18714141845703, 167.74673461914062, 99.03923034667969, 194.7684326171875, -9.592864990234375, 285.61639404296875, 6.463222503662109, -161.98947143554688, 208.8121795654297, 46.078857421875, 14.351749420166016, 165.7474365234375, 98.00465393066406, 54.975440979003906, 130.15249633789062, 207.98416137695312, 101.25413513183594, -124.99502563476562, -151.53225708007812, 14.659555435180664, 49.09315490722656, 124.09413146972656, 53.571746826171875, -73.64447784423828, 62.944297790527344, 39.367279052734375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000636.npy"} +{"epoch": 0.9614512471655329, "step": 637, "batch_size": 64, "mean": 50.50914001464844, "std": 101.32233428955078, "min": -243.71743774414062, "p10": -68.23832092285154, "median": 31.335208892822266, "p90": 189.52871704101562, "max": 311.29583740234375, "pos_frac": 0.703125, "sample": [7.43084716796875, 188.72171020507812, 28.93115997314453, 311.29583740234375, -22.633811950683594, 11.90911865234375, -29.40058135986328, 109.59957122802734, 211.78237915039062, 43.98060989379883, -30.66356658935547, 20.71855926513672, 100.7211685180664, -110.25678253173828, 104.7492446899414, 42.06662368774414, -1.8737106323242188, 108.46797180175781, 164.7084197998047, -20.05693244934082, 85.79444885253906, 52.26936340332031, 8.99298095703125, -23.92395782470703, 6.999937057495117, 38.368316650390625, -77.35543060302734, 163.73277282714844, 232.0285186767578, 189.78598022460938, 186.32176208496094, 30.203590393066406, -121.19386291503906, 130.4378662109375, -36.08970642089844, 126.50433349609375, -93.57049560546875, 13.6201171875, 11.999763488769531, 58.883689880371094, 80.28834533691406, 211.653564453125, -1.863729476928711, 19.630878448486328, 178.48004150390625, 20.96050262451172, -35.63140869140625, 77.92437744140625, -92.6409912109375, -2.4076919555664062, 26.48358154296875, 225.45375061035156, 69.03530883789062, 73.35822296142578, 54.75093078613281, -98.77448272705078, 193.30044555664062, 32.466827392578125, -18.37761688232422, -243.71743774414062, 91.66368865966797, 188.92843627929688, -46.965065002441406, 4.5766448974609375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000637.npy"} +{"epoch": 0.9629629629629629, "step": 638, "batch_size": 64, "mean": 61.109458923339844, "std": 90.29197692871094, "min": -140.8404541015625, "p10": -32.65884284973144, "median": 34.16047286987305, "p90": 184.97481231689454, "max": 241.6077117919922, "pos_frac": 0.671875, "sample": [-140.8404541015625, 148.14073181152344, 126.83769226074219, -2.7548179626464844, -125.29946899414062, -0.8757781982421875, 199.73817443847656, 88.94650268554688, 37.42304611206055, -20.929645538330078, 10.455894470214844, -59.25363540649414, -9.887283325195312, -6.5357666015625, -39.34918212890625, 206.208251953125, -42.37298583984375, -32.6812744140625, 189.03680419921875, -1.0438385009765625, 105.57832336425781, 32.990577697753906, 149.24832153320312, 180.43658447265625, -72.98369598388672, 184.7281951904297, 104.58821868896484, 173.6065673828125, 2.6745147705078125, 60.637298583984375, 28.956777572631836, 190.11598205566406, 107.25517272949219, 163.95526123046875, 27.91302490234375, -12.191545486450195, 9.470695495605469, 126.67242431640625, 0.2966766357421875, 180.04310607910156, 84.73625946044922, 185.08050537109375, 184.40834045410156, -2.217975616455078, 169.51522827148438, -14.554000854492188, -1.7017555236816406, 172.47357177734375, 33.441680908203125, 36.77838897705078, -0.5912456512451172, 28.404369354248047, 241.6077117919922, 58.18194580078125, -32.606502532958984, 43.557762145996094, 1.80804443359375, 190.19540405273438, 179.83297729492188, 8.32943344116211, -13.027694702148438, -0.0790557861328125, 34.87926483154297, 53.59718322753906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000638.npy"} +{"epoch": 0.9644746787603931, "step": 639, "batch_size": 64, "mean": 69.29682159423828, "std": 94.20096588134766, "min": -102.85208129882812, "p10": -40.43501434326171, "median": 50.980438232421875, "p90": 212.07079315185547, "max": 284.9987487792969, "pos_frac": 0.75, "sample": [144.03692626953125, 112.99249267578125, 82.08488464355469, -45.700584411621094, 73.90985107421875, 120.7083969116211, 10.474327087402344, -29.998035430908203, -46.26012420654297, 114.99978637695312, 20.283370971679688, 59.29602813720703, 261.99822998046875, 44.563751220703125, 144.8280487060547, 5.305419921875, 39.733184814453125, 2.1750869750976562, -82.07317352294922, 80.1344223022461, 115.59593200683594, 160.28700256347656, 1.577810287475586, 211.17330932617188, 5.8456878662109375, 128.65093994140625, 76.48330688476562, 156.4526824951172, -41.787811279296875, 212.45542907714844, 213.8047637939453, -24.2264347076416, 0.8883800506591797, 115.40265655517578, -5.498897552490234, 7.966522216796875, 118.30501556396484, -8.749588012695312, 284.9987487792969, 163.74127197265625, 119.40418243408203, 57.397125244140625, 262.3736877441406, 67.90314483642578, -52.61175537109375, 10.968936920166016, -34.262779235839844, -25.308307647705078, 43.24369812011719, 32.82217025756836, 212.57952880859375, 151.00526428222656, 30.68956756591797, 28.672195434570312, -23.0760498046875, -102.85208129882812, 27.67144012451172, -37.27848815917969, -48.368812561035156, 235.2466278076172, -33.17523956298828, 145.4054412841797, 161.77584838867188, 197.91217041015625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000639.npy"} +{"epoch": 0.9659863945578231, "step": 640, "batch_size": 64, "mean": 61.44679260253906, "std": 92.2700424194336, "min": -188.05694580078125, "p10": -45.278989410400385, "median": 56.69157791137695, "p90": 172.5312942504883, "max": 245.67710876464844, "pos_frac": 0.78125, "sample": [158.59091186523438, 35.265872955322266, 245.67710876464844, -66.91669464111328, 17.322418212890625, 99.87593078613281, 117.08847045898438, 6.4960784912109375, 152.77169799804688, 183.10684204101562, 70.99502563476562, 14.141075134277344, 106.8236312866211, 112.722412109375, -129.65452575683594, 89.13284301757812, 56.514610290527344, 77.56741333007812, -42.20425033569336, 201.47000122070312, -180.8179473876953, 119.19129180908203, 215.3222198486328, 39.27888488769531, -52.07786560058594, -19.266460418701172, 122.34021759033203, 25.36237335205078, -46.43628692626953, 2.156330108642578, 158.20468139648438, -5.7618255615234375, 23.698028564453125, 168.82611083984375, 73.51513671875, -2.0807876586914062, -0.38594818115234375, 41.641754150390625, -57.85783386230469, 70.89273834228516, 26.867477416992188, 168.71954345703125, 5.929145812988281, 58.3675537109375, 174.0947723388672, 118.02152252197266, 96.55408477783203, -188.05694580078125, 41.88506317138672, 159.90390014648438, 119.72627258300781, 238.43814086914062, 56.86854553222656, 211.92034912109375, 7.3536224365234375, -30.068456649780273, 168.8831787109375, -42.57862854003906, 98.14212036132812, 53.939666748046875, 23.84769058227539, 37.37123107910156, 32.71227264404297, 91.22089385986328], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000640.npy"} +{"epoch": 0.9674981103552532, "step": 641, "batch_size": 64, "mean": 58.35173797607422, "std": 75.60674285888672, "min": -192.5146942138672, "p10": -6.644132995605468, "median": 53.7611083984375, "p90": 160.27029876708988, "max": 294.0142822265625, "pos_frac": 0.84375, "sample": [-47.143062591552734, -69.76065826416016, 87.34518432617188, 92.43280029296875, 58.139312744140625, -5.877204895019531, 119.34751892089844, 13.141197204589844, 5.805961608886719, 13.928024291992188, 72.05513000488281, 23.54802131652832, 107.36328887939453, 164.5728302001953, 67.33001708984375, 8.700803756713867, 3.329254150390625, 183.37548828125, 182.02850341796875, 87.77903747558594, 112.20020294189453, 2.6692962646484375, 45.86133575439453, 44.97837829589844, 73.58069610595703, 163.6846160888672, 16.621627807617188, 65.25141906738281, 25.322982788085938, 107.52655029296875, 10.0357666015625, 99.400146484375, -6.972816467285156, 77.9675521850586, 12.967689514160156, -66.72872161865234, 105.11544799804688, 39.01460266113281, -32.281150817871094, 44.71852111816406, -192.5146942138672, 119.03480529785156, 76.21875, 13.218917846679688, 85.19039916992188, 210.77798461914062, 12.235458374023438, -2.621328353881836, 139.74172973632812, 56.15800476074219, 294.0142822265625, 88.27311706542969, 183.4596710205078, 152.30355834960938, -20.967193603515625, 51.36421203613281, 88.42529296875, 27.428817749023438, 29.51620864868164, 4.893280029296875, -0.28461456298828125, 18.042572021484375, 58.591575622558594, 133.6348419189453], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000641.npy"} +{"epoch": 0.9690098261526833, "step": 642, "batch_size": 64, "mean": 45.5564079284668, "std": 93.78766632080078, "min": -154.5404510498047, "p10": -73.41884078979491, "median": 39.61834144592285, "p90": 157.54635009765624, "max": 308.6103210449219, "pos_frac": 0.6875, "sample": [72.10700225830078, 41.86907196044922, 0.7662734985351562, -100.80227661132812, 39.315589904785156, -11.937108993530273, 93.30390930175781, 187.18759155273438, -27.442779541015625, -154.5404510498047, 308.6103210449219, 21.283775329589844, 88.98187255859375, -53.93560791015625, 86.20135498046875, 35.04972839355469, 127.35163879394531, 216.57760620117188, -35.250274658203125, -19.915653228759766, 99.6741714477539, 105.88339233398438, 151.25228881835938, -30.00570297241211, 120.67105102539062, 129.92616271972656, 182.67388916015625, 48.381622314453125, 155.70718383789062, 60.719093322753906, 83.14936065673828, 83.19281005859375, 82.88394165039062, 27.18478775024414, -13.423194885253906, 151.37315368652344, -78.24537658691406, 51.663841247558594, 19.012779235839844, -74.11582946777344, -7.943424224853516, 17.7027587890625, 6.810495376586914, -23.728363037109375, 122.84062194824219, 32.13053894042969, -45.94110107421875, 134.2262725830078, 141.93087768554688, 195.61398315429688, 19.7391357421875, 22.778175354003906, 158.33456420898438, 95.58258819580078, 182.62539672851562, 39.92109298706055, -71.79253387451172, 52.01557159423828, -146.35751342773438, -144.58193969726562, -7.1765899658203125, -42.21479797363281, -106.88914489746094, 17.642372131347656], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000642.npy"} +{"epoch": 0.9705215419501134, "step": 643, "batch_size": 64, "mean": 64.62714385986328, "std": 95.9227523803711, "min": -165.958984375, "p10": -53.63643074035644, "median": 64.53503799438477, "p90": 192.64208984375, "max": 264.828369140625, "pos_frac": 0.75, "sample": [54.03155517578125, 69.95101928710938, 64.41159057617188, 31.378875732421875, 3.1083593368530273, 223.35997009277344, 7.416971206665039, 156.8197784423828, 87.3049545288086, 26.74376678466797, 164.14013671875, 37.17261505126953, 103.45217895507812, 4.4512481689453125, 139.11917114257812, 139.48199462890625, -27.46649169921875, 15.660257339477539, 189.79730224609375, 201.64898681640625, 113.74361419677734, 28.88665008544922, 168.77947998046875, 56.846405029296875, -45.81922149658203, 193.61428833007812, 73.99589538574219, -47.52728271484375, 190.37362670898438, 220.384765625, 85.48080444335938, 134.0099334716797, -26.34039306640625, 122.16407775878906, 42.25022888183594, -55.4075813293457, 18.965639114379883, -4.539459228515625, 217.69290161132812, 167.57501220703125, 141.51976013183594, -49.503746032714844, 135.8099822998047, -12.136573791503906, 136.05865478515625, -100.55433654785156, -108.6414566040039, -165.958984375, 4.102649688720703, 45.67092514038086, -81.97747039794922, 113.85034942626953, 158.52273559570312, 64.89617156982422, 26.063385009765625, -84.61434173583984, -12.37921142578125, 198.38436889648438, 65.97441101074219, 64.65848541259766, -36.87839126586914, 264.828369140625, 105.08666229248047, -83.7587890625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000643.npy"} +{"epoch": 0.9720332577475435, "step": 644, "batch_size": 64, "mean": 46.66228485107422, "std": 95.69481658935547, "min": -213.08941650390625, "p10": -56.536017227172835, "median": 22.3531494140625, "p90": 174.7918258666992, "max": 207.81698608398438, "pos_frac": 0.703125, "sample": [165.4658203125, -76.96453857421875, -213.08941650390625, 155.09365844726562, -38.39570236206055, -62.596248626708984, 12.846435546875, 8.528806686401367, 152.56690979003906, 206.46615600585938, 69.17973327636719, 17.896167755126953, 174.94244384765625, 140.6954345703125, 69.11502075195312, 44.121612548828125, 56.10285568237305, 36.22053527832031, -0.7847976684570312, 177.9354248046875, 8.144412994384766, 165.25949096679688, -142.60931396484375, -23.223098754882812, -13.26165771484375, 109.53250885009766, -1.7046127319335938, 84.71440124511719, -1.7530517578125, -41.82316589355469, 182.08644104003906, -21.52471923828125, 11.354347229003906, 112.89958190917969, 147.520263671875, -5.050628662109375, -42.395477294921875, 207.81698608398438, 174.4403839111328, 19.75921630859375, 86.56958770751953, 184.81427001953125, 98.65103149414062, 10.449743270874023, 17.24847412109375, -193.09356689453125, -14.894271850585938, 112.74351501464844, 23.745559692382812, 154.60272216796875, -20.927413940429688, 17.85552978515625, 3.9038829803466797, -81.97408294677734, 32.766265869140625, 20.960739135742188, -120.76071166992188, 101.116943359375, 101.119873046875, 3.2589950561523438, 17.011703491210938, 164.25161743164062, 41.97693634033203, 199.46051025390625], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000644.npy"} +{"epoch": 0.9735449735449735, "step": 645, "batch_size": 64, "mean": 56.69789123535156, "std": 82.6423110961914, "min": -180.48861694335938, "p10": -38.78116722106933, "median": 55.31107521057129, "p90": 165.28256988525393, "max": 268.288330078125, "pos_frac": 0.78125, "sample": [33.977542877197266, 192.746337890625, 116.35689544677734, -86.43738555908203, 82.73823547363281, 236.63363647460938, 129.09664916992188, 6.089399337768555, -14.551994323730469, 21.642738342285156, 5.635982513427734, -96.68736267089844, 51.87236785888672, -0.10197067260742188, 156.302978515625, 41.23219299316406, 103.77978515625, 4.444042205810547, -6.371826171875, 11.48780632019043, 178.8154296875, -40.706459045410156, 44.60106658935547, 79.19795989990234, 81.3248062133789, -17.239524841308594, 63.238487243652344, 77.05621337890625, 177.1528778076172, 108.05054473876953, 70.9863510131836, 0.7867374420166016, 68.17456817626953, -1.587158203125, 12.618301391601562, 109.26846313476562, -95.63008117675781, 1.1367034912109375, -60.64874267578125, 169.13096618652344, 104.33103942871094, 109.0827407836914, 268.288330078125, -2.2565231323242188, 38.08335494995117, 89.6456069946289, 127.07897186279297, 63.69196319580078, 75.75518798828125, 108.5054931640625, 16.334884643554688, 134.62008666992188, 55.94815444946289, 149.1290283203125, 54.67399597167969, 0.4775238037109375, 138.04937744140625, -34.98952102661133, -40.406158447265625, -180.48861694335938, 18.710044860839844, 171.3446502685547, 125.33924865722656, 22.10228729248047], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000645.npy"} +{"epoch": 0.9750566893424036, "step": 646, "batch_size": 64, "mean": 53.204830169677734, "std": 95.7218017578125, "min": -178.31944274902344, "p10": -42.48242340087889, "median": 28.72286605834961, "p90": 178.37750701904298, "max": 297.3627014160156, "pos_frac": 0.71875, "sample": [-47.243499755859375, 1.7817440032958984, -5.475746154785156, 129.3332061767578, 179.13519287109375, 143.1757354736328, -109.02671813964844, 198.95687866210938, 97.83497619628906, 176.6095733642578, -7.5217437744140625, 22.161285400390625, 165.30770874023438, 162.89749145507812, 113.88504028320312, -7.2563629150390625, 93.8091812133789, 66.02243041992188, 183.75955200195312, 112.3730239868164, 198.22064208984375, 106.13308715820312, -177.37962341308594, -28.74347686767578, -76.54263305664062, 112.6556167602539, 4.937129974365234, -11.429672241210938, 26.565872192382812, 23.437652587890625, 65.15524291992188, 0.4434967041015625, 24.97943878173828, 185.72068786621094, 100.04705810546875, 9.249839782714844, 30.879859924316406, -3.1979827880859375, 56.770263671875, 117.8922119140625, -0.6039218902587891, -31.373245239257812, 88.68116760253906, -73.27732849121094, 128.8231201171875, 297.3627014160156, 170.3624267578125, 128.28372192382812, 25.11886978149414, 241.04141235351562, 34.43113708496094, 4.850677490234375, 9.876434326171875, -17.610702514648438, -178.31944274902344, 18.983230590820312, 89.54458618164062, -126.6097640991211, -29.404403686523438, 148.8104248046875, 10.283496856689453, -14.617538452148438, 1.4251441955566406, 42.733158111572266], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000646.npy"} +{"epoch": 0.9765684051398337, "step": 647, "batch_size": 64, "mean": 82.75460815429688, "std": 92.1798095703125, "min": -135.86695861816406, "p10": -31.277162170410154, "median": 70.49905395507812, "p90": 198.52490081787116, "max": 307.4119567871094, "pos_frac": 0.796875, "sample": [-4.871562957763672, 81.71887969970703, 174.09278869628906, 19.875808715820312, 69.50787353515625, 113.55400085449219, 21.38067626953125, 208.7020263671875, 103.97906494140625, 254.494873046875, 61.67326354980469, 83.91522216796875, 120.58091735839844, -2.506816864013672, -32.26887512207031, 51.5057373046875, 307.4119567871094, -36.49323272705078, -82.901611328125, 179.71646118164062, 169.4414520263672, 66.69859313964844, 119.34783172607422, 71.490234375, 207.16754150390625, 145.66122436523438, 159.4147186279297, -5.150091171264648, 184.71420288085938, 27.389556884765625, 149.90109252929688, -17.6094970703125, 157.91513061523438, 13.396720886230469, 138.51710510253906, -30.336868286132812, 46.48701858520508, 184.63229370117188, 31.61858367919922, -61.00969696044922, 103.8288803100586, 46.332054138183594, 62.66586685180664, 132.01953125, -135.86695861816406, 33.88642120361328, 90.9753189086914, 39.47720718383789, 30.9957275390625, 60.222686767578125, -31.680145263671875, 229.22073364257812, 158.15773010253906, 4.6285400390625, -86.518310546875, 165.0086669921875, 30.532636642456055, 263.5953674316406, -20.34363555908203, 178.52639770507812, 204.4437713623047, 39.85462188720703, 122.20598602294922, 121.37103271484375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000647.npy"} +{"epoch": 0.9780801209372638, "step": 648, "batch_size": 64, "mean": 59.092376708984375, "std": 101.54547882080078, "min": -184.78768920898438, "p10": -49.882979965209955, "median": 66.0661506652832, "p90": 180.50133361816407, "max": 297.793701171875, "pos_frac": 0.6875, "sample": [153.9293212890625, 38.59178924560547, 53.758522033691406, -181.60565185546875, 150.28387451171875, -61.10585021972656, -184.78768920898438, 10.880455017089844, 180.07598876953125, 68.7790298461914, -50.95732498168945, 89.70479583740234, 62.05438995361328, -6.784782409667969, -47.37617492675781, -113.17134857177734, 48.140445709228516, -16.537742614746094, 297.793701171875, 165.03781127929688, 188.2627716064453, 117.45014190673828, 115.96279907226562, 129.200927734375, 152.84375, -16.062530517578125, 81.21150207519531, 194.05023193359375, 58.64911651611328, 90.66780090332031, -13.731063842773438, -3.6186447143554688, 264.3614501953125, 268.6156005859375, 3.8331375122070312, -64.01061248779297, 56.17921447753906, 72.6507797241211, 103.5713119506836, 11.293174743652344, 115.13735961914062, 148.28265380859375, 180.68362426757812, -31.368152618408203, -34.69110870361328, 16.661521911621094, 63.353271484375, 91.01459503173828, 93.34706115722656, 188.9071807861328, 115.37663269042969, 148.71286010742188, 119.36822509765625, -168.27674865722656, -46.555084228515625, 80.65385437011719, 117.61955261230469, -41.132911682128906, 42.91838455200195, -46.388492584228516, -0.9113235473632812, -23.61130714416504, 68.82266235351562, 115.90335845947266], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000648.npy"} +{"epoch": 0.9795918367346939, "step": 649, "batch_size": 64, "mean": 60.921424865722656, "std": 97.08753204345703, "min": -174.96189880371094, "p10": -74.90256500244139, "median": 69.61957931518555, "p90": 176.18030548095706, "max": 283.75299072265625, "pos_frac": 0.703125, "sample": [148.2956085205078, 101.91592407226562, -44.56063461303711, 120.79554748535156, 154.1457977294922, 161.8372802734375, 26.698745727539062, 17.738805770874023, -10.56011962890625, 168.10391235351562, -1.0939884185791016, 283.75299072265625, 120.91551208496094, -13.23312759399414, 130.6363983154297, 130.1782989501953, 118.8255615234375, 75.99828338623047, 118.66706085205078, 165.84873962402344, 182.82736206054688, -12.561685562133789, -131.17898559570312, -40.64653778076172, -174.96189880371094, 113.39846801757812, 14.712333679199219, 50.92677307128906, -79.4637451171875, -104.91461181640625, 70.38313293457031, 41.269737243652344, 146.61190795898438, -0.5995464324951172, 96.06561279296875, 135.84115600585938, 68.85602569580078, 130.4545135498047, 128.34771728515625, 150.1311492919922, 9.019416809082031, 198.74819946289062, 83.5391616821289, -13.03030776977539, 6.610748291015625, 179.64161682128906, 2.9266433715820312, 17.12751007080078, -6.6419830322265625, 47.322479248046875, 13.712425231933594, 235.4205322265625, -64.25981140136719, -113.35879516601562, 217.70689392089844, -28.56644058227539, -86.50830078125, -86.03836059570312, 95.8743896484375, 179.7120361328125, 155.03265380859375, 76.0695571899414, -1.4073982238769531, 19.91290283203125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000649.npy"} +{"epoch": 0.981103552532124, "step": 650, "batch_size": 64, "mean": 62.88866424560547, "std": 98.08202362060547, "min": -162.01885986328125, "p10": -50.61519355773925, "median": 38.3546142578125, "p90": 185.80362854003909, "max": 241.5028533935547, "pos_frac": 0.78125, "sample": [-48.71867752075195, 225.5271453857422, 186.91848754882812, 150.2530975341797, 17.01335906982422, 167.27374267578125, 147.06185913085938, 39.266815185546875, 11.370933532714844, 21.66342544555664, 164.343505859375, 150.87681579589844, -82.34376525878906, 5.186134338378906, 2.5219669342041016, 140.71096801757812, 144.1750030517578, 58.30320739746094, 204.1492462158203, 0.05974769592285156, 149.46994018554688, 85.26445770263672, -51.42798614501953, 4.850231170654297, 175.2253875732422, 187.88192749023438, 186.86366271972656, 160.34207153320312, 96.9944839477539, -90.8832015991211, 4.052333831787109, -140.92945861816406, 7.534687042236328, 123.85171508789062, -162.01885986328125, 26.665939331054688, 175.5258331298828, 90.71437072753906, 18.77123260498047, -28.708229064941406, -32.43023681640625, 73.78240966796875, -132.77374267578125, 166.868408203125, -34.5390625, -2.9081497192382812, 241.5028533935547, 183.33021545410156, 62.82537841796875, -52.11506652832031, 126.96192932128906, 8.152816772460938, 172.8130645751953, 3.0241432189941406, 25.77726936340332, 31.667436599731445, -30.490249633789062, 37.442413330078125, 164.51919555664062, 228.48861694335938, 6.23284912109375, -15.73831558227539, 57.08539962768555, 9.741462707519531], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000650.npy"} +{"epoch": 0.982615268329554, "step": 651, "batch_size": 64, "mean": 54.385494232177734, "std": 88.85526275634766, "min": -147.02447509765625, "p10": -44.16695404052734, "median": 22.317787170410156, "p90": 185.11818237304692, "max": 273.41497802734375, "pos_frac": 0.71875, "sample": [-1.6015701293945312, 14.40625, 87.47271728515625, -17.3345947265625, 40.59398651123047, -60.654701232910156, -46.807701110839844, 73.95220184326172, 17.740509033203125, 169.52366638183594, 12.28118896484375, -17.214019775390625, -11.807975769042969, 14.267234802246094, 100.0621337890625, -147.02447509765625, 4.384742736816406, 245.85687255859375, 54.81786346435547, 173.0559844970703, 175.28793334960938, -4.53045654296875, -37.20491027832031, 90.51097106933594, 11.521835327148438, 12.21829605102539, 72.812744140625, 117.4139404296875, -24.479385375976562, 189.33114624023438, 31.62015151977539, 204.66360473632812, 7.403270721435547, -7.374794006347656, 49.69844055175781, -0.39618873596191406, 160.1158905029297, 39.38844299316406, -47.05500030517578, 47.69672775268555, 190.20352172851562, 23.519760131835938, 124.364501953125, 2.578350067138672, -15.87802505493164, 190.8802490234375, 213.7351531982422, 154.556640625, -54.235313415527344, 168.61245727539062, 20.59819221496582, 8.368988037109375, 4.8306884765625, 114.19141387939453, 108.2381591796875, 104.41016387939453, 158.25772094726562, 2.0545005798339844, 21.115814208984375, -82.12234497070312, 69.65907287597656, -77.29087829589844, 273.41497802734375, -38.005210876464844], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000651.npy"} +{"epoch": 0.9841269841269841, "step": 652, "batch_size": 64, "mean": 51.03858947753906, "std": 100.43689727783203, "min": -182.96173095703125, "p10": -62.85539245605469, "median": 23.335201263427734, "p90": 177.59119110107423, "max": 338.057861328125, "pos_frac": 0.6875, "sample": [8.278438568115234, 162.4043426513672, 169.51968383789062, 26.64568328857422, -46.845787048339844, 182.4237060546875, 10.788400650024414, 63.8774528503418, 169.2306671142578, 7.821693420410156, 172.0826416015625, -110.4718246459961, 3.520404815673828, 31.860902786254883, 97.17776489257812, 172.53570556640625, 9.803955078125, 118.20357513427734, 75.22553253173828, 4.4362335205078125, -64.25857543945312, 162.473388671875, 131.0396270751953, 0.308929443359375, 16.167957305908203, -36.582786560058594, -182.96173095703125, -49.497711181640625, 212.3994903564453, 81.59444427490234, 20.02471923828125, -33.54967498779297, 82.01020812988281, -0.11148834228515625, 128.08404541015625, -71.46607208251953, 170.84890747070312, 115.12985229492188, -12.451408386230469, -100.35806274414062, -33.08110046386719, 189.30860900878906, -4.198707580566406, 125.45076751708984, -22.920654296875, -15.561267852783203, 182.32131958007812, 139.68606567382812, 0.2941570281982422, 182.91366577148438, 338.057861328125, 70.48798370361328, 96.46998596191406, -13.636848449707031, -12.39937973022461, 30.309585571289062, -95.94999694824219, 9.950021743774414, -59.581298828125, 179.75782775878906, 46.162933349609375, 11.140838623046875, -145.46591186523438, 169.58993530273438], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000652.npy"} +{"epoch": 0.9856386999244142, "step": 653, "batch_size": 64, "mean": 63.47991180419922, "std": 93.8610610961914, "min": -155.35557556152344, "p10": -51.24913406372069, "median": 60.50150108337402, "p90": 189.18298645019533, "max": 268.6130065917969, "pos_frac": 0.78125, "sample": [20.628999710083008, 153.89894104003906, 14.131721496582031, -2.16998291015625, 73.36770629882812, 35.31427001953125, 67.84564971923828, -63.603065490722656, 191.23541259765625, 11.299346923828125, -16.166439056396484, 2.1392669677734375, 117.61810302734375, -40.19844055175781, 268.6130065917969, 147.44570922851562, 99.56173706054688, 200.65371704101562, 23.20528793334961, 190.905029296875, 118.09741973876953, 209.03712463378906, 91.61066436767578, -0.7820968627929688, 70.24142456054688, 34.663429260253906, 185.16488647460938, 29.472274780273438, -4.595859527587891, -16.249618530273438, 224.31643676757812, -84.21858215332031, -55.985145568847656, 30.47891616821289, 25.920000076293945, -79.67909240722656, 60.36427688598633, 72.83307647705078, 108.34971618652344, 100.20111083984375, 21.076263427734375, -131.3238067626953, 248.80996704101562, 67.82373046875, 133.4532470703125, -155.35557556152344, 167.99266052246094, -12.1043701171875, 142.82728576660156, 85.64445495605469, 3.2626571655273438, 183.303955078125, -144.00991821289062, 5.6255340576171875, 3.8502864837646484, 31.445764541625977, 154.19094848632812, 168.16087341308594, 13.871074676513672, 118.8719482421875, 60.63872528076172, 113.92585754394531, 21.891075134277344, 143.87533569335938], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000653.npy"} +{"epoch": 0.9871504157218443, "step": 654, "batch_size": 64, "mean": 54.44564437866211, "std": 91.82136535644531, "min": -120.96903228759766, "p10": -55.39079513549804, "median": 42.241037368774414, "p90": 182.6667251586914, "max": 319.60125732421875, "pos_frac": 0.71875, "sample": [11.296272277832031, 211.3228302001953, -120.96903228759766, 109.99276733398438, 44.4364013671875, -89.15825653076172, 183.79307556152344, 82.03053283691406, 4.577579498291016, -57.7469482421875, -13.946426391601562, -44.99681091308594, 92.47920989990234, 3.7799148559570312, -20.765716552734375, 22.579397201538086, 166.59738159179688, -90.74795532226562, 184.8235321044922, 23.529190063476562, 34.40586853027344, 16.825366973876953, 172.21185302734375, 218.31448364257812, -4.633367538452148, -15.112419128417969, 8.013042449951172, -18.22290802001953, -49.893104553222656, 30.811748504638672, -5.56243896484375, 141.51071166992188, 319.60125732421875, 94.23075866699219, 60.504066467285156, 180.03857421875, 152.38284301757812, -23.641265869140625, 21.597976684570312, 79.32135009765625, 127.1292495727539, 67.33488464355469, 98.96510314941406, -95.2400894165039, 25.63684844970703, 13.710861206054688, 193.8241729736328, 178.49664306640625, 51.057220458984375, 77.72386169433594, 96.34230041503906, 186.66012573242188, 2.8081817626953125, 69.0909194946289, 168.145751953125, -68.509765625, -2.0523223876953125, 77.81275939941406, 73.74165344238281, 101.38221740722656, 40.42595291137695, 44.056121826171875, -43.98991394042969, -115.64279174804688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000654.npy"} +{"epoch": 0.9886621315192744, "step": 655, "batch_size": 64, "mean": 79.42540740966797, "std": 80.28729248046875, "min": -90.65547180175781, "p10": -12.516321563720702, "median": 80.53816223144531, "p90": 174.38591613769535, "max": 236.62327575683594, "pos_frac": 0.796875, "sample": [139.87051391601562, 113.47868347167969, -12.864173889160156, 12.46786880493164, 43.975311279296875, 131.54360961914062, 236.62327575683594, 111.8211669921875, 95.71485137939453, 15.839599609375, -6.910552978515625, 142.13876342773438, 1.049072265625, -7.396461486816406, -5.3976287841796875, -23.860107421875, 56.444549560546875, 193.48089599609375, 164.46209716796875, 24.732067108154297, 188.49819946289062, -11.704666137695312, 137.5808563232422, 219.8675079345703, 53.203208923339844, -15.705093383789062, 79.84002685546875, -76.86962890625, 230.36483764648438, -45.76837158203125, 161.19479370117188, 105.09768676757812, 166.13308715820312, 38.15364074707031, 81.23629760742188, 20.401233673095703, 55.7191162109375, 148.4934539794922, 118.94189453125, 233.42694091796875, 10.070205688476562, 23.160675048828125, -6.939788818359375, 177.56536865234375, 136.2786865234375, -68.52108764648438, 56.16310119628906, 126.34675598144531, 166.96719360351562, 155.0221710205078, -8.35806655883789, 29.785598754882812, 166.04278564453125, 66.96919250488281, 38.21150207519531, 110.56370544433594, 105.02780151367188, 77.6535415649414, 155.9542236328125, 29.256057739257812, -90.65547180175781, 83.03268432617188, 103.71115112304688, 124.59962463378906], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000655.npy"} +{"epoch": 0.9901738473167044, "step": 656, "batch_size": 64, "mean": 63.30681610107422, "std": 90.24092864990234, "min": -163.1591033935547, "p10": -27.635218429565423, "median": 48.93470001220703, "p90": 194.4081924438477, "max": 228.775390625, "pos_frac": 0.796875, "sample": [161.3347625732422, 37.01732635498047, 165.32830810546875, 155.495849609375, 13.156726837158203, 15.426803588867188, 10.295963287353516, -4.361045837402344, 25.24652099609375, -22.144569396972656, 3.677623748779297, 228.775390625, -11.135604858398438, 13.966156005859375, 1.7058258056640625, 127.45903015136719, -163.1591033935547, -19.35051727294922, 105.26139068603516, 150.09310913085938, 215.54287719726562, 17.682777404785156, -142.58848571777344, 40.49782180786133, 197.5815887451172, -34.41921615600586, 71.78382110595703, 183.04502868652344, -16.116683959960938, 114.45977783203125, 147.15460205078125, 7.276496887207031, 45.03435516357422, 54.08038330078125, 65.82146453857422, 129.37501525878906, 48.482940673828125, 55.84429931640625, 198.78150939941406, 72.57476806640625, 49.38645935058594, -92.73466491699219, 50.17888641357422, 213.91697692871094, 3.3277435302734375, 187.00360107421875, 61.95753479003906, 75.29425811767578, 37.680965423583984, 119.28173828125, 183.2428741455078, -29.988353729248047, -20.178466796875, 208.187255859375, 144.07318115234375, 19.858383178710938, 18.3939208984375, -101.26521301269531, -31.46923065185547, 20.44932746887207, 32.02464294433594, 55.44123840332031, 169.89886474609375, 211.68917846679688], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000656.npy"} +{"epoch": 0.9916855631141346, "step": 657, "batch_size": 64, "mean": 74.89022827148438, "std": 98.91642761230469, "min": -178.84963989257812, "p10": -12.538628959655757, "median": 78.54146194458008, "p90": 198.06196899414064, "max": 272.2905578613281, "pos_frac": 0.796875, "sample": [216.3503875732422, 62.311187744140625, 5.021198272705078, 249.6644287109375, 107.50989532470703, 18.513731002807617, 272.2905578613281, 187.30136108398438, 54.75226593017578, -153.8007354736328, 12.647998809814453, -14.87077522277832, 127.66014099121094, 40.95470428466797, 253.8157958984375, 88.6427001953125, 77.74906158447266, 173.923095703125, -120.89285278320312, 175.79489135742188, -1.497406005859375, 117.93389129638672, -128.63235473632812, 31.11747932434082, 80.46138763427734, 168.90139770507812, 59.8948974609375, -7.096954345703125, -4.057149887084961, 59.97089385986328, 137.2073974609375, 161.35018920898438, 7.5778961181640625, 156.15090942382812, 100.29621887207031, 42.86328125, 124.82811737060547, 132.9302215576172, 199.2431640625, 5.380884170532227, 241.70217895507812, 25.676742553710938, -3.86444091796875, 195.30584716796875, 8.102386474609375, 101.71942138671875, 211.83282470703125, 1.1226482391357422, -58.43413543701172, 79.3338623046875, 4.021888732910156, -178.84963989257812, 148.82247924804688, -2.075162887573242, 18.496931076049805, 107.6499252319336, -48.98560333251953, 112.44498443603516, 96.65472412109375, 188.4562225341797, 8.873210906982422, 104.44586944580078, -7.014396667480469, 157.37237548828125], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000657.npy"} +{"epoch": 0.9931972789115646, "step": 658, "batch_size": 64, "mean": 59.35535430908203, "std": 111.37400817871094, "min": -205.49313354492188, "p10": -76.88539428710938, "median": 49.850101470947266, "p90": 186.32528533935547, "max": 353.22802734375, "pos_frac": 0.734375, "sample": [79.50688171386719, 19.82223892211914, 186.73533630371094, -205.49313354492188, 162.59005737304688, 0.32762718200683594, -164.90196228027344, 48.04515075683594, 173.3159942626953, 177.46316528320312, -18.455581665039062, 104.42037963867188, -76.07762145996094, 63.45017623901367, 177.19468688964844, 69.59352111816406, -20.170516967773438, 131.87464904785156, 353.22802734375, 17.6334228515625, -17.80254554748535, 37.506134033203125, 47.111656188964844, 127.2940902709961, 178.64935302734375, 190.4126739501953, -127.17172241210938, 113.7928466796875, 84.63156127929688, 37.06510925292969, 6.973073959350586, -3.191852569580078, 78.31636810302734, 114.77449035644531, 0.43288421630859375, 57.871986389160156, 228.2880859375, -157.93313598632812, 80.92916107177734, 52.216766357421875, 184.92550659179688, 3.7488365173339844, 126.56370544433594, 185.36849975585938, -2.610239028930664, 49.72809600830078, -77.23158264160156, 204.58749389648438, 21.75420379638672, 80.71575927734375, 23.301742553710938, -0.31623268127441406, -33.336585998535156, -122.11640930175781, 41.69316864013672, 135.46881103515625, -7.239559173583984, -175.6314697265625, 252.95306396484375, -11.504539489746094, 271.57012939453125, 49.97210693359375, 181.76422119140625, 4.344518661499023], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000658.npy"} +{"epoch": 0.9947089947089947, "step": 659, "batch_size": 64, "mean": 49.65174865722656, "std": 93.83220672607422, "min": -169.9583740234375, "p10": -79.89029388427734, "median": 41.46404266357422, "p90": 179.04762725830082, "max": 237.01791381835938, "pos_frac": 0.71875, "sample": [43.75128173828125, 101.07817077636719, 183.77389526367188, 132.4046173095703, -5.9492034912109375, 237.01791381835938, 101.94918060302734, 106.92288970947266, 34.367027282714844, 192.47125244140625, 211.86074829101562, -6.7321929931640625, 27.711761474609375, 31.40536117553711, -0.7225570678710938, 6.333702087402344, 123.42271423339844, -122.12696075439453, 14.992986679077148, -82.75293731689453, 152.58547973632812, -73.2107925415039, 49.09332275390625, 60.54791259765625, 12.584859848022461, -12.9656982421875, 20.643625259399414, 36.46027374267578, -11.65605354309082, 74.24351501464844, 39.17680358886719, 52.86870574951172, 132.7257537841797, 113.59242248535156, 79.45818328857422, 16.001014709472656, 187.91458129882812, 106.3504638671875, 182.47952270507812, 15.391414642333984, 100.0009765625, -94.3480224609375, -93.78636169433594, 171.0398712158203, -31.9002628326416, 6.3482208251953125, -1.23663330078125, 141.61856079101562, 122.9629898071289, -68.57071685791016, 17.98480224609375, 162.30072021484375, -169.9583740234375, -95.3074951171875, 165.75425720214844, 47.85984802246094, 12.577430725097656, -163.67123413085938, 212.57937622070312, 75.28317260742188, -25.553375244140625, 121.22818756103516, 63.363616943359375, -64.32269287109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000659.npy"} +{"epoch": 0.9962207105064248, "step": 660, "batch_size": 64, "mean": 74.60331726074219, "std": 89.3137435913086, "min": -146.51443481445312, "p10": -34.785624694824214, "median": 67.4435806274414, "p90": 176.39584045410157, "max": 387.7391357421875, "pos_frac": 0.84375, "sample": [188.05679321289062, 43.82738494873047, 47.88252639770508, -65.48353576660156, 55.84130859375, -67.64803314208984, 8.494964599609375, 180.3087615966797, -146.51443481445312, -46.500213623046875, 56.959957122802734, 198.26116943359375, 42.5861701965332, 121.42582702636719, 19.649993896484375, 272.4181823730469, 143.83773803710938, 109.81724548339844, 30.654264450073242, -65.97114562988281, 89.46427917480469, 76.76715087890625, 55.299964904785156, 33.933921813964844, 85.67228698730469, 177.2855224609375, -28.178680419921875, 174.31991577148438, 85.10687255859375, -37.61717224121094, 71.74394989013672, 162.51373291015625, 387.7391357421875, 75.97724914550781, -4.584819793701172, -59.362579345703125, 17.104507446289062, 0.27573394775390625, 133.841796875, 70.32914733886719, 46.238685607910156, 15.107587814331055, 164.09033203125, 139.57473754882812, 163.8155975341797, 154.76412963867188, -7.14312744140625, 46.339317321777344, 148.9975128173828, 123.63484954833984, 24.919078826904297, 200.94467163085938, 21.65038299560547, 7.227182388305664, 161.2391357421875, 65.8104248046875, 78.4947509765625, 124.41047668457031, 12.672286987304688, 3.8344268798828125, 51.33433532714844, 103.9146728515625, 69.07673645019531, 158.12738037109375], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000660.npy"} +{"epoch": 0.9977324263038548, "step": 661, "batch_size": 64, "mean": 50.56440734863281, "std": 99.54283142089844, "min": -224.34364318847656, "p10": -69.9677619934082, "median": 42.60058403015137, "p90": 178.72654266357424, "max": 282.13873291015625, "pos_frac": 0.734375, "sample": [24.474380493164062, -14.121681213378906, -71.9478759765625, -118.80941772460938, 100.91644287109375, 118.2039794921875, 139.8451690673828, 0.735595703125, -224.34364318847656, 142.06825256347656, -126.00022888183594, 5.2498931884765625, -35.73884582519531, 179.57395935058594, 183.91009521484375, 123.46753692626953, 194.54515075683594, 70.41728210449219, 282.13873291015625, 57.885345458984375, -176.8700714111328, 84.47453308105469, 125.42727661132812, -72.52610778808594, -5.116397857666016, 22.616348266601562, 24.526107788085938, -44.379825592041016, 5.392662048339844, 12.736152648925781, 42.62968826293945, 69.21910858154297, -133.0693817138672, 42.57147979736328, 112.48373413085938, 9.584453582763672, 62.96897888183594, 174.90765380859375, 16.929576873779297, 162.59115600585938, 75.439453125, 40.73432922363281, -16.76678466796875, 154.09619140625, 176.74923706054688, 88.32107543945312, 213.45831298828125, 34.964332580566406, 6.41459846496582, 96.13724517822266, -65.34749603271484, -5.397651672363281, 22.584854125976562, -34.82958984375, 46.661434173583984, 139.99566650390625, 95.41129302978516, 116.91714477539062, 72.13816833496094, 183.82696533203125, 18.551513671875, -7.09759521484375, -29.39586639404297, 242.9879913330078], "npy": "outputs/llama3-8b-base-new-method-s_star0.6/margin_logs/step_0000661.npy"} diff --git a/model-00001-of-00007.safetensors b/model-00001-of-00007.safetensors new file mode 100644 index 0000000..de5f87b --- /dev/null +++ b/model-00001-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bddaa62c4db7b2bfd624620dd206f331ab63730313d9a28b6cc8f2d5f37443f +size 4886466168 diff --git a/model-00002-of-00007.safetensors b/model-00002-of-00007.safetensors new file mode 100644 index 0000000..762d7aa --- /dev/null +++ b/model-00002-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:edde0c2f6223fe51cb4be482a6fb0951132b4d772546cbb1c404dc4e06021f1f +size 4832007448 diff --git a/model-00003-of-00007.safetensors b/model-00003-of-00007.safetensors new file mode 100644 index 0000000..2918549 --- /dev/null +++ b/model-00003-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9572a4aa48bf6cb2f3c911918fcfce1f051c0fb31e1763731a5deb324c9b1fa0 +size 4999813112 diff --git a/model-00004-of-00007.safetensors b/model-00004-of-00007.safetensors new file mode 100644 index 0000000..99b4c6b --- /dev/null +++ b/model-00004-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4ce41ab23e1891be0e26579a06947d31f434d35d083c8e504d7cde4fe7b5efc +size 4999813128 diff --git a/model-00005-of-00007.safetensors b/model-00005-of-00007.safetensors new file mode 100644 index 0000000..82fc2b3 --- /dev/null +++ b/model-00005-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdab0e9bee793145e8afb9b39f6060ab4595df4d9a3b91ad4c5faa398e690092 +size 4832007496 diff --git a/model-00006-of-00007.safetensors b/model-00006-of-00007.safetensors new file mode 100644 index 0000000..a126fda --- /dev/null +++ b/model-00006-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:915ef5a26e1f6660946b0dffb51646c3d60c060b8758d691c47b99d376d5e232 +size 4999813120 diff --git a/model-00007-of-00007.safetensors b/model-00007-of-00007.safetensors new file mode 100644 index 0000000..b0e6b97 --- /dev/null +++ b/model-00007-of-00007.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1709dbc87a596447dec90f3d01f295ad26e4d5b0813ec8f79f4f96a40190c873 +size 2571158184 diff --git a/model.safetensors.index.json b/model.safetensors.index.json new file mode 100644 index 0000000..0985084 --- /dev/null +++ b/model.safetensors.index.json @@ -0,0 +1,298 @@ +{ + "metadata": { + "total_size": 32121044992 + }, + "weight_map": { + "lm_head.weight": "model-00007-of-00007.safetensors", + "model.embed_tokens.weight": "model-00001-of-00007.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.0.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.0.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.0.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.1.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.1.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.1.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.10.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.10.mlp.down_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.mlp.up_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.10.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.10.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.11.mlp.down_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.mlp.up_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.11.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.11.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.12.mlp.down_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.mlp.up_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.12.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.12.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.13.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.13.mlp.down_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.13.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.13.mlp.up_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.13.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.13.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.13.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.14.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.14.mlp.down_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.14.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.14.mlp.up_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.14.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.14.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.14.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.15.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.15.mlp.down_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.mlp.up_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.15.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.15.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.16.mlp.down_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.mlp.up_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.16.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.16.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.17.mlp.down_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.mlp.up_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.17.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.17.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.18.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.18.mlp.down_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.18.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.18.mlp.up_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.18.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.18.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.18.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.input_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.19.mlp.down_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.mlp.gate_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.mlp.up_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00004-of-00007.safetensors", + "model.layers.19.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.19.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-00007.safetensors", + "model.layers.2.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.2.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.2.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.20.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.20.mlp.down_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.20.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.20.mlp.up_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.20.self_attn.k_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.20.self_attn.q_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.20.self_attn.v_proj.weight": "model-00004-of-00007.safetensors", + "model.layers.21.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.21.mlp.down_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.21.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.21.mlp.up_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.21.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.21.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.21.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.22.mlp.down_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.mlp.up_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.22.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.22.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.23.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.23.mlp.down_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.23.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.23.mlp.up_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.23.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.23.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.23.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.24.input_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.24.mlp.down_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.24.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.24.mlp.up_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00005-of-00007.safetensors", + "model.layers.24.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.24.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.24.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.25.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.25.mlp.down_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.25.mlp.gate_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.25.mlp.up_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.25.self_attn.k_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.25.self_attn.q_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.25.self_attn.v_proj.weight": "model-00005-of-00007.safetensors", + "model.layers.26.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.26.mlp.down_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.mlp.up_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.26.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.26.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.27.mlp.down_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.mlp.up_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.27.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.27.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.28.mlp.down_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.mlp.up_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.28.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.28.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.29.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.29.mlp.down_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.29.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.29.mlp.up_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.29.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.29.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.29.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.3.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.3.mlp.down_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.3.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.3.mlp.up_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.3.self_attn.k_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.3.self_attn.q_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.3.self_attn.v_proj.weight": "model-00001-of-00007.safetensors", + "model.layers.30.input_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.30.mlp.down_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.30.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.30.mlp.up_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00006-of-00007.safetensors", + "model.layers.30.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.30.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.30.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.31.input_layernorm.weight": "model-00007-of-00007.safetensors", + "model.layers.31.mlp.down_proj.weight": "model-00007-of-00007.safetensors", + "model.layers.31.mlp.gate_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.31.mlp.up_proj.weight": "model-00007-of-00007.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00007-of-00007.safetensors", + "model.layers.31.self_attn.k_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.31.self_attn.q_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.31.self_attn.v_proj.weight": "model-00006-of-00007.safetensors", + "model.layers.4.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.4.mlp.down_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.4.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.4.mlp.up_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.4.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.4.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.4.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.4.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.5.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.5.mlp.down_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.5.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.5.mlp.up_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.5.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.5.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.5.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.6.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.6.mlp.down_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.6.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.6.mlp.up_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.6.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.6.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.6.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.7.input_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.7.mlp.down_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.7.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.7.mlp.up_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00002-of-00007.safetensors", + "model.layers.7.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.7.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.7.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.8.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.8.mlp.down_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.8.mlp.gate_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.8.mlp.up_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.8.self_attn.k_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.8.self_attn.q_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.8.self_attn.v_proj.weight": "model-00002-of-00007.safetensors", + "model.layers.9.input_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.9.mlp.down_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.9.mlp.gate_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.9.mlp.up_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00003-of-00007.safetensors", + "model.layers.9.self_attn.k_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.9.self_attn.q_proj.weight": "model-00003-of-00007.safetensors", + "model.layers.9.self_attn.v_proj.weight": "model-00003-of-00007.safetensors", + "model.norm.weight": "model-00007-of-00007.safetensors" + } +} diff --git a/special_tokens_map.json b/special_tokens_map.json new file mode 100644 index 0000000..e5b39b6 --- /dev/null +++ b/special_tokens_map.json @@ -0,0 +1,23 @@ +{ + "bos_token": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "eos_token": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + }, + "pad_token": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false + } +} diff --git a/tokenizer.json b/tokenizer.json new file mode 100644 index 0000000..86a3394 --- /dev/null +++ b/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c5cf44023714fb39b05e71e425f8d7b92805ff73f7988b083b8c87f0bf87393 +size 17209961 diff --git a/tokenizer_config.json b/tokenizer_config.json new file mode 100644 index 0000000..8c6916a --- /dev/null +++ b/tokenizer_config.json @@ -0,0 +1,2064 @@ +{ + "added_tokens_decoder": { + "128000": { + "content": "<|begin_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128001": { + "content": "<|end_of_text|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128002": { + "content": "<|reserved_special_token_0|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128003": { + "content": "<|reserved_special_token_1|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128004": { + "content": "<|reserved_special_token_2|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128005": { + "content": "<|reserved_special_token_3|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128006": { + "content": "<|start_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128007": { + "content": "<|end_header_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128008": { + "content": "<|reserved_special_token_4|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128009": { + "content": "<|eot_id|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128010": { + "content": "<|reserved_special_token_5|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128011": { + "content": "<|reserved_special_token_6|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128012": { + "content": "<|reserved_special_token_7|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128013": { + "content": "<|reserved_special_token_8|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128014": { + "content": "<|reserved_special_token_9|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128015": { + "content": "<|reserved_special_token_10|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128016": { + "content": "<|reserved_special_token_11|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128017": { + "content": "<|reserved_special_token_12|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128018": { + "content": "<|reserved_special_token_13|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128019": { + "content": "<|reserved_special_token_14|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128020": { + "content": "<|reserved_special_token_15|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128021": { + "content": "<|reserved_special_token_16|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128022": { + "content": "<|reserved_special_token_17|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128023": { + "content": "<|reserved_special_token_18|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128024": { + "content": "<|reserved_special_token_19|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128025": { + "content": "<|reserved_special_token_20|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128026": { + "content": "<|reserved_special_token_21|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128027": { + "content": "<|reserved_special_token_22|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128028": { + "content": "<|reserved_special_token_23|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128029": { + "content": "<|reserved_special_token_24|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128030": { + "content": "<|reserved_special_token_25|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128031": { + "content": "<|reserved_special_token_26|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128032": { + "content": "<|reserved_special_token_27|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128033": { + "content": "<|reserved_special_token_28|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128034": { + "content": "<|reserved_special_token_29|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128035": { + "content": "<|reserved_special_token_30|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128036": { + "content": "<|reserved_special_token_31|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128037": { + "content": "<|reserved_special_token_32|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128038": { + "content": "<|reserved_special_token_33|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128039": { + "content": "<|reserved_special_token_34|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128040": { + "content": "<|reserved_special_token_35|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128041": { + "content": "<|reserved_special_token_36|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128042": { + "content": "<|reserved_special_token_37|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128043": { + "content": "<|reserved_special_token_38|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128044": { + "content": "<|reserved_special_token_39|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128045": { + "content": "<|reserved_special_token_40|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128046": { + "content": "<|reserved_special_token_41|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128047": { + "content": "<|reserved_special_token_42|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128048": { + "content": "<|reserved_special_token_43|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128049": { + "content": "<|reserved_special_token_44|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128050": { + "content": "<|reserved_special_token_45|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128051": { + "content": "<|reserved_special_token_46|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128052": { + "content": "<|reserved_special_token_47|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128053": { + "content": "<|reserved_special_token_48|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128054": { + "content": "<|reserved_special_token_49|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128055": { + "content": "<|reserved_special_token_50|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128056": { + "content": "<|reserved_special_token_51|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128057": { + "content": "<|reserved_special_token_52|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128058": { + "content": "<|reserved_special_token_53|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128059": { + "content": "<|reserved_special_token_54|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128060": { + "content": "<|reserved_special_token_55|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128061": { + "content": "<|reserved_special_token_56|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128062": { + "content": "<|reserved_special_token_57|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128063": { + "content": "<|reserved_special_token_58|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128064": { + "content": "<|reserved_special_token_59|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128065": { + "content": "<|reserved_special_token_60|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128066": { + "content": "<|reserved_special_token_61|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128067": { + "content": "<|reserved_special_token_62|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128068": { + "content": "<|reserved_special_token_63|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128069": { + "content": "<|reserved_special_token_64|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128070": { + "content": "<|reserved_special_token_65|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128071": { + "content": "<|reserved_special_token_66|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128072": { + "content": "<|reserved_special_token_67|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128073": { + "content": "<|reserved_special_token_68|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128074": { + "content": "<|reserved_special_token_69|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128075": { + "content": "<|reserved_special_token_70|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128076": { + "content": "<|reserved_special_token_71|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128077": { + "content": "<|reserved_special_token_72|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128078": { + "content": "<|reserved_special_token_73|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128079": { + "content": "<|reserved_special_token_74|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128080": { + "content": "<|reserved_special_token_75|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128081": { + "content": "<|reserved_special_token_76|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128082": { + "content": "<|reserved_special_token_77|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128083": { + "content": "<|reserved_special_token_78|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128084": { + "content": "<|reserved_special_token_79|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128085": { + "content": "<|reserved_special_token_80|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128086": { + "content": "<|reserved_special_token_81|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128087": { + "content": "<|reserved_special_token_82|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128088": { + "content": "<|reserved_special_token_83|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128089": { + "content": "<|reserved_special_token_84|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128090": { + "content": "<|reserved_special_token_85|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128091": { + "content": "<|reserved_special_token_86|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128092": { + "content": "<|reserved_special_token_87|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128093": { + "content": "<|reserved_special_token_88|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128094": { + "content": "<|reserved_special_token_89|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128095": { + "content": "<|reserved_special_token_90|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128096": { + "content": "<|reserved_special_token_91|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128097": { + "content": "<|reserved_special_token_92|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128098": { + "content": "<|reserved_special_token_93|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128099": { + "content": "<|reserved_special_token_94|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128100": { + "content": "<|reserved_special_token_95|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128101": { + "content": "<|reserved_special_token_96|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128102": { + "content": "<|reserved_special_token_97|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128103": { + "content": "<|reserved_special_token_98|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128104": { + "content": "<|reserved_special_token_99|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128105": { + "content": "<|reserved_special_token_100|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128106": { + "content": "<|reserved_special_token_101|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128107": { + "content": "<|reserved_special_token_102|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128108": { + "content": "<|reserved_special_token_103|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128109": { + "content": "<|reserved_special_token_104|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128110": { + "content": "<|reserved_special_token_105|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128111": { + "content": "<|reserved_special_token_106|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128112": { + "content": "<|reserved_special_token_107|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128113": { + "content": "<|reserved_special_token_108|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128114": { + "content": "<|reserved_special_token_109|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128115": { + "content": "<|reserved_special_token_110|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128116": { + "content": "<|reserved_special_token_111|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128117": { + "content": "<|reserved_special_token_112|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128118": { + "content": "<|reserved_special_token_113|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128119": { + "content": "<|reserved_special_token_114|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128120": { + "content": "<|reserved_special_token_115|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128121": { + "content": "<|reserved_special_token_116|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128122": { + "content": "<|reserved_special_token_117|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128123": { + "content": "<|reserved_special_token_118|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128124": { + "content": "<|reserved_special_token_119|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128125": { + "content": "<|reserved_special_token_120|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128126": { + "content": "<|reserved_special_token_121|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128127": { + "content": "<|reserved_special_token_122|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128128": { + "content": "<|reserved_special_token_123|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128129": { + "content": "<|reserved_special_token_124|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128130": { + "content": "<|reserved_special_token_125|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128131": { + "content": "<|reserved_special_token_126|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128132": { + "content": "<|reserved_special_token_127|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128133": { + "content": "<|reserved_special_token_128|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128134": { + "content": "<|reserved_special_token_129|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128135": { + "content": "<|reserved_special_token_130|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128136": { + "content": "<|reserved_special_token_131|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128137": { + "content": "<|reserved_special_token_132|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128138": { + "content": "<|reserved_special_token_133|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128139": { + "content": "<|reserved_special_token_134|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128140": { + "content": "<|reserved_special_token_135|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128141": { + "content": "<|reserved_special_token_136|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128142": { + "content": "<|reserved_special_token_137|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128143": { + "content": "<|reserved_special_token_138|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128144": { + "content": "<|reserved_special_token_139|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128145": { + "content": "<|reserved_special_token_140|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128146": { + "content": "<|reserved_special_token_141|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128147": { + "content": "<|reserved_special_token_142|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128148": { + "content": "<|reserved_special_token_143|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128149": { + "content": "<|reserved_special_token_144|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128150": { + "content": "<|reserved_special_token_145|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128151": { + "content": "<|reserved_special_token_146|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128152": { + "content": "<|reserved_special_token_147|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128153": { + "content": "<|reserved_special_token_148|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128154": { + "content": "<|reserved_special_token_149|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128155": { + "content": "<|reserved_special_token_150|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128156": { + "content": "<|reserved_special_token_151|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128157": { + "content": "<|reserved_special_token_152|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128158": { + "content": "<|reserved_special_token_153|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128159": { + "content": "<|reserved_special_token_154|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128160": { + "content": "<|reserved_special_token_155|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128161": { + "content": "<|reserved_special_token_156|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128162": { + "content": "<|reserved_special_token_157|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128163": { + "content": "<|reserved_special_token_158|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128164": { + "content": "<|reserved_special_token_159|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128165": { + "content": "<|reserved_special_token_160|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128166": { + "content": "<|reserved_special_token_161|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128167": { + "content": "<|reserved_special_token_162|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128168": { + "content": "<|reserved_special_token_163|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128169": { + "content": "<|reserved_special_token_164|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128170": { + "content": "<|reserved_special_token_165|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128171": { + "content": "<|reserved_special_token_166|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128172": { + "content": "<|reserved_special_token_167|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128173": { + "content": "<|reserved_special_token_168|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128174": { + "content": "<|reserved_special_token_169|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128175": { + "content": "<|reserved_special_token_170|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128176": { + "content": "<|reserved_special_token_171|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128177": { + "content": "<|reserved_special_token_172|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128178": { + "content": "<|reserved_special_token_173|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128179": { + "content": "<|reserved_special_token_174|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128180": { + "content": "<|reserved_special_token_175|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128181": { + "content": "<|reserved_special_token_176|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128182": { + "content": "<|reserved_special_token_177|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128183": { + "content": "<|reserved_special_token_178|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128184": { + "content": "<|reserved_special_token_179|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128185": { + "content": "<|reserved_special_token_180|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128186": { + "content": "<|reserved_special_token_181|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128187": { + "content": "<|reserved_special_token_182|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128188": { + "content": "<|reserved_special_token_183|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128189": { + "content": "<|reserved_special_token_184|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128190": { + "content": "<|reserved_special_token_185|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128191": { + "content": "<|reserved_special_token_186|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128192": { + "content": "<|reserved_special_token_187|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128193": { + "content": "<|reserved_special_token_188|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128194": { + "content": "<|reserved_special_token_189|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128195": { + "content": "<|reserved_special_token_190|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128196": { + "content": "<|reserved_special_token_191|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128197": { + "content": "<|reserved_special_token_192|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128198": { + "content": "<|reserved_special_token_193|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128199": { + "content": "<|reserved_special_token_194|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128200": { + "content": "<|reserved_special_token_195|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128201": { + "content": "<|reserved_special_token_196|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128202": { + "content": "<|reserved_special_token_197|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128203": { + "content": "<|reserved_special_token_198|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128204": { + "content": "<|reserved_special_token_199|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128205": { + "content": "<|reserved_special_token_200|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128206": { + "content": "<|reserved_special_token_201|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128207": { + "content": "<|reserved_special_token_202|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128208": { + "content": "<|reserved_special_token_203|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128209": { + "content": "<|reserved_special_token_204|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128210": { + "content": "<|reserved_special_token_205|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128211": { + "content": "<|reserved_special_token_206|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128212": { + "content": "<|reserved_special_token_207|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128213": { + "content": "<|reserved_special_token_208|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128214": { + "content": "<|reserved_special_token_209|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128215": { + "content": "<|reserved_special_token_210|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128216": { + "content": "<|reserved_special_token_211|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128217": { + "content": "<|reserved_special_token_212|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128218": { + "content": "<|reserved_special_token_213|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128219": { + "content": "<|reserved_special_token_214|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128220": { + "content": "<|reserved_special_token_215|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128221": { + "content": "<|reserved_special_token_216|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128222": { + "content": "<|reserved_special_token_217|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128223": { + "content": "<|reserved_special_token_218|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128224": { + "content": "<|reserved_special_token_219|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128225": { + "content": "<|reserved_special_token_220|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128226": { + "content": "<|reserved_special_token_221|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128227": { + "content": "<|reserved_special_token_222|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128228": { + "content": "<|reserved_special_token_223|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128229": { + "content": "<|reserved_special_token_224|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128230": { + "content": "<|reserved_special_token_225|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128231": { + "content": "<|reserved_special_token_226|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128232": { + "content": "<|reserved_special_token_227|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128233": { + "content": "<|reserved_special_token_228|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128234": { + "content": "<|reserved_special_token_229|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128235": { + "content": "<|reserved_special_token_230|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128236": { + "content": "<|reserved_special_token_231|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128237": { + "content": "<|reserved_special_token_232|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128238": { + "content": "<|reserved_special_token_233|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128239": { + "content": "<|reserved_special_token_234|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128240": { + "content": "<|reserved_special_token_235|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128241": { + "content": "<|reserved_special_token_236|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128242": { + "content": "<|reserved_special_token_237|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128243": { + "content": "<|reserved_special_token_238|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128244": { + "content": "<|reserved_special_token_239|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128245": { + "content": "<|reserved_special_token_240|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128246": { + "content": "<|reserved_special_token_241|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128247": { + "content": "<|reserved_special_token_242|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128248": { + "content": "<|reserved_special_token_243|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128249": { + "content": "<|reserved_special_token_244|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128250": { + "content": "<|reserved_special_token_245|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128251": { + "content": "<|reserved_special_token_246|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128252": { + "content": "<|reserved_special_token_247|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128253": { + "content": "<|reserved_special_token_248|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128254": { + "content": "<|reserved_special_token_249|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + }, + "128255": { + "content": "<|reserved_special_token_250|>", + "lstrip": false, + "normalized": false, + "rstrip": false, + "single_word": false, + "special": true + } + }, + "bos_token": "<|begin_of_text|>", + "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{% if add_generation_prompt %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}{% endif %}", + "clean_up_tokenization_spaces": true, + "eos_token": "<|end_of_text|>", + "extra_special_tokens": {}, + "model_input_names": [ + "input_ids", + "attention_mask" + ], + "model_max_length": 2048, + "pad_token": "<|end_of_text|>", + "tokenizer_class": "PreTrainedTokenizer" +} diff --git a/train_results.json b/train_results.json new file mode 100644 index 0000000..d8bb97e --- /dev/null +++ b/train_results.json @@ -0,0 +1,9 @@ +{ + "epoch": 0.999244142101285, + "total_flos": 0.0, + "train_loss": 1.120150500454809, + "train_runtime": 1811.4729, + "train_samples": 42336, + "train_samples_per_second": 23.371, + "train_steps_per_second": 0.365 +} \ No newline at end of file diff --git a/trainer_state.json b/trainer_state.json new file mode 100644 index 0000000..57043ec --- /dev/null +++ b/trainer_state.json @@ -0,0 +1,2621 @@ +{ + "best_global_step": null, + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 0.999244142101285, + "eval_steps": 200, + "global_step": 661, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0015117157974300832, + "fcm_dpo/beta": 0.10000000149011612, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": -0.0013532638549804688, + "fcm_dpo/q_t": 0.5000336766242981, + "grad_norm": 28.21888542175293, + "learning_rate": 0.0, + "logits/chosen": 0.13337239623069763, + "logits/rejected": 0.12492948770523071, + "logps/chosen": -64.5841293334961, + "logps/ref_chosen": -64.61280822753906, + "logps/ref_rejected": -64.17195129394531, + "logps/rejected": -64.14192199707031, + "loss": 1.3866, + "margin_dpo/margin_mean": -0.0013527870178222656, + "margin_dpo/margin_std": 0.2561596930027008, + "step": 1 + }, + { + "epoch": 0.007558578987150416, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": -0.006315112113952637, + "fcm_dpo/q_t": 0.5001578330993652, + "grad_norm": 29.724584579467773, + "learning_rate": 2.9850746268656714e-08, + "logits/chosen": 0.09723952412605286, + "logits/rejected": 0.06879077106714249, + "logps/chosen": -65.34913635253906, + "logps/ref_chosen": -65.34695434570312, + "logps/ref_rejected": -79.315673828125, + "logps/rejected": -79.31153869628906, + "loss": 1.3872, + "margin_dpo/margin_mean": -0.006315216422080994, + "margin_dpo/margin_std": 0.2993292212486267, + "step": 5 + }, + { + "epoch": 0.015117157974300832, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": -0.013524067588150501, + "fcm_dpo/q_t": 0.500338077545166, + "grad_norm": 29.753292083740234, + "learning_rate": 6.71641791044776e-08, + "logits/chosen": 0.10936982929706573, + "logits/rejected": 0.07020524889230728, + "logps/chosen": -56.681053161621094, + "logps/ref_chosen": -56.65692901611328, + "logps/ref_rejected": -80.12786865234375, + "logps/rejected": -80.13846588134766, + "loss": 1.3879, + "margin_dpo/margin_mean": -0.013524264097213745, + "margin_dpo/margin_std": 0.3152056336402893, + "step": 10 + }, + { + "epoch": 0.022675736961451247, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.01606299914419651, + "fcm_dpo/q_t": 0.49959880113601685, + "grad_norm": 33.080528259277344, + "learning_rate": 1.044776119402985e-07, + "logits/chosen": 0.07683371752500534, + "logits/rejected": 0.04736438766121864, + "logps/chosen": -60.102806091308594, + "logps/ref_chosen": -60.09392166137695, + "logps/ref_rejected": -78.99056243896484, + "logps/rejected": -79.01551818847656, + "loss": 1.385, + "margin_dpo/margin_mean": 0.01606297492980957, + "margin_dpo/margin_std": 0.31872445344924927, + "step": 15 + }, + { + "epoch": 0.030234315948601664, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.045558154582977295, + "fcm_dpo/q_t": 0.498861163854599, + "grad_norm": 29.158737182617188, + "learning_rate": 1.4179104477611938e-07, + "logits/chosen": 0.0912957563996315, + "logits/rejected": 0.06395339965820312, + "logps/chosen": -55.449317932128906, + "logps/ref_chosen": -55.464561462402344, + "logps/ref_rejected": -77.40013122558594, + "logps/rejected": -77.43043518066406, + "loss": 1.382, + "margin_dpo/margin_mean": 0.04555808752775192, + "margin_dpo/margin_std": 0.29819026589393616, + "step": 20 + }, + { + "epoch": 0.03779289493575208, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": -0.004711696412414312, + "fcm_dpo/q_t": 0.5001178979873657, + "grad_norm": 29.72311782836914, + "learning_rate": 1.7910447761194027e-07, + "logits/chosen": 0.10293181240558624, + "logits/rejected": 0.07127834111452103, + "logps/chosen": -60.726539611816406, + "logps/ref_chosen": -60.711814880371094, + "logps/ref_rejected": -82.71756744384766, + "logps/rejected": -82.72756958007812, + "loss": 1.387, + "margin_dpo/margin_mean": -0.004711783025413752, + "margin_dpo/margin_std": 0.29338979721069336, + "step": 25 + }, + { + "epoch": 0.045351473922902494, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.011212587356567383, + "fcm_dpo/q_t": 0.4997197091579437, + "grad_norm": 30.495267868041992, + "learning_rate": 2.1641791044776117e-07, + "logits/chosen": 0.11331719160079956, + "logits/rejected": 0.088210329413414, + "logps/chosen": -60.893218994140625, + "logps/ref_chosen": -60.880210876464844, + "logps/ref_rejected": -78.44148254394531, + "logps/rejected": -78.4656982421875, + "loss": 1.3854, + "margin_dpo/margin_mean": 0.011212664656341076, + "margin_dpo/margin_std": 0.283229798078537, + "step": 30 + }, + { + "epoch": 0.05291005291005291, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.033431313931941986, + "fcm_dpo/q_t": 0.4991644322872162, + "grad_norm": 27.916645050048828, + "learning_rate": 2.537313432835821e-07, + "logits/chosen": 0.06567516177892685, + "logits/rejected": 0.03955943509936333, + "logps/chosen": -62.278358459472656, + "logps/ref_chosen": -62.248138427734375, + "logps/ref_rejected": -79.56475830078125, + "logps/rejected": -79.62838745117188, + "loss": 1.3832, + "margin_dpo/margin_mean": 0.03343154489994049, + "margin_dpo/margin_std": 0.3196953535079956, + "step": 35 + }, + { + "epoch": 0.06046863189720333, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.026270773261785507, + "fcm_dpo/q_t": 0.49934354424476624, + "grad_norm": 31.407669067382812, + "learning_rate": 2.9104477611940296e-07, + "logits/chosen": 0.1118750348687172, + "logits/rejected": 0.06694410741329193, + "logps/chosen": -58.9628791809082, + "logps/ref_chosen": -58.87812423706055, + "logps/ref_rejected": -84.22982025146484, + "logps/rejected": -84.34083557128906, + "loss": 1.384, + "margin_dpo/margin_mean": 0.026270756497979164, + "margin_dpo/margin_std": 0.32897505164146423, + "step": 40 + }, + { + "epoch": 0.06802721088435375, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.06596313416957855, + "fcm_dpo/q_t": 0.49835172295570374, + "grad_norm": 31.758451461791992, + "learning_rate": 3.2835820895522385e-07, + "logits/chosen": 0.07056122273206711, + "logits/rejected": 0.043311070650815964, + "logps/chosen": -66.0146713256836, + "logps/ref_chosen": -65.88298034667969, + "logps/ref_rejected": -83.87881469726562, + "logps/rejected": -84.07647705078125, + "loss": 1.3801, + "margin_dpo/margin_mean": 0.0659632533788681, + "margin_dpo/margin_std": 0.4093398153781891, + "step": 45 + }, + { + "epoch": 0.07558578987150416, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.11442438513040543, + "fcm_dpo/q_t": 0.4971412718296051, + "grad_norm": 27.961788177490234, + "learning_rate": 3.6567164179104475e-07, + "logits/chosen": 0.0864916443824768, + "logits/rejected": 0.052734147757291794, + "logps/chosen": -55.3635139465332, + "logps/ref_chosen": -55.172386169433594, + "logps/ref_rejected": -69.63300323486328, + "logps/rejected": -69.93855285644531, + "loss": 1.3753, + "margin_dpo/margin_mean": 0.11442458629608154, + "margin_dpo/margin_std": 0.4219285845756531, + "step": 50 + }, + { + "epoch": 0.08314436885865457, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.20081201195716858, + "fcm_dpo/q_t": 0.4949868321418762, + "grad_norm": 31.33340835571289, + "learning_rate": 4.0298507462686564e-07, + "logits/chosen": 0.07780580222606659, + "logits/rejected": 0.04163379222154617, + "logps/chosen": -57.531211853027344, + "logps/ref_chosen": -57.193580627441406, + "logps/ref_rejected": -79.69940948486328, + "logps/rejected": -80.23786926269531, + "loss": 1.3672, + "margin_dpo/margin_mean": 0.20081210136413574, + "margin_dpo/margin_std": 0.5645917057991028, + "step": 55 + }, + { + "epoch": 0.09070294784580499, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.21879427134990692, + "fcm_dpo/q_t": 0.4945460259914398, + "grad_norm": 29.641948699951172, + "learning_rate": 4.4029850746268654e-07, + "logits/chosen": 0.1170019656419754, + "logits/rejected": 0.0827331617474556, + "logps/chosen": -60.59779739379883, + "logps/ref_chosen": -60.068870544433594, + "logps/ref_rejected": -74.41178894042969, + "logps/rejected": -75.15950012207031, + "loss": 1.3662, + "margin_dpo/margin_mean": 0.2187943458557129, + "margin_dpo/margin_std": 0.7729828357696533, + "step": 60 + }, + { + "epoch": 0.0982615268329554, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.30554288625717163, + "fcm_dpo/q_t": 0.492379754781723, + "grad_norm": 30.804401397705078, + "learning_rate": 4.776119402985074e-07, + "logits/chosen": 0.14683708548545837, + "logits/rejected": 0.11651895940303802, + "logps/chosen": -58.885589599609375, + "logps/ref_chosen": -58.1558952331543, + "logps/ref_rejected": -76.06512451171875, + "logps/rejected": -77.1003646850586, + "loss": 1.3584, + "margin_dpo/margin_mean": 0.30554264783859253, + "margin_dpo/margin_std": 0.9574313163757324, + "step": 65 + }, + { + "epoch": 0.10582010582010581, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.4061034321784973, + "fcm_dpo/q_t": 0.4898872971534729, + "grad_norm": 28.625547409057617, + "learning_rate": 4.999860140229787e-07, + "logits/chosen": 0.10340998321771622, + "logits/rejected": 0.0681125819683075, + "logps/chosen": -68.41093444824219, + "logps/ref_chosen": -67.35506439208984, + "logps/ref_rejected": -82.24962615966797, + "logps/rejected": -83.71160125732422, + "loss": 1.3494, + "margin_dpo/margin_mean": 0.40610337257385254, + "margin_dpo/margin_std": 1.122269868850708, + "step": 70 + }, + { + "epoch": 0.11337868480725624, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.519697368144989, + "fcm_dpo/q_t": 0.48709648847579956, + "grad_norm": 26.1798095703125, + "learning_rate": 4.998286897523808e-07, + "logits/chosen": 0.11257852613925934, + "logits/rejected": 0.07697894424200058, + "logps/chosen": -58.29564666748047, + "logps/ref_chosen": -56.86763381958008, + "logps/ref_rejected": -72.56938934326172, + "logps/rejected": -74.51709747314453, + "loss": 1.3404, + "margin_dpo/margin_mean": 0.5196975469589233, + "margin_dpo/margin_std": 1.4106642007827759, + "step": 75 + }, + { + "epoch": 0.12093726379440665, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 0.6465596556663513, + "fcm_dpo/q_t": 0.48402470350265503, + "grad_norm": 28.485530853271484, + "learning_rate": 4.994966691179711e-07, + "logits/chosen": 0.14081288874149323, + "logits/rejected": 0.09565093368291855, + "logps/chosen": -59.448753356933594, + "logps/ref_chosen": -57.687095642089844, + "logps/ref_rejected": -78.06813049316406, + "logps/rejected": -80.4763412475586, + "loss": 1.3302, + "margin_dpo/margin_mean": 0.6465598344802856, + "margin_dpo/margin_std": 1.6814677715301514, + "step": 80 + }, + { + "epoch": 0.12849584278155707, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 1.0534989833831787, + "fcm_dpo/q_t": 0.4739624559879303, + "grad_norm": 26.71432876586914, + "learning_rate": 4.989901842900325e-07, + "logits/chosen": 0.16136503219604492, + "logits/rejected": 0.11435899883508682, + "logps/chosen": -59.10918426513672, + "logps/ref_chosen": -56.96040725708008, + "logps/ref_rejected": -75.22166442871094, + "logps/rejected": -78.42394256591797, + "loss": 1.2921, + "margin_dpo/margin_mean": 1.0534991025924683, + "margin_dpo/margin_std": 1.7913897037506104, + "step": 85 + }, + { + "epoch": 0.1360544217687075, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 1.108295202255249, + "fcm_dpo/q_t": 0.47283005714416504, + "grad_norm": 29.2835693359375, + "learning_rate": 4.983095894354857e-07, + "logits/chosen": 0.21447758376598358, + "logits/rejected": 0.1654311865568161, + "logps/chosen": -60.33354949951172, + "logps/ref_chosen": -57.41730499267578, + "logps/ref_rejected": -80.87986755371094, + "logps/rejected": -84.9044189453125, + "loss": 1.2951, + "margin_dpo/margin_mean": 1.1082954406738281, + "margin_dpo/margin_std": 2.5071663856506348, + "step": 90 + }, + { + "epoch": 0.1436130007558579, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 1.4385011196136475, + "fcm_dpo/q_t": 0.4653662145137787, + "grad_norm": 29.20956039428711, + "learning_rate": 4.974553604702332e-07, + "logits/chosen": 0.2017609179019928, + "logits/rejected": 0.15785647928714752, + "logps/chosen": -57.5848274230957, + "logps/ref_chosen": -54.08087158203125, + "logps/ref_rejected": -76.15860748291016, + "logps/rejected": -81.1010513305664, + "loss": 1.2755, + "margin_dpo/margin_mean": 1.4385008811950684, + "margin_dpo/margin_std": 3.3299403190612793, + "step": 95 + }, + { + "epoch": 0.15117157974300832, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 1.2202621698379517, + "fcm_dpo/q_t": 0.47157055139541626, + "grad_norm": 33.23603057861328, + "learning_rate": 4.964280947263676e-07, + "logits/chosen": 0.21698299050331116, + "logits/rejected": 0.184483140707016, + "logps/chosen": -68.64390563964844, + "logps/ref_chosen": -63.875038146972656, + "logps/ref_rejected": -82.077880859375, + "logps/rejected": -88.06700134277344, + "loss": 1.3233, + "margin_dpo/margin_mean": 1.220262050628662, + "margin_dpo/margin_std": 4.634930610656738, + "step": 100 + }, + { + "epoch": 0.15873015873015872, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 1.7332004308700562, + "fcm_dpo/q_t": 0.46054258942604065, + "grad_norm": 30.745962142944336, + "learning_rate": 4.952285105344791e-07, + "logits/chosen": 0.2272680103778839, + "logits/rejected": 0.17643623054027557, + "logps/chosen": -67.46278381347656, + "logps/ref_chosen": -62.572479248046875, + "logps/ref_rejected": -80.93415069580078, + "logps/rejected": -87.5576400756836, + "loss": 1.2811, + "margin_dpo/margin_mean": 1.7332004308700562, + "margin_dpo/margin_std": 4.913107872009277, + "step": 105 + }, + { + "epoch": 0.16628873771730915, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 1.5242812633514404, + "fcm_dpo/q_t": 0.46426910161972046, + "grad_norm": 44.22966003417969, + "learning_rate": 4.938574467213517e-07, + "logits/chosen": 0.19085553288459778, + "logits/rejected": 0.16806969046592712, + "logps/chosen": -74.31179809570312, + "logps/ref_chosen": -68.67534637451172, + "logps/ref_rejected": -78.82028198242188, + "logps/rejected": -85.98100280761719, + "loss": 1.3145, + "margin_dpo/margin_mean": 1.5242810249328613, + "margin_dpo/margin_std": 5.536143779754639, + "step": 110 + }, + { + "epoch": 0.17384731670445955, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 2.013551712036133, + "fcm_dpo/q_t": 0.452955424785614, + "grad_norm": 28.415409088134766, + "learning_rate": 4.923158620234019e-07, + "logits/chosen": 0.23339705169200897, + "logits/rejected": 0.18038101494312286, + "logps/chosen": -64.06039428710938, + "logps/ref_chosen": -58.65370559692383, + "logps/ref_rejected": -81.89688873291016, + "logps/rejected": -89.31713104248047, + "loss": 1.2498, + "margin_dpo/margin_mean": 2.013551712036133, + "margin_dpo/margin_std": 4.735473155975342, + "step": 115 + }, + { + "epoch": 0.18140589569160998, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 2.4133291244506836, + "fcm_dpo/q_t": 0.44279351830482483, + "grad_norm": 28.7838191986084, + "learning_rate": 4.906048344162676e-07, + "logits/chosen": 0.24171380698680878, + "logits/rejected": 0.19227424263954163, + "logps/chosen": -61.56781768798828, + "logps/ref_chosen": -56.16423797607422, + "logps/ref_rejected": -75.87689971923828, + "logps/rejected": -83.69380187988281, + "loss": 1.2069, + "margin_dpo/margin_mean": 2.4133291244506836, + "margin_dpo/margin_std": 4.3148322105407715, + "step": 120 + }, + { + "epoch": 0.1889644746787604, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 3.0360968112945557, + "fcm_dpo/q_t": 0.4307987093925476, + "grad_norm": 29.158105850219727, + "learning_rate": 4.887255603610184e-07, + "logits/chosen": 0.2693176865577698, + "logits/rejected": 0.21195952594280243, + "logps/chosen": -66.05271911621094, + "logps/ref_chosen": -59.744285583496094, + "logps/ref_rejected": -86.77314758300781, + "logps/rejected": -96.11767578125, + "loss": 1.1645, + "margin_dpo/margin_mean": 3.0360968112945557, + "margin_dpo/margin_std": 5.009610652923584, + "step": 125 + }, + { + "epoch": 0.1965230536659108, + "fcm_dpo/beta": 0.10000000894069672, + "fcm_dpo/delta": 0.0, + "fcm_dpo/margin": 2.8338823318481445, + "fcm_dpo/q_t": 0.43448346853256226, + "grad_norm": 30.431678771972656, + "learning_rate": 4.866793539675126e-07, + "logits/chosen": 0.20911665260791779, + "logits/rejected": 0.17860978841781616, + "logps/chosen": -71.53947448730469, + "logps/ref_chosen": -64.15296936035156, + "logps/ref_rejected": -75.17271423339844, + "logps/rejected": -85.3930892944336, + "loss": 1.1921, + "margin_dpo/margin_mean": 2.8338828086853027, + "margin_dpo/margin_std": 5.266488075256348, + "step": 130 + }, + { + "epoch": 0.20408163265306123, + "fcm_dpo/beta": 0.10191638767719269, + "fcm_dpo/delta": 0.031610384583473206, + "fcm_dpo/margin": 3.762406826019287, + "fcm_dpo/q_t": 0.4133889079093933, + "grad_norm": 26.239471435546875, + "learning_rate": 4.844676460754862e-07, + "logits/chosen": 0.25873705744743347, + "logits/rejected": 0.21873533725738525, + "logps/chosen": -65.23578643798828, + "logps/ref_chosen": -57.006690979003906, + "logps/ref_rejected": -73.71768188476562, + "logps/rejected": -85.70919036865234, + "loss": 1.1276, + "margin_dpo/margin_mean": 3.76240611076355, + "margin_dpo/margin_std": 5.971688270568848, + "step": 135 + }, + { + "epoch": 0.21164021164021163, + "fcm_dpo/beta": 0.10494687408208847, + "fcm_dpo/delta": 0.025396008044481277, + "fcm_dpo/margin": 4.405590534210205, + "fcm_dpo/q_t": 0.3999941945075989, + "grad_norm": 33.757999420166016, + "learning_rate": 4.820919832540181e-07, + "logits/chosen": 0.24625614285469055, + "logits/rejected": 0.2025199830532074, + "logps/chosen": -74.15595245361328, + "logps/ref_chosen": -63.36246871948242, + "logps/ref_rejected": -79.62621307373047, + "logps/rejected": -94.8252944946289, + "loss": 1.1183, + "margin_dpo/margin_mean": 4.405590534210205, + "margin_dpo/margin_std": 7.449770927429199, + "step": 140 + }, + { + "epoch": 0.21919879062736206, + "fcm_dpo/beta": 0.10641102492809296, + "fcm_dpo/delta": 0.022974295541644096, + "fcm_dpo/margin": 4.693943977355957, + "fcm_dpo/q_t": 0.395569384098053, + "grad_norm": 38.00341033935547, + "learning_rate": 4.795540267200686e-07, + "logits/chosen": 0.2727429270744324, + "logits/rejected": 0.2512747049331665, + "logps/chosen": -77.23705291748047, + "logps/ref_chosen": -65.01470184326172, + "logps/ref_rejected": -80.49073791503906, + "logps/rejected": -97.40702819824219, + "loss": 1.1399, + "margin_dpo/margin_mean": 4.693943977355957, + "margin_dpo/margin_std": 8.747485160827637, + "step": 145 + }, + { + "epoch": 0.22675736961451248, + "fcm_dpo/beta": 0.10816685855388641, + "fcm_dpo/delta": -0.04916912317276001, + "fcm_dpo/margin": 5.7198591232299805, + "fcm_dpo/q_t": 0.3732493221759796, + "grad_norm": 28.534120559692383, + "learning_rate": 4.768555511768486e-07, + "logits/chosen": 0.28103944659233093, + "logits/rejected": 0.2354610413312912, + "logps/chosen": -71.84245300292969, + "logps/ref_chosen": -59.19135284423828, + "logps/ref_rejected": -74.0339126586914, + "logps/rejected": -92.40486145019531, + "loss": 1.0549, + "margin_dpo/margin_mean": 5.7198591232299805, + "margin_dpo/margin_std": 8.658864974975586, + "step": 150 + }, + { + "epoch": 0.23431594860166288, + "fcm_dpo/beta": 0.09626957774162292, + "fcm_dpo/delta": -0.08038349449634552, + "fcm_dpo/margin": 6.609867095947266, + "fcm_dpo/q_t": 0.36982256174087524, + "grad_norm": 29.370683670043945, + "learning_rate": 4.7399844357283393e-07, + "logits/chosen": 0.29301148653030396, + "logits/rejected": 0.25923386216163635, + "logps/chosen": -73.53243255615234, + "logps/ref_chosen": -60.93949508666992, + "logps/ref_rejected": -74.51151275634766, + "logps/rejected": -93.71430969238281, + "loss": 1.0523, + "margin_dpo/margin_mean": 6.609866142272949, + "margin_dpo/margin_std": 10.054447174072266, + "step": 155 + }, + { + "epoch": 0.2418745275888133, + "fcm_dpo/beta": 0.08975216001272202, + "fcm_dpo/delta": -0.07737629860639572, + "fcm_dpo/margin": 7.146323204040527, + "fcm_dpo/q_t": 0.36957624554634094, + "grad_norm": 26.117460250854492, + "learning_rate": 4.7098470178228755e-07, + "logits/chosen": 0.2661024034023285, + "logits/rejected": 0.22873857617378235, + "logps/chosen": -72.47210693359375, + "logps/ref_chosen": -58.763816833496094, + "logps/ref_rejected": -74.94743347167969, + "logps/rejected": -95.80204010009766, + "loss": 1.0421, + "margin_dpo/margin_mean": 7.146323204040527, + "margin_dpo/margin_std": 10.654400825500488, + "step": 160 + }, + { + "epoch": 0.2494331065759637, + "fcm_dpo/beta": 0.08210185170173645, + "fcm_dpo/delta": -0.13484172523021698, + "fcm_dpo/margin": 8.718481063842773, + "fcm_dpo/q_t": 0.3526487350463867, + "grad_norm": 23.741703033447266, + "learning_rate": 4.678164332082175e-07, + "logits/chosen": 0.3242879807949066, + "logits/rejected": 0.2718299329280853, + "logps/chosen": -70.94097900390625, + "logps/ref_chosen": -55.70417022705078, + "logps/ref_rejected": -76.59439849853516, + "logps/rejected": -100.54969024658203, + "loss": 0.9977, + "margin_dpo/margin_mean": 8.718481063842773, + "margin_dpo/margin_std": 11.619240760803223, + "step": 165 + }, + { + "epoch": 0.25699168556311414, + "fcm_dpo/beta": 0.07538954168558121, + "fcm_dpo/delta": -0.042643819004297256, + "fcm_dpo/margin": 8.284780502319336, + "fcm_dpo/q_t": 0.3727918565273285, + "grad_norm": 21.66844367980957, + "learning_rate": 4.6449585330874425e-07, + "logits/chosen": 0.2913161516189575, + "logits/rejected": 0.2505802512168884, + "logps/chosen": -75.16352081298828, + "logps/ref_chosen": -61.169105529785156, + "logps/ref_rejected": -77.21674346923828, + "logps/rejected": -99.49595642089844, + "loss": 1.0435, + "margin_dpo/margin_mean": 8.284780502319336, + "margin_dpo/margin_std": 12.27697467803955, + "step": 170 + }, + { + "epoch": 0.26455026455026454, + "fcm_dpo/beta": 0.06802255660295486, + "fcm_dpo/delta": -0.13938404619693756, + "fcm_dpo/margin": 9.97547721862793, + "fcm_dpo/q_t": 0.3644518256187439, + "grad_norm": 21.26988983154297, + "learning_rate": 4.6102528404790965e-07, + "logits/chosen": 0.34859341382980347, + "logits/rejected": 0.2882172167301178, + "logps/chosen": -73.75447082519531, + "logps/ref_chosen": -59.24176788330078, + "logps/ref_rejected": -81.80384826660156, + "logps/rejected": -106.2920150756836, + "loss": 1.0468, + "margin_dpo/margin_mean": 9.97547721862793, + "margin_dpo/margin_std": 15.061019897460938, + "step": 175 + }, + { + "epoch": 0.272108843537415, + "fcm_dpo/beta": 0.060754068195819855, + "fcm_dpo/delta": -0.07431790977716446, + "fcm_dpo/margin": 9.864774703979492, + "fcm_dpo/q_t": 0.37669187784194946, + "grad_norm": 20.148046493530273, + "learning_rate": 4.5740715227200897e-07, + "logits/chosen": 0.3143027424812317, + "logits/rejected": 0.27188676595687866, + "logps/chosen": -77.92072296142578, + "logps/ref_chosen": -63.24883270263672, + "logps/ref_rejected": -79.00736236572266, + "logps/rejected": -103.54402923583984, + "loss": 1.0681, + "margin_dpo/margin_mean": 9.864773750305176, + "margin_dpo/margin_std": 15.329916000366211, + "step": 180 + }, + { + "epoch": 0.2796674225245654, + "fcm_dpo/beta": 0.05635453015565872, + "fcm_dpo/delta": -0.08090370148420334, + "fcm_dpo/margin": 10.306377410888672, + "fcm_dpo/q_t": 0.37912043929100037, + "grad_norm": 18.77512550354004, + "learning_rate": 4.5364398801258394e-07, + "logits/chosen": 0.36532798409461975, + "logits/rejected": 0.31204718351364136, + "logps/chosen": -70.10028076171875, + "logps/ref_chosen": -56.390625, + "logps/ref_rejected": -76.81001281738281, + "logps/rejected": -100.82603454589844, + "loss": 1.0654, + "margin_dpo/margin_mean": 10.306377410888672, + "margin_dpo/margin_std": 15.676936149597168, + "step": 185 + }, + { + "epoch": 0.2872260015117158, + "fcm_dpo/beta": 0.053449880331754684, + "fcm_dpo/delta": -0.07286106050014496, + "fcm_dpo/margin": 12.053500175476074, + "fcm_dpo/q_t": 0.36934491991996765, + "grad_norm": 25.36161231994629, + "learning_rate": 4.4973842271726024e-07, + "logits/chosen": 0.35614460706710815, + "logits/rejected": 0.30015695095062256, + "logps/chosen": -81.80848693847656, + "logps/ref_chosen": -68.25389099121094, + "logps/ref_rejected": -86.461181640625, + "logps/rejected": -112.06925964355469, + "loss": 1.0366, + "margin_dpo/margin_mean": 12.05350112915039, + "margin_dpo/margin_std": 17.739303588867188, + "step": 190 + }, + { + "epoch": 0.2947845804988662, + "fcm_dpo/beta": 0.05007879063487053, + "fcm_dpo/delta": -0.04965587332844734, + "fcm_dpo/margin": 11.500941276550293, + "fcm_dpo/q_t": 0.3801359236240387, + "grad_norm": 21.779829025268555, + "learning_rate": 4.4569318740967043e-07, + "logits/chosen": 0.38067522644996643, + "logits/rejected": 0.35913893580436707, + "logps/chosen": -79.82146453857422, + "logps/ref_chosen": -62.1484260559082, + "logps/ref_rejected": -71.33458709716797, + "logps/rejected": -100.50856018066406, + "loss": 1.0743, + "margin_dpo/margin_mean": 11.50094223022461, + "margin_dpo/margin_std": 17.975563049316406, + "step": 195 + }, + { + "epoch": 0.30234315948601664, + "fcm_dpo/beta": 0.04691356047987938, + "fcm_dpo/delta": -0.08742973953485489, + "fcm_dpo/margin": 13.574827194213867, + "fcm_dpo/q_t": 0.36781007051467896, + "grad_norm": 18.177783966064453, + "learning_rate": 4.415111107797445e-07, + "logits/chosen": 0.4625890851020813, + "logits/rejected": 0.39986932277679443, + "logps/chosen": -75.27424621582031, + "logps/ref_chosen": -56.950096130371094, + "logps/ref_rejected": -78.66989135742188, + "logps/rejected": -110.5688705444336, + "loss": 1.0505, + "margin_dpo/margin_mean": 13.574827194213867, + "margin_dpo/margin_std": 20.146961212158203, + "step": 200 + }, + { + "epoch": 0.30234315948601664, + "eval_fcm_dpo/beta": 0.0445309579372406, + "eval_logits/chosen": 0.43528974056243896, + "eval_logits/rejected": 0.3850432336330414, + "eval_logps/chosen": -94.9354248046875, + "eval_logps/ref_chosen": -74.85946655273438, + "eval_logps/ref_rejected": -79.54898834228516, + "eval_logps/rejected": -112.46160888671875, + "eval_loss": 0.5490387678146362, + "eval_margin_dpo/margin_mean": 12.836673736572266, + "eval_margin_dpo/margin_std": 21.53274154663086, + "eval_runtime": 39.0577, + "eval_samples_per_second": 58.964, + "eval_steps_per_second": 1.843, + "step": 200 + }, + { + "epoch": 0.30990173847316704, + "fcm_dpo/beta": 0.043045125901699066, + "fcm_dpo/delta": -0.05937931686639786, + "fcm_dpo/margin": 14.329627990722656, + "fcm_dpo/q_t": 0.3726270794868469, + "grad_norm": 24.482276916503906, + "learning_rate": 4.3719511720570814e-07, + "logits/chosen": 0.4526013731956482, + "logits/rejected": 0.3818688988685608, + "logps/chosen": -80.59419250488281, + "logps/ref_chosen": -57.99428176879883, + "logps/ref_rejected": -83.5367431640625, + "logps/rejected": -120.4662857055664, + "loss": 1.0519, + "margin_dpo/margin_mean": 14.329629898071289, + "margin_dpo/margin_std": 21.601360321044922, + "step": 205 + }, + { + "epoch": 0.31746031746031744, + "fcm_dpo/beta": 0.04131709039211273, + "fcm_dpo/delta": -0.05793388932943344, + "fcm_dpo/margin": 13.949444770812988, + "fcm_dpo/q_t": 0.3844899535179138, + "grad_norm": 19.35005760192871, + "learning_rate": 4.327482247091679e-07, + "logits/chosen": 0.4452959895133972, + "logits/rejected": 0.39058345556259155, + "logps/chosen": -90.13018798828125, + "logps/ref_chosen": -63.77195358276367, + "logps/ref_rejected": -82.56491088867188, + "logps/rejected": -122.87260437011719, + "loss": 1.1108, + "margin_dpo/margin_mean": 13.949444770812988, + "margin_dpo/margin_std": 24.073421478271484, + "step": 210 + }, + { + "epoch": 0.3250188964474679, + "fcm_dpo/beta": 0.03761471435427666, + "fcm_dpo/delta": -0.12060566991567612, + "fcm_dpo/margin": 18.96577262878418, + "fcm_dpo/q_t": 0.35724228620529175, + "grad_norm": 18.37898826599121, + "learning_rate": 4.281735428447157e-07, + "logits/chosen": 0.4427056908607483, + "logits/rejected": 0.37563619017601013, + "logps/chosen": -84.36368560791016, + "logps/ref_chosen": -60.27800750732422, + "logps/ref_rejected": -83.91607666015625, + "logps/rejected": -126.96754455566406, + "loss": 1.002, + "margin_dpo/margin_mean": 18.965770721435547, + "margin_dpo/margin_std": 26.138744354248047, + "step": 215 + }, + { + "epoch": 0.3325774754346183, + "fcm_dpo/beta": 0.033143509179353714, + "fcm_dpo/delta": -0.07818768918514252, + "fcm_dpo/margin": 18.13027000427246, + "fcm_dpo/q_t": 0.37564554810523987, + "grad_norm": 17.499849319458008, + "learning_rate": 4.234742705255272e-07, + "logits/chosen": 0.4456612169742584, + "logits/rejected": 0.38407641649246216, + "logps/chosen": -88.01606750488281, + "logps/ref_chosen": -60.88572311401367, + "logps/ref_rejected": -80.1805191040039, + "logps/rejected": -125.44112396240234, + "loss": 1.0594, + "margin_dpo/margin_mean": 18.13027000427246, + "margin_dpo/margin_std": 27.581802368164062, + "step": 220 + }, + { + "epoch": 0.3401360544217687, + "fcm_dpo/beta": 0.030816316604614258, + "fcm_dpo/delta": -0.08487220108509064, + "fcm_dpo/margin": 20.55803871154785, + "fcm_dpo/q_t": 0.37105461955070496, + "grad_norm": 17.931140899658203, + "learning_rate": 4.186536937864752e-07, + "logits/chosen": 0.511905312538147, + "logits/rejected": 0.43826180696487427, + "logps/chosen": -89.73455047607422, + "logps/ref_chosen": -61.02507781982422, + "logps/ref_rejected": -91.92439270019531, + "logps/rejected": -141.19189453125, + "loss": 1.0315, + "margin_dpo/margin_mean": 20.55803680419922, + "margin_dpo/margin_std": 29.531564712524414, + "step": 225 + }, + { + "epoch": 0.3476946334089191, + "fcm_dpo/beta": 0.030043313279747963, + "fcm_dpo/delta": -0.015888774767518044, + "fcm_dpo/margin": 19.927255630493164, + "fcm_dpo/q_t": 0.3782123029232025, + "grad_norm": 17.704288482666016, + "learning_rate": 4.137151834863213e-07, + "logits/chosen": 0.567510724067688, + "logits/rejected": 0.5179559588432312, + "logps/chosen": -85.0999984741211, + "logps/ref_chosen": -54.49797821044922, + "logps/ref_rejected": -71.96363830566406, + "logps/rejected": -122.492919921875, + "loss": 1.0889, + "margin_dpo/margin_mean": 19.927255630493164, + "margin_dpo/margin_std": 33.03584671020508, + "step": 230 + }, + { + "epoch": 0.35525321239606955, + "fcm_dpo/beta": 0.02700546756386757, + "fcm_dpo/delta": -0.13411830365657806, + "fcm_dpo/margin": 23.45638656616211, + "fcm_dpo/q_t": 0.36994558572769165, + "grad_norm": 16.464786529541016, + "learning_rate": 4.08662192950594e-07, + "logits/chosen": 0.5007590055465698, + "logits/rejected": 0.4768039286136627, + "logps/chosen": -99.23008728027344, + "logps/ref_chosen": -63.250282287597656, + "logps/ref_rejected": -73.09049987792969, + "logps/rejected": -132.5266876220703, + "loss": 1.0474, + "margin_dpo/margin_mean": 23.456384658813477, + "margin_dpo/margin_std": 33.97542190551758, + "step": 235 + }, + { + "epoch": 0.36281179138321995, + "fcm_dpo/beta": 0.024938663467764854, + "fcm_dpo/delta": -0.08994299918413162, + "fcm_dpo/margin": 27.00982666015625, + "fcm_dpo/q_t": 0.3612818121910095, + "grad_norm": 14.642565727233887, + "learning_rate": 4.0349825555680045e-07, + "logits/chosen": 0.561758279800415, + "logits/rejected": 0.5071486234664917, + "logps/chosen": -108.31246185302734, + "logps/ref_chosen": -65.26150512695312, + "logps/ref_rejected": -87.60311126708984, + "logps/rejected": -157.66390991210938, + "loss": 1.0195, + "margin_dpo/margin_mean": 27.00982666015625, + "margin_dpo/margin_std": 37.65082550048828, + "step": 240 + }, + { + "epoch": 0.37037037037037035, + "fcm_dpo/beta": 0.02278234250843525, + "fcm_dpo/delta": -0.10555760562419891, + "fcm_dpo/margin": 30.133275985717773, + "fcm_dpo/q_t": 0.3576427102088928, + "grad_norm": 15.980971336364746, + "learning_rate": 3.982269822636601e-07, + "logits/chosen": 0.5394655466079712, + "logits/rejected": 0.5064207911491394, + "logps/chosen": -108.2628173828125, + "logps/ref_chosen": -65.73170471191406, + "logps/ref_rejected": -75.19642639160156, + "logps/rejected": -147.86080932617188, + "loss": 0.9861, + "margin_dpo/margin_mean": 30.133275985717773, + "margin_dpo/margin_std": 38.397438049316406, + "step": 245 + }, + { + "epoch": 0.3779289493575208, + "fcm_dpo/beta": 0.0209406279027462, + "fcm_dpo/delta": -0.029252177104353905, + "fcm_dpo/margin": 25.17742347717285, + "fcm_dpo/q_t": 0.39082691073417664, + "grad_norm": 18.229862213134766, + "learning_rate": 3.9285205908608934e-07, + "logits/chosen": 0.599532961845398, + "logits/rejected": 0.5946930050849915, + "logps/chosen": -126.43806457519531, + "logps/ref_chosen": -70.71224212646484, + "logps/ref_rejected": -76.12723541259766, + "logps/rejected": -157.03048706054688, + "loss": 1.1321, + "margin_dpo/margin_mean": 25.17742347717285, + "margin_dpo/margin_std": 44.761314392089844, + "step": 250 + }, + { + "epoch": 0.3854875283446712, + "fcm_dpo/beta": 0.02031904086470604, + "fcm_dpo/delta": -0.02309424616396427, + "fcm_dpo/margin": 24.082748413085938, + "fcm_dpo/q_t": 0.3976757824420929, + "grad_norm": 18.887149810791016, + "learning_rate": 3.873772445177015e-07, + "logits/chosen": 0.609887957572937, + "logits/rejected": 0.5647954940795898, + "logps/chosen": -117.80338287353516, + "logps/ref_chosen": -61.767662048339844, + "logps/ref_rejected": -77.38813018798828, + "logps/rejected": -157.50662231445312, + "loss": 1.1377, + "margin_dpo/margin_mean": 24.082748413085938, + "margin_dpo/margin_std": 43.56954574584961, + "step": 255 + }, + { + "epoch": 0.3930461073318216, + "fcm_dpo/beta": 0.019356101751327515, + "fcm_dpo/delta": -0.06188065558671951, + "fcm_dpo/margin": 33.2767448425293, + "fcm_dpo/q_t": 0.3668089807033539, + "grad_norm": 19.52748680114746, + "learning_rate": 3.818063669026256e-07, + "logits/chosen": 0.585278332233429, + "logits/rejected": 0.5075653195381165, + "logps/chosen": -119.7823486328125, + "logps/ref_chosen": -61.57584762573242, + "logps/ref_rejected": -91.87513732910156, + "logps/rejected": -183.35836791992188, + "loss": 1.0274, + "margin_dpo/margin_mean": 33.2767448425293, + "margin_dpo/margin_std": 47.10149002075195, + "step": 260 + }, + { + "epoch": 0.40060468631897206, + "fcm_dpo/beta": 0.019167505204677582, + "fcm_dpo/delta": 0.02147207036614418, + "fcm_dpo/margin": 28.888378143310547, + "fcm_dpo/q_t": 0.38470879197120667, + "grad_norm": 16.250465393066406, + "learning_rate": 3.7614332175848027e-07, + "logits/chosen": 0.5632354021072388, + "logits/rejected": 0.5125952959060669, + "logps/chosen": -119.10379791259766, + "logps/ref_chosen": -65.75422668457031, + "logps/ref_rejected": -77.9569320678711, + "logps/rejected": -160.19488525390625, + "loss": 1.082, + "margin_dpo/margin_mean": 28.888378143310547, + "margin_dpo/margin_std": 46.08098602294922, + "step": 265 + }, + { + "epoch": 0.40816326530612246, + "fcm_dpo/beta": 0.018922636285424232, + "fcm_dpo/delta": -0.03335314989089966, + "fcm_dpo/margin": 29.144763946533203, + "fcm_dpo/q_t": 0.3839413523674011, + "grad_norm": 16.50005531311035, + "learning_rate": 3.7039206905237656e-07, + "logits/chosen": 0.6007962226867676, + "logits/rejected": 0.5515360236167908, + "logps/chosen": -110.72042083740234, + "logps/ref_chosen": -62.27649688720703, + "logps/ref_rejected": -76.56950378417969, + "logps/rejected": -154.158203125, + "loss": 1.0747, + "margin_dpo/margin_mean": 29.144763946533203, + "margin_dpo/margin_std": 44.99258804321289, + "step": 270 + }, + { + "epoch": 0.41572184429327286, + "fcm_dpo/beta": 0.018402384594082832, + "fcm_dpo/delta": -0.021868888288736343, + "fcm_dpo/margin": 32.19723129272461, + "fcm_dpo/q_t": 0.37771254777908325, + "grad_norm": 16.371837615966797, + "learning_rate": 3.645566304318526e-07, + "logits/chosen": 0.5913391709327698, + "logits/rejected": 0.5466698408126831, + "logps/chosen": -113.94535827636719, + "logps/ref_chosen": -61.854393005371094, + "logps/ref_rejected": -77.22246551513672, + "logps/rejected": -161.51065063476562, + "loss": 1.0643, + "margin_dpo/margin_mean": 32.197235107421875, + "margin_dpo/margin_std": 49.30824279785156, + "step": 275 + }, + { + "epoch": 0.42328042328042326, + "fcm_dpo/beta": 0.01777859404683113, + "fcm_dpo/delta": -0.08700723201036453, + "fcm_dpo/margin": 34.64583206176758, + "fcm_dpo/q_t": 0.3692876696586609, + "grad_norm": 15.50888729095459, + "learning_rate": 3.586410864126781e-07, + "logits/chosen": 0.593945324420929, + "logits/rejected": 0.5639765858650208, + "logps/chosen": -114.51588439941406, + "logps/ref_chosen": -61.29896926879883, + "logps/ref_rejected": -73.35762023925781, + "logps/rejected": -161.22035217285156, + "loss": 1.0139, + "margin_dpo/margin_mean": 34.64583206176758, + "margin_dpo/margin_std": 45.06488800048828, + "step": 280 + }, + { + "epoch": 0.4308390022675737, + "fcm_dpo/beta": 0.016293346881866455, + "fcm_dpo/delta": -0.030563678592443466, + "fcm_dpo/margin": 35.089866638183594, + "fcm_dpo/q_t": 0.37944841384887695, + "grad_norm": 18.91819190979004, + "learning_rate": 3.5264957352549375e-07, + "logits/chosen": 0.6056411862373352, + "logits/rejected": 0.5613064765930176, + "logps/chosen": -125.51373291015625, + "logps/ref_chosen": -63.435462951660156, + "logps/ref_rejected": -79.73661804199219, + "logps/rejected": -176.90478515625, + "loss": 1.0488, + "margin_dpo/margin_mean": 35.089866638183594, + "margin_dpo/margin_std": 50.59145736694336, + "step": 285 + }, + { + "epoch": 0.4383975812547241, + "fcm_dpo/beta": 0.015350925736129284, + "fcm_dpo/delta": -0.06803837418556213, + "fcm_dpo/margin": 40.154258728027344, + "fcm_dpo/q_t": 0.36974334716796875, + "grad_norm": 18.484561920166016, + "learning_rate": 3.465862814232821e-07, + "logits/chosen": 0.6393694877624512, + "logits/rejected": 0.5767431855201721, + "logps/chosen": -128.746337890625, + "logps/ref_chosen": -57.696876525878906, + "logps/ref_rejected": -79.78132629394531, + "logps/rejected": -190.9850616455078, + "loss": 1.0121, + "margin_dpo/margin_mean": 40.154258728027344, + "margin_dpo/margin_std": 53.58546829223633, + "step": 290 + }, + { + "epoch": 0.4459561602418745, + "fcm_dpo/beta": 0.014825056307017803, + "fcm_dpo/delta": -0.02245759218931198, + "fcm_dpo/margin": 38.19078063964844, + "fcm_dpo/q_t": 0.3817628026008606, + "grad_norm": 19.01740074157715, + "learning_rate": 3.4045544995169125e-07, + "logits/chosen": 0.7111937999725342, + "logits/rejected": 0.6355310678482056, + "logps/chosen": -135.02879333496094, + "logps/ref_chosen": -55.430633544921875, + "logps/ref_rejected": -78.1390151977539, + "logps/rejected": -195.927978515625, + "loss": 1.0571, + "margin_dpo/margin_mean": 38.19078826904297, + "margin_dpo/margin_std": 56.477027893066406, + "step": 295 + }, + { + "epoch": 0.45351473922902497, + "fcm_dpo/beta": 0.015004401095211506, + "fcm_dpo/delta": 0.03381625562906265, + "fcm_dpo/margin": 34.913299560546875, + "fcm_dpo/q_t": 0.39039894938468933, + "grad_norm": 16.89678955078125, + "learning_rate": 3.3426136618426043e-07, + "logits/chosen": 0.6468077898025513, + "logits/rejected": 0.5938016176223755, + "logps/chosen": -149.64816284179688, + "logps/ref_chosen": -61.207069396972656, + "logps/ref_rejected": -75.23294067382812, + "logps/rejected": -198.58737182617188, + "loss": 1.0995, + "margin_dpo/margin_mean": 34.913299560546875, + "margin_dpo/margin_std": 57.363426208496094, + "step": 300 + }, + { + "epoch": 0.46107331821617537, + "fcm_dpo/beta": 0.015164652839303017, + "fcm_dpo/delta": -0.027595514431595802, + "fcm_dpo/margin": 34.962440490722656, + "fcm_dpo/q_t": 0.38818344473838806, + "grad_norm": 17.029956817626953, + "learning_rate": 3.280083614246217e-07, + "logits/chosen": 0.6154987812042236, + "logits/rejected": 0.578453540802002, + "logps/chosen": -147.16146850585938, + "logps/ref_chosen": -63.06663131713867, + "logps/ref_rejected": -78.45845031738281, + "logps/rejected": -197.51571655273438, + "loss": 1.0998, + "margin_dpo/margin_mean": 34.96243667602539, + "margin_dpo/margin_std": 57.51310348510742, + "step": 305 + }, + { + "epoch": 0.46863189720332576, + "fcm_dpo/beta": 0.014774846844375134, + "fcm_dpo/delta": -0.008402171544730663, + "fcm_dpo/margin": 27.70456886291504, + "fcm_dpo/q_t": 0.41280922293663025, + "grad_norm": 15.905935287475586, + "learning_rate": 3.2170080817777257e-07, + "logits/chosen": 0.6693840622901917, + "logits/rejected": 0.619363009929657, + "logps/chosen": -142.225341796875, + "logps/ref_chosen": -63.60908889770508, + "logps/ref_rejected": -74.06394958496094, + "logps/rejected": -180.38479614257812, + "loss": 1.1676, + "margin_dpo/margin_mean": 27.70456886291504, + "margin_dpo/margin_std": 53.79878616333008, + "step": 310 + }, + { + "epoch": 0.47619047619047616, + "fcm_dpo/beta": 0.014566788449883461, + "fcm_dpo/delta": -0.02135154977440834, + "fcm_dpo/margin": 35.78001403808594, + "fcm_dpo/q_t": 0.38799604773521423, + "grad_norm": 13.580395698547363, + "learning_rate": 3.1534311709253723e-07, + "logits/chosen": 0.6421744227409363, + "logits/rejected": 0.5867301225662231, + "logps/chosen": -130.10659790039062, + "logps/ref_chosen": -62.31493377685547, + "logps/ref_rejected": -75.07472229003906, + "logps/rejected": -178.64637756347656, + "loss": 1.0606, + "margin_dpo/margin_mean": 35.78001403808594, + "margin_dpo/margin_std": 51.48203659057617, + "step": 315 + }, + { + "epoch": 0.4837490551776266, + "fcm_dpo/beta": 0.013901944272220135, + "fcm_dpo/delta": -0.061062753200531006, + "fcm_dpo/margin": 40.63452911376953, + "fcm_dpo/q_t": 0.3800038993358612, + "grad_norm": 15.753009796142578, + "learning_rate": 3.0893973387735683e-07, + "logits/chosen": 0.587223470211029, + "logits/rejected": 0.524192214012146, + "logps/chosen": -118.84355163574219, + "logps/ref_chosen": -55.336036682128906, + "logps/ref_rejected": -80.05536651611328, + "logps/rejected": -184.19741821289062, + "loss": 1.0452, + "margin_dpo/margin_mean": 40.63452911376953, + "margin_dpo/margin_std": 56.74776077270508, + "step": 320 + }, + { + "epoch": 0.491307634164777, + "fcm_dpo/beta": 0.013363140635192394, + "fcm_dpo/delta": -0.023248041048645973, + "fcm_dpo/margin": 41.32105255126953, + "fcm_dpo/q_t": 0.3810966908931732, + "grad_norm": 14.63464069366455, + "learning_rate": 3.0249513619156206e-07, + "logits/chosen": 0.6304353475570679, + "logits/rejected": 0.5674418210983276, + "logps/chosen": -130.5197296142578, + "logps/ref_chosen": -57.90629959106445, + "logps/ref_rejected": -74.2243881225586, + "logps/rejected": -188.1588592529297, + "loss": 1.0513, + "margin_dpo/margin_mean": 41.32105255126953, + "margin_dpo/margin_std": 59.10980987548828, + "step": 325 + }, + { + "epoch": 0.4988662131519274, + "fcm_dpo/beta": 0.013443930074572563, + "fcm_dpo/delta": 0.021733686327934265, + "fcm_dpo/margin": 36.37574005126953, + "fcm_dpo/q_t": 0.39693742990493774, + "grad_norm": 15.07494831085205, + "learning_rate": 2.9601383051430505e-07, + "logits/chosen": 0.5850898623466492, + "logits/rejected": 0.5469895005226135, + "logps/chosen": -149.595458984375, + "logps/ref_chosen": -65.17555236816406, + "logps/ref_rejected": -78.53681182861328, + "logps/rejected": -199.3324432373047, + "loss": 1.1175, + "margin_dpo/margin_mean": 36.37574005126953, + "margin_dpo/margin_std": 62.23854446411133, + "step": 330 + }, + { + "epoch": 0.5064247921390779, + "fcm_dpo/beta": 0.01288739126175642, + "fcm_dpo/delta": -0.0680394172668457, + "fcm_dpo/margin": 46.44968795776367, + "fcm_dpo/q_t": 0.37343794107437134, + "grad_norm": 19.42026710510254, + "learning_rate": 2.895003489933375e-07, + "logits/chosen": 0.6479321122169495, + "logits/rejected": 0.600612998008728, + "logps/chosen": -147.13876342773438, + "logps/ref_chosen": -62.62797927856445, + "logps/ref_rejected": -79.9095458984375, + "logps/rejected": -210.8699951171875, + "loss": 1.0295, + "margin_dpo/margin_mean": 46.44968795776367, + "margin_dpo/margin_std": 64.50286865234375, + "step": 335 + }, + { + "epoch": 0.5139833711262283, + "fcm_dpo/beta": 0.012590940110385418, + "fcm_dpo/delta": 0.003505054162815213, + "fcm_dpo/margin": 38.454471588134766, + "fcm_dpo/q_t": 0.39839255809783936, + "grad_norm": 15.376999855041504, + "learning_rate": 2.8295924627584004e-07, + "logits/chosen": 0.6036761999130249, + "logits/rejected": 0.5653026103973389, + "logps/chosen": -155.42881774902344, + "logps/ref_chosen": -61.1064567565918, + "logps/ref_rejected": -76.71846008300781, + "logps/rejected": -209.4952850341797, + "loss": 1.1186, + "margin_dpo/margin_mean": 38.454471588134766, + "margin_dpo/margin_std": 66.48394012451172, + "step": 340 + }, + { + "epoch": 0.5215419501133787, + "fcm_dpo/beta": 0.012363018468022346, + "fcm_dpo/delta": -0.01725325547158718, + "fcm_dpo/margin": 44.01114273071289, + "fcm_dpo/q_t": 0.3849506974220276, + "grad_norm": 15.500265121459961, + "learning_rate": 2.7639509632351927e-07, + "logits/chosen": 0.6400725841522217, + "logits/rejected": 0.5962103009223938, + "logps/chosen": -147.3646240234375, + "logps/ref_chosen": -60.12370681762695, + "logps/ref_rejected": -78.58574676513672, + "logps/rejected": -209.83779907226562, + "loss": 1.0666, + "margin_dpo/margin_mean": 44.01114273071289, + "margin_dpo/margin_std": 65.67613220214844, + "step": 345 + }, + { + "epoch": 0.5291005291005291, + "fcm_dpo/beta": 0.012403665110468864, + "fcm_dpo/delta": -0.03641422092914581, + "fcm_dpo/margin": 49.11076354980469, + "fcm_dpo/q_t": 0.3730853796005249, + "grad_norm": 18.272642135620117, + "learning_rate": 2.698124892141971e-07, + "logits/chosen": 0.6958315372467041, + "logits/rejected": 0.6265360116958618, + "logps/chosen": -138.1358642578125, + "logps/ref_chosen": -55.104461669921875, + "logps/ref_rejected": -80.63292694091797, + "logps/rejected": -212.77511596679688, + "loss": 1.0253, + "margin_dpo/margin_mean": 49.11076354980469, + "margin_dpo/margin_std": 67.76351165771484, + "step": 350 + }, + { + "epoch": 0.5366591080876795, + "fcm_dpo/beta": 0.012127144262194633, + "fcm_dpo/delta": -0.010115819983184338, + "fcm_dpo/margin": 50.23556137084961, + "fcm_dpo/q_t": 0.37128472328186035, + "grad_norm": 17.643238067626953, + "learning_rate": 2.632160279321328e-07, + "logits/chosen": 0.6702345609664917, + "logits/rejected": 0.5912803411483765, + "logps/chosen": -134.65940856933594, + "logps/ref_chosen": -54.87224197387695, + "logps/ref_rejected": -77.01316833496094, + "logps/rejected": -207.03591918945312, + "loss": 1.0338, + "margin_dpo/margin_mean": 50.23556137084961, + "margin_dpo/margin_std": 71.0433578491211, + "step": 355 + }, + { + "epoch": 0.54421768707483, + "fcm_dpo/beta": 0.01166975311934948, + "fcm_dpo/delta": -0.01579994522035122, + "fcm_dpo/margin": 41.836509704589844, + "fcm_dpo/q_t": 0.3966527581214905, + "grad_norm": 15.070870399475098, + "learning_rate": 2.5661032514931834e-07, + "logits/chosen": 0.6302360892295837, + "logits/rejected": 0.5863192677497864, + "logps/chosen": -152.76345825195312, + "logps/ref_chosen": -60.75285720825195, + "logps/ref_rejected": -75.21507263183594, + "logps/rejected": -209.0622100830078, + "loss": 1.1188, + "margin_dpo/margin_mean": 41.83650588989258, + "margin_dpo/margin_std": 70.53252410888672, + "step": 360 + }, + { + "epoch": 0.5517762660619804, + "fcm_dpo/beta": 0.01143195666372776, + "fcm_dpo/delta": -0.052489638328552246, + "fcm_dpo/margin": 56.774986267089844, + "fcm_dpo/q_t": 0.3644375205039978, + "grad_norm": 12.386019706726074, + "learning_rate": 2.5e-07, + "logits/chosen": 0.6857043504714966, + "logits/rejected": 0.6063531637191772, + "logps/chosen": -149.87673950195312, + "logps/ref_chosen": -58.56513595581055, + "logps/ref_rejected": -84.06403350830078, + "logps/rejected": -232.150634765625, + "loss": 0.9963, + "margin_dpo/margin_mean": 56.774986267089844, + "margin_dpo/margin_std": 74.50080871582031, + "step": 365 + }, + { + "epoch": 0.5593348450491308, + "fcm_dpo/beta": 0.011315222829580307, + "fcm_dpo/delta": 0.02159869484603405, + "fcm_dpo/margin": 45.84794616699219, + "fcm_dpo/q_t": 0.3889442980289459, + "grad_norm": 15.18197250366211, + "learning_rate": 2.4338967485068164e-07, + "logits/chosen": 0.6318791508674622, + "logits/rejected": 0.5831542611122131, + "logps/chosen": -152.20651245117188, + "logps/ref_chosen": -59.443138122558594, + "logps/ref_rejected": -75.80937194824219, + "logps/rejected": -214.42068481445312, + "loss": 1.0915, + "margin_dpo/margin_mean": 45.84794616699219, + "margin_dpo/margin_std": 73.65330505371094, + "step": 370 + }, + { + "epoch": 0.5668934240362812, + "fcm_dpo/beta": 0.011248277500271797, + "fcm_dpo/delta": -0.027419675141572952, + "fcm_dpo/margin": 46.06201171875, + "fcm_dpo/q_t": 0.3906846046447754, + "grad_norm": 16.094900131225586, + "learning_rate": 2.3678397206786715e-07, + "logits/chosen": 0.6881932616233826, + "logits/rejected": 0.6348354816436768, + "logps/chosen": -155.08950805664062, + "logps/ref_chosen": -58.59185028076172, + "logps/ref_rejected": -73.7529525756836, + "logps/rejected": -216.31265258789062, + "loss": 1.1143, + "margin_dpo/margin_mean": 46.062007904052734, + "margin_dpo/margin_std": 78.36566162109375, + "step": 375 + }, + { + "epoch": 0.5744520030234316, + "fcm_dpo/beta": 0.010973427444696426, + "fcm_dpo/delta": -0.023532114923000336, + "fcm_dpo/margin": 51.64561080932617, + "fcm_dpo/q_t": 0.3803391456604004, + "grad_norm": 13.79555892944336, + "learning_rate": 2.3018751078580283e-07, + "logits/chosen": 0.7098981142044067, + "logits/rejected": 0.6563004851341248, + "logps/chosen": -153.05264282226562, + "logps/ref_chosen": -58.93424606323242, + "logps/ref_rejected": -76.27055358886719, + "logps/rejected": -222.03457641601562, + "loss": 1.0563, + "margin_dpo/margin_mean": 51.64561080932617, + "margin_dpo/margin_std": 76.09913635253906, + "step": 380 + }, + { + "epoch": 0.582010582010582, + "fcm_dpo/beta": 0.010893596336245537, + "fcm_dpo/delta": 0.006062631495296955, + "fcm_dpo/margin": 44.309181213378906, + "fcm_dpo/q_t": 0.39645999670028687, + "grad_norm": 13.824441909790039, + "learning_rate": 2.2360490367648084e-07, + "logits/chosen": 0.6328981518745422, + "logits/rejected": 0.606531023979187, + "logps/chosen": -165.55270385742188, + "logps/ref_chosen": -66.42684173583984, + "logps/ref_rejected": -76.96304321289062, + "logps/rejected": -220.3980712890625, + "loss": 1.1059, + "margin_dpo/margin_mean": 44.30918502807617, + "margin_dpo/margin_std": 72.50572204589844, + "step": 385 + }, + { + "epoch": 0.5895691609977324, + "fcm_dpo/beta": 0.011033998802304268, + "fcm_dpo/delta": 0.017967429012060165, + "fcm_dpo/margin": 46.52573013305664, + "fcm_dpo/q_t": 0.39048102498054504, + "grad_norm": 13.157139778137207, + "learning_rate": 2.170407537241599e-07, + "logits/chosen": 0.6664471626281738, + "logits/rejected": 0.6082719564437866, + "logps/chosen": -158.45370483398438, + "logps/ref_chosen": -60.984214782714844, + "logps/ref_rejected": -79.54056549072266, + "logps/rejected": -223.53579711914062, + "loss": 1.0801, + "margin_dpo/margin_mean": 46.52573013305664, + "margin_dpo/margin_std": 71.85535430908203, + "step": 390 + }, + { + "epoch": 0.5971277399848829, + "fcm_dpo/beta": 0.010882696136832237, + "fcm_dpo/delta": -0.01834883727133274, + "fcm_dpo/margin": 53.6688117980957, + "fcm_dpo/q_t": 0.37560978531837463, + "grad_norm": 17.336837768554688, + "learning_rate": 2.104996510066625e-07, + "logits/chosen": 0.6918023824691772, + "logits/rejected": 0.6310297846794128, + "logps/chosen": -150.5190887451172, + "logps/ref_chosen": -58.30937957763672, + "logps/ref_rejected": -80.09587097167969, + "logps/rejected": -225.9744110107422, + "loss": 1.0295, + "margin_dpo/margin_mean": 53.6688117980957, + "margin_dpo/margin_std": 73.11488342285156, + "step": 395 + }, + { + "epoch": 0.6046863189720333, + "fcm_dpo/beta": 0.010488608852028847, + "fcm_dpo/delta": -0.05746689438819885, + "fcm_dpo/margin": 49.87424850463867, + "fcm_dpo/q_t": 0.38892143964767456, + "grad_norm": 19.94718360900879, + "learning_rate": 2.0398616948569493e-07, + "logits/chosen": 0.6400595307350159, + "logits/rejected": 0.5548309087753296, + "logps/chosen": -163.4067840576172, + "logps/ref_chosen": -61.39867401123047, + "logps/ref_rejected": -89.0177993774414, + "logps/rejected": -240.90017700195312, + "loss": 1.0738, + "margin_dpo/margin_mean": 49.87424850463867, + "margin_dpo/margin_std": 74.35093688964844, + "step": 400 + }, + { + "epoch": 0.6046863189720333, + "eval_fcm_dpo/beta": 0.010275867767632008, + "eval_logits/chosen": 0.6246050596237183, + "eval_logits/rejected": 0.5774987936019897, + "eval_logps/chosen": -176.5742950439453, + "eval_logps/ref_chosen": -74.85946655273438, + "eval_logps/ref_rejected": -79.54898834228516, + "eval_logps/rejected": -226.17611694335938, + "eval_loss": 0.5613793134689331, + "eval_margin_dpo/margin_mean": 44.91230392456055, + "eval_margin_dpo/margin_std": 77.27910614013672, + "eval_runtime": 39.1906, + "eval_samples_per_second": 58.764, + "eval_steps_per_second": 1.837, + "step": 400 + }, + { + "epoch": 0.6122448979591837, + "fcm_dpo/beta": 0.010087807662785053, + "fcm_dpo/delta": -0.038665831089019775, + "fcm_dpo/margin": 55.62682342529297, + "fcm_dpo/q_t": 0.3804628252983093, + "grad_norm": 13.084096908569336, + "learning_rate": 1.975048638084379e-07, + "logits/chosen": 0.6958111524581909, + "logits/rejected": 0.6256667971611023, + "logps/chosen": -153.22628784179688, + "logps/ref_chosen": -55.953521728515625, + "logps/ref_rejected": -77.67539978027344, + "logps/rejected": -230.57498168945312, + "loss": 1.0364, + "margin_dpo/margin_mean": 55.62682342529297, + "margin_dpo/margin_std": 75.48118591308594, + "step": 405 + }, + { + "epoch": 0.6198034769463341, + "fcm_dpo/beta": 0.009773796424269676, + "fcm_dpo/delta": -0.03128813952207565, + "fcm_dpo/margin": 55.161216735839844, + "fcm_dpo/q_t": 0.38234299421310425, + "grad_norm": 12.041950225830078, + "learning_rate": 1.9106026612264315e-07, + "logits/chosen": 0.6618553996086121, + "logits/rejected": 0.5954070687294006, + "logps/chosen": -169.55258178710938, + "logps/ref_chosen": -63.40419387817383, + "logps/ref_rejected": -80.85710144042969, + "logps/rejected": -242.1666717529297, + "loss": 1.0439, + "margin_dpo/margin_mean": 55.161216735839844, + "margin_dpo/margin_std": 74.25384521484375, + "step": 410 + }, + { + "epoch": 0.6273620559334845, + "fcm_dpo/beta": 0.009798675775527954, + "fcm_dpo/delta": 0.039564795792102814, + "fcm_dpo/margin": 52.46839141845703, + "fcm_dpo/q_t": 0.38860344886779785, + "grad_norm": 13.28818416595459, + "learning_rate": 1.846568829074628e-07, + "logits/chosen": 0.6661458015441895, + "logits/rejected": 0.6173139214515686, + "logps/chosen": -174.634765625, + "logps/ref_chosen": -57.6942024230957, + "logps/ref_rejected": -71.74036407470703, + "logps/rejected": -241.14932250976562, + "loss": 1.0677, + "margin_dpo/margin_mean": 52.46839141845703, + "margin_dpo/margin_std": 77.23680114746094, + "step": 415 + }, + { + "epoch": 0.6349206349206349, + "fcm_dpo/beta": 0.009716962464153767, + "fcm_dpo/delta": -0.0343676395714283, + "fcm_dpo/margin": 47.64646911621094, + "fcm_dpo/q_t": 0.4010258615016937, + "grad_norm": 15.641878128051758, + "learning_rate": 1.782991918222275e-07, + "logits/chosen": 0.6854730248451233, + "logits/rejected": 0.6435775756835938, + "logps/chosen": -182.29537963867188, + "logps/ref_chosen": -59.169517517089844, + "logps/ref_rejected": -69.47721099853516, + "logps/rejected": -240.24954223632812, + "loss": 1.1303, + "margin_dpo/margin_mean": 47.64646911621094, + "margin_dpo/margin_std": 82.67323303222656, + "step": 420 + }, + { + "epoch": 0.6424792139077853, + "fcm_dpo/beta": 0.009624272584915161, + "fcm_dpo/delta": 0.003170407610014081, + "fcm_dpo/margin": 58.16600799560547, + "fcm_dpo/q_t": 0.3807678818702698, + "grad_norm": 14.270646095275879, + "learning_rate": 1.7199163857537824e-07, + "logits/chosen": 0.6730635166168213, + "logits/rejected": 0.6302940845489502, + "logps/chosen": -172.57290649414062, + "logps/ref_chosen": -58.09320831298828, + "logps/ref_rejected": -73.98226165771484, + "logps/rejected": -246.6279754638672, + "loss": 1.0478, + "margin_dpo/margin_mean": 58.16600799560547, + "margin_dpo/margin_std": 82.8730239868164, + "step": 425 + }, + { + "epoch": 0.6500377928949358, + "fcm_dpo/beta": 0.009675036184489727, + "fcm_dpo/delta": -0.009549234993755817, + "fcm_dpo/margin": 51.29081344604492, + "fcm_dpo/q_t": 0.39365965127944946, + "grad_norm": 14.406279563903809, + "learning_rate": 1.6573863381573954e-07, + "logits/chosen": 0.6383100748062134, + "logits/rejected": 0.6207207441329956, + "logps/chosen": -191.18653869628906, + "logps/ref_chosen": -62.7039909362793, + "logps/ref_rejected": -74.52284240722656, + "logps/rejected": -254.29623413085938, + "loss": 1.112, + "margin_dpo/margin_mean": 51.29081344604492, + "margin_dpo/margin_std": 86.48429870605469, + "step": 430 + }, + { + "epoch": 0.6575963718820862, + "fcm_dpo/beta": 0.009738308377563953, + "fcm_dpo/delta": 0.005447807256132364, + "fcm_dpo/margin": 59.08086013793945, + "fcm_dpo/q_t": 0.3763192296028137, + "grad_norm": 16.807050704956055, + "learning_rate": 1.5954455004830878e-07, + "logits/chosen": 0.7440453171730042, + "logits/rejected": 0.7008776664733887, + "logps/chosen": -169.50389099121094, + "logps/ref_chosen": -56.12516403198242, + "logps/ref_rejected": -74.36073303222656, + "logps/rejected": -246.8203125, + "loss": 1.0417, + "margin_dpo/margin_mean": 59.08086013793945, + "margin_dpo/margin_std": 83.0219955444336, + "step": 435 + }, + { + "epoch": 0.6651549508692366, + "fcm_dpo/beta": 0.009510443545877934, + "fcm_dpo/delta": -0.04184270650148392, + "fcm_dpo/margin": 58.687843322753906, + "fcm_dpo/q_t": 0.3826465308666229, + "grad_norm": 22.634798049926758, + "learning_rate": 1.534137185767178e-07, + "logits/chosen": 0.6856757998466492, + "logits/rejected": 0.6076371073722839, + "logps/chosen": -172.70729064941406, + "logps/ref_chosen": -55.67548751831055, + "logps/ref_rejected": -76.62055206298828, + "logps/rejected": -252.34017944335938, + "loss": 1.0688, + "margin_dpo/margin_mean": 58.687843322753906, + "margin_dpo/margin_std": 89.2109146118164, + "step": 440 + }, + { + "epoch": 0.672713529856387, + "fcm_dpo/beta": 0.008997871540486813, + "fcm_dpo/delta": -0.03983866050839424, + "fcm_dpo/margin": 64.14662170410156, + "fcm_dpo/q_t": 0.3751087486743927, + "grad_norm": 14.766826629638672, + "learning_rate": 1.473504264745062e-07, + "logits/chosen": 0.6673511266708374, + "logits/rejected": 0.6046266555786133, + "logps/chosen": -180.44454956054688, + "logps/ref_chosen": -59.903411865234375, + "logps/ref_rejected": -82.02873229980469, + "logps/rejected": -266.71649169921875, + "loss": 1.023, + "margin_dpo/margin_mean": 64.14662170410156, + "margin_dpo/margin_std": 84.01716613769531, + "step": 445 + }, + { + "epoch": 0.6802721088435374, + "fcm_dpo/beta": 0.008571968413889408, + "fcm_dpo/delta": -0.029057633131742477, + "fcm_dpo/margin": 60.95649337768555, + "fcm_dpo/q_t": 0.3861503601074219, + "grad_norm": 15.082186698913574, + "learning_rate": 1.4135891358732205e-07, + "logits/chosen": 0.670871376991272, + "logits/rejected": 0.6003819704055786, + "logps/chosen": -176.04681396484375, + "logps/ref_chosen": -55.83526611328125, + "logps/ref_rejected": -79.63658142089844, + "logps/rejected": -260.80462646484375, + "loss": 1.0575, + "margin_dpo/margin_mean": 60.95649337768555, + "margin_dpo/margin_std": 84.30404663085938, + "step": 450 + }, + { + "epoch": 0.6878306878306878, + "fcm_dpo/beta": 0.008977680467069149, + "fcm_dpo/delta": 0.06819285452365875, + "fcm_dpo/margin": 57.031578063964844, + "fcm_dpo/q_t": 0.39055323600769043, + "grad_norm": 14.447818756103516, + "learning_rate": 1.354433695681474e-07, + "logits/chosen": 0.6231824159622192, + "logits/rejected": 0.5777461528778076, + "logps/chosen": -178.04124450683594, + "logps/ref_chosen": -60.59226608276367, + "logps/ref_rejected": -73.37936401367188, + "logps/rejected": -247.8599395751953, + "loss": 1.0795, + "margin_dpo/margin_mean": 57.031578063964844, + "margin_dpo/margin_std": 88.28900146484375, + "step": 455 + }, + { + "epoch": 0.6953892668178382, + "fcm_dpo/beta": 0.009271183051168919, + "fcm_dpo/delta": -0.02087727189064026, + "fcm_dpo/margin": 65.31262969970703, + "fcm_dpo/q_t": 0.3707457184791565, + "grad_norm": 13.688095092773438, + "learning_rate": 1.2960793094762345e-07, + "logits/chosen": 0.6910965442657471, + "logits/rejected": 0.6071202158927917, + "logps/chosen": -175.61166381835938, + "logps/ref_chosen": -56.21283721923828, + "logps/ref_rejected": -83.02075958251953, + "logps/rejected": -267.73223876953125, + "loss": 1.0119, + "margin_dpo/margin_mean": 65.31262969970703, + "margin_dpo/margin_std": 85.2598648071289, + "step": 460 + }, + { + "epoch": 0.7029478458049887, + "fcm_dpo/beta": 0.008703077211976051, + "fcm_dpo/delta": -0.03589098900556564, + "fcm_dpo/margin": 65.30760192871094, + "fcm_dpo/q_t": 0.37661120295524597, + "grad_norm": 15.768505096435547, + "learning_rate": 1.238566782415197e-07, + "logits/chosen": 0.7279990315437317, + "logits/rejected": 0.6809935569763184, + "logps/chosen": -180.1580352783203, + "logps/ref_chosen": -59.0674934387207, + "logps/ref_rejected": -74.53498840332031, + "logps/rejected": -260.93310546875, + "loss": 1.0318, + "margin_dpo/margin_mean": 65.30760192871094, + "margin_dpo/margin_std": 86.46934509277344, + "step": 465 + }, + { + "epoch": 0.7105064247921391, + "fcm_dpo/beta": 0.008754456415772438, + "fcm_dpo/delta": 0.00041560232057236135, + "fcm_dpo/margin": 60.178565979003906, + "fcm_dpo/q_t": 0.3857038617134094, + "grad_norm": 13.696944236755371, + "learning_rate": 1.1819363309737438e-07, + "logits/chosen": 0.7032414674758911, + "logits/rejected": 0.6553713083267212, + "logps/chosen": -180.98046875, + "logps/ref_chosen": -58.3397331237793, + "logps/ref_rejected": -74.33660125732422, + "logps/rejected": -257.1558837890625, + "loss": 1.0557, + "margin_dpo/margin_mean": 60.178558349609375, + "margin_dpo/margin_std": 85.16178131103516, + "step": 470 + }, + { + "epoch": 0.7180650037792895, + "fcm_dpo/beta": 0.008638769388198853, + "fcm_dpo/delta": -0.022516410797834396, + "fcm_dpo/margin": 68.27113342285156, + "fcm_dpo/q_t": 0.3759641647338867, + "grad_norm": 10.956338882446289, + "learning_rate": 1.126227554822985e-07, + "logits/chosen": 0.7186409831047058, + "logits/rejected": 0.6497506499290466, + "logps/chosen": -168.41812133789062, + "logps/ref_chosen": -54.60407638549805, + "logps/ref_rejected": -79.94635009765625, + "logps/rejected": -262.03155517578125, + "loss": 1.0416, + "margin_dpo/margin_mean": 68.27113342285156, + "margin_dpo/margin_std": 97.92758178710938, + "step": 475 + }, + { + "epoch": 0.7256235827664399, + "fcm_dpo/beta": 0.00875013880431652, + "fcm_dpo/delta": 0.02565288171172142, + "fcm_dpo/margin": 54.354835510253906, + "fcm_dpo/q_t": 0.39852726459503174, + "grad_norm": 17.79652976989746, + "learning_rate": 1.0714794091391072e-07, + "logits/chosen": 0.6550045013427734, + "logits/rejected": 0.6366511583328247, + "logps/chosen": -192.35037231445312, + "logps/ref_chosen": -63.0672492980957, + "logps/ref_rejected": -68.59602355957031, + "logps/rejected": -252.2339324951172, + "loss": 1.1297, + "margin_dpo/margin_mean": 54.354835510253906, + "margin_dpo/margin_std": 96.1163101196289, + "step": 480 + }, + { + "epoch": 0.7331821617535903, + "fcm_dpo/beta": 0.008799830451607704, + "fcm_dpo/delta": 0.002256347332149744, + "fcm_dpo/margin": 59.921966552734375, + "fcm_dpo/q_t": 0.3874397277832031, + "grad_norm": 14.530784606933594, + "learning_rate": 1.0177301773633992e-07, + "logits/chosen": 0.7001765370368958, + "logits/rejected": 0.6357440948486328, + "logps/chosen": -185.18301391601562, + "logps/ref_chosen": -58.75799560546875, + "logps/ref_rejected": -79.72233581542969, + "logps/rejected": -266.0693054199219, + "loss": 1.0675, + "margin_dpo/margin_mean": 59.921974182128906, + "margin_dpo/margin_std": 89.0008316040039, + "step": 485 + }, + { + "epoch": 0.7407407407407407, + "fcm_dpo/beta": 0.00887683592736721, + "fcm_dpo/delta": 0.020326469093561172, + "fcm_dpo/margin": 53.544097900390625, + "fcm_dpo/q_t": 0.4002537131309509, + "grad_norm": 14.441047668457031, + "learning_rate": 9.650174444319956e-08, + "logits/chosen": 0.7496536374092102, + "logits/rejected": 0.6850180625915527, + "logps/chosen": -195.7850799560547, + "logps/ref_chosen": -61.394195556640625, + "logps/ref_rejected": -81.1914291381836, + "logps/rejected": -269.12640380859375, + "loss": 1.1317, + "margin_dpo/margin_mean": 53.544097900390625, + "margin_dpo/margin_std": 96.80680847167969, + "step": 490 + }, + { + "epoch": 0.7482993197278912, + "fcm_dpo/beta": 0.008899571374058723, + "fcm_dpo/delta": -0.002458928618580103, + "fcm_dpo/margin": 53.95166778564453, + "fcm_dpo/q_t": 0.39891940355300903, + "grad_norm": 18.731355667114258, + "learning_rate": 9.133780704940594e-08, + "logits/chosen": 0.6664924621582031, + "logits/rejected": 0.600567102432251, + "logps/chosen": -189.1266632080078, + "logps/ref_chosen": -59.85382843017578, + "logps/ref_rejected": -80.63748931884766, + "logps/rejected": -263.86199951171875, + "loss": 1.1266, + "margin_dpo/margin_mean": 53.95166778564453, + "margin_dpo/margin_std": 95.11207580566406, + "step": 495 + }, + { + "epoch": 0.7558578987150416, + "fcm_dpo/beta": 0.008871853351593018, + "fcm_dpo/delta": 0.011157815344631672, + "fcm_dpo/margin": 64.1400375366211, + "fcm_dpo/q_t": 0.3798808455467224, + "grad_norm": 18.928569793701172, + "learning_rate": 8.628481651367875e-08, + "logits/chosen": 0.6870494484901428, + "logits/rejected": 0.6374934911727905, + "logps/chosen": -194.50869750976562, + "logps/ref_chosen": -66.17753601074219, + "logps/ref_rejected": -83.75955200195312, + "logps/rejected": -276.23077392578125, + "loss": 1.0621, + "margin_dpo/margin_mean": 64.1400375366211, + "margin_dpo/margin_std": 97.7823257446289, + "step": 500 + }, + { + "epoch": 0.763416477702192, + "fcm_dpo/beta": 0.009083734825253487, + "fcm_dpo/delta": -0.0031442195177078247, + "fcm_dpo/margin": 59.1200065612793, + "fcm_dpo/q_t": 0.3837282359600067, + "grad_norm": 16.126550674438477, + "learning_rate": 8.134630621352483e-08, + "logits/chosen": 0.6756311655044556, + "logits/rejected": 0.655124843120575, + "logps/chosen": -185.13583374023438, + "logps/ref_chosen": -62.11005401611328, + "logps/ref_rejected": -74.64705657958984, + "logps/rejected": -256.7928466796875, + "loss": 1.0546, + "margin_dpo/margin_mean": 59.1200065612793, + "margin_dpo/margin_std": 83.1792984008789, + "step": 505 + }, + { + "epoch": 0.7709750566893424, + "fcm_dpo/beta": 0.008973537012934685, + "fcm_dpo/delta": -0.01379710715264082, + "fcm_dpo/margin": 61.247772216796875, + "fcm_dpo/q_t": 0.38576018810272217, + "grad_norm": 15.6004056930542, + "learning_rate": 7.652572947447272e-08, + "logits/chosen": 0.6822357177734375, + "logits/rejected": 0.6185404658317566, + "logps/chosen": -192.7943572998047, + "logps/ref_chosen": -64.42265319824219, + "logps/ref_rejected": -87.00096130371094, + "logps/rejected": -276.62042236328125, + "loss": 1.0879, + "margin_dpo/margin_mean": 61.247772216796875, + "margin_dpo/margin_std": 99.09281158447266, + "step": 510 + }, + { + "epoch": 0.7785336356764928, + "fcm_dpo/beta": 0.008877582848072052, + "fcm_dpo/delta": 0.016705047339200974, + "fcm_dpo/margin": 63.62353515625, + "fcm_dpo/q_t": 0.37913957238197327, + "grad_norm": 17.3339900970459, + "learning_rate": 7.182645715528435e-08, + "logits/chosen": 0.7022300958633423, + "logits/rejected": 0.6536498665809631, + "logps/chosen": -183.25079345703125, + "logps/ref_chosen": -58.284393310546875, + "logps/ref_rejected": -79.09356689453125, + "logps/rejected": -267.6835021972656, + "loss": 1.0458, + "margin_dpo/margin_mean": 63.62353515625, + "margin_dpo/margin_std": 90.51985168457031, + "step": 515 + }, + { + "epoch": 0.7860922146636432, + "fcm_dpo/beta": 0.009218396618962288, + "fcm_dpo/delta": 0.03311960771679878, + "fcm_dpo/margin": 47.081138610839844, + "fcm_dpo/q_t": 0.40798163414001465, + "grad_norm": 17.232772827148438, + "learning_rate": 6.725177529083209e-08, + "logits/chosen": 0.7172441482543945, + "logits/rejected": 0.6776331067085266, + "logps/chosen": -190.6273956298828, + "logps/ref_chosen": -61.03638458251953, + "logps/ref_rejected": -72.15824890136719, + "logps/rejected": -248.83041381835938, + "loss": 1.1669, + "margin_dpo/margin_mean": 47.081138610839844, + "margin_dpo/margin_std": 92.7890396118164, + "step": 520 + }, + { + "epoch": 0.7936507936507936, + "fcm_dpo/beta": 0.009218786843121052, + "fcm_dpo/delta": -0.009822583757340908, + "fcm_dpo/margin": 54.7793083190918, + "fcm_dpo/q_t": 0.39144212007522583, + "grad_norm": 19.94845199584961, + "learning_rate": 6.280488279429185e-08, + "logits/chosen": 0.6219805479049683, + "logits/rejected": 0.5724949240684509, + "logps/chosen": -194.5631103515625, + "logps/ref_chosen": -68.02732849121094, + "logps/ref_rejected": -85.41429901123047, + "logps/rejected": -266.7294006347656, + "loss": 1.1074, + "margin_dpo/margin_mean": 54.77930450439453, + "margin_dpo/margin_std": 92.09957122802734, + "step": 525 + }, + { + "epoch": 0.8012093726379441, + "fcm_dpo/beta": 0.009130226448178291, + "fcm_dpo/delta": -0.02196129783987999, + "fcm_dpo/margin": 50.85799026489258, + "fcm_dpo/q_t": 0.40008097887039185, + "grad_norm": 18.58346939086914, + "learning_rate": 5.848888922025552e-08, + "logits/chosen": 0.6770039796829224, + "logits/rejected": 0.6091686487197876, + "logps/chosen": -189.2750701904297, + "logps/ref_chosen": -58.67436599731445, + "logps/ref_rejected": -79.38807678222656, + "logps/rejected": -260.8467712402344, + "loss": 1.1307, + "margin_dpo/margin_mean": 50.857994079589844, + "margin_dpo/margin_std": 87.7162857055664, + "step": 530 + }, + { + "epoch": 0.8087679516250945, + "fcm_dpo/beta": 0.0091576362028718, + "fcm_dpo/delta": 0.029367243871092796, + "fcm_dpo/margin": 56.45143508911133, + "fcm_dpo/q_t": 0.39041271805763245, + "grad_norm": 18.556217193603516, + "learning_rate": 5.430681259032957e-08, + "logits/chosen": 0.6739664077758789, + "logits/rejected": 0.6132084727287292, + "logps/chosen": -183.68429565429688, + "logps/ref_chosen": -57.640098571777344, + "logps/ref_rejected": -77.25399780273438, + "logps/rejected": -259.7496643066406, + "loss": 1.0926, + "margin_dpo/margin_mean": 56.451438903808594, + "margin_dpo/margin_std": 91.31838989257812, + "step": 535 + }, + { + "epoch": 0.8163265306122449, + "fcm_dpo/beta": 0.009130528196692467, + "fcm_dpo/delta": -0.028515305370092392, + "fcm_dpo/margin": 64.78633117675781, + "fcm_dpo/q_t": 0.3742666244506836, + "grad_norm": 15.093501091003418, + "learning_rate": 5.026157728273966e-08, + "logits/chosen": 0.7153981924057007, + "logits/rejected": 0.6350281238555908, + "logps/chosen": -190.83726501464844, + "logps/ref_chosen": -60.17341995239258, + "logps/ref_rejected": -85.50316619873047, + "logps/rejected": -280.9533386230469, + "loss": 1.0162, + "margin_dpo/margin_mean": 64.78633117675781, + "margin_dpo/margin_std": 85.54998779296875, + "step": 540 + }, + { + "epoch": 0.8238851095993953, + "fcm_dpo/beta": 0.008908280171453953, + "fcm_dpo/delta": -0.029253508895635605, + "fcm_dpo/margin": 66.00330352783203, + "fcm_dpo/q_t": 0.37347084283828735, + "grad_norm": 16.25635528564453, + "learning_rate": 4.635601198741607e-08, + "logits/chosen": 0.7022188305854797, + "logits/rejected": 0.6508811116218567, + "logps/chosen": -179.33633422851562, + "logps/ref_chosen": -56.985809326171875, + "logps/ref_rejected": -73.21353912353516, + "logps/rejected": -261.56732177734375, + "loss": 1.029, + "margin_dpo/margin_mean": 66.00330352783203, + "margin_dpo/margin_std": 89.81163787841797, + "step": 545 + }, + { + "epoch": 0.8314436885865457, + "fcm_dpo/beta": 0.008911579847335815, + "fcm_dpo/delta": 0.03279992565512657, + "fcm_dpo/margin": 52.2221794128418, + "fcm_dpo/q_t": 0.3997356593608856, + "grad_norm": 16.76923179626465, + "learning_rate": 4.259284772799099e-08, + "logits/chosen": 0.6925860643386841, + "logits/rejected": 0.6450766324996948, + "logps/chosen": -189.15829467773438, + "logps/ref_chosen": -59.600929260253906, + "logps/ref_rejected": -75.24870300292969, + "logps/rejected": -257.02825927734375, + "loss": 1.1275, + "margin_dpo/margin_mean": 52.2221794128418, + "margin_dpo/margin_std": 90.92387390136719, + "step": 550 + }, + { + "epoch": 0.8390022675736961, + "fcm_dpo/beta": 0.009163258597254753, + "fcm_dpo/delta": 0.0038489706348627806, + "fcm_dpo/margin": 56.18461990356445, + "fcm_dpo/q_t": 0.38901767134666443, + "grad_norm": 16.93880271911621, + "learning_rate": 3.89747159520904e-08, + "logits/chosen": 0.6867181062698364, + "logits/rejected": 0.637639045715332, + "logps/chosen": -197.40147399902344, + "logps/ref_chosen": -63.578895568847656, + "logps/ref_rejected": -78.87867736816406, + "logps/rejected": -268.8858947753906, + "loss": 1.0913, + "margin_dpo/margin_mean": 56.18461990356445, + "margin_dpo/margin_std": 90.01570129394531, + "step": 555 + }, + { + "epoch": 0.8465608465608465, + "fcm_dpo/beta": 0.008957808837294579, + "fcm_dpo/delta": -0.0419851616024971, + "fcm_dpo/margin": 64.90444946289062, + "fcm_dpo/q_t": 0.3777204155921936, + "grad_norm": 16.868953704833984, + "learning_rate": 3.550414669125573e-08, + "logits/chosen": 0.7213538289070129, + "logits/rejected": 0.6617583632469177, + "logps/chosen": -192.423828125, + "logps/ref_chosen": -58.651512145996094, + "logps/ref_rejected": -78.67181396484375, + "logps/rejected": -277.34857177734375, + "loss": 1.0363, + "margin_dpo/margin_mean": 64.90444946289062, + "margin_dpo/margin_std": 90.19843292236328, + "step": 560 + }, + { + "epoch": 0.854119425547997, + "fcm_dpo/beta": 0.008735055103898048, + "fcm_dpo/delta": -0.009981656447052956, + "fcm_dpo/margin": 67.18910217285156, + "fcm_dpo/q_t": 0.3747270703315735, + "grad_norm": 14.736648559570312, + "learning_rate": 3.218356679178252e-08, + "logits/chosen": 0.7032049298286438, + "logits/rejected": 0.6600871682167053, + "logps/chosen": -187.43948364257812, + "logps/ref_chosen": -60.3114128112793, + "logps/ref_rejected": -78.25270080566406, + "logps/rejected": -272.56982421875, + "loss": 1.028, + "margin_dpo/margin_mean": 67.18910217285156, + "margin_dpo/margin_std": 91.42976379394531, + "step": 565 + }, + { + "epoch": 0.8616780045351474, + "fcm_dpo/beta": 0.008505801670253277, + "fcm_dpo/delta": -0.04424377158284187, + "fcm_dpo/margin": 65.48918914794922, + "fcm_dpo/q_t": 0.3805517554283142, + "grad_norm": 12.924057006835938, + "learning_rate": 2.9015298217712453e-08, + "logits/chosen": 0.6734435558319092, + "logits/rejected": 0.6112924814224243, + "logps/chosen": -184.1428680419922, + "logps/ref_chosen": -57.752410888671875, + "logps/ref_rejected": -76.99858093261719, + "logps/rejected": -268.8782043457031, + "loss": 1.049, + "margin_dpo/margin_mean": 65.48918914794922, + "margin_dpo/margin_std": 91.4268798828125, + "step": 570 + }, + { + "epoch": 0.8692365835222978, + "fcm_dpo/beta": 0.008431388065218925, + "fcm_dpo/delta": 0.01765955612063408, + "fcm_dpo/margin": 56.814170837402344, + "fcm_dpo/q_t": 0.39621537923812866, + "grad_norm": 14.525823593139648, + "learning_rate": 2.600155642716606e-08, + "logits/chosen": 0.701653242111206, + "logits/rejected": 0.66460120677948, + "logps/chosen": -196.06419372558594, + "logps/ref_chosen": -63.61958694458008, + "logps/ref_rejected": -79.51353454589844, + "logps/rejected": -268.7723388671875, + "loss": 1.101, + "margin_dpo/margin_mean": 56.814170837402344, + "margin_dpo/margin_std": 90.25949096679688, + "step": 575 + }, + { + "epoch": 0.8767951625094482, + "fcm_dpo/beta": 0.008416803553700447, + "fcm_dpo/delta": 0.0003098793386016041, + "fcm_dpo/margin": 62.08296585083008, + "fcm_dpo/q_t": 0.38741156458854675, + "grad_norm": 15.001502990722656, + "learning_rate": 2.3144448823151392e-08, + "logits/chosen": 0.6825278997421265, + "logits/rejected": 0.6386707425117493, + "logps/chosen": -182.51686096191406, + "logps/ref_chosen": -57.3541145324707, + "logps/ref_rejected": -73.14434051513672, + "logps/rejected": -260.3900451660156, + "loss": 1.0717, + "margin_dpo/margin_mean": 62.08296585083008, + "margin_dpo/margin_std": 92.49629211425781, + "step": 580 + }, + { + "epoch": 0.8843537414965986, + "fcm_dpo/beta": 0.008522504940629005, + "fcm_dpo/delta": 0.025987576693296432, + "fcm_dpo/margin": 57.36644744873047, + "fcm_dpo/q_t": 0.39568692445755005, + "grad_norm": 14.261137962341309, + "learning_rate": 2.044597327993153e-08, + "logits/chosen": 0.7333514094352722, + "logits/rejected": 0.6711838245391846, + "logps/chosen": -186.538330078125, + "logps/ref_chosen": -56.0127067565918, + "logps/ref_rejected": -77.16522216796875, + "logps/rejected": -265.05731201171875, + "loss": 1.1076, + "margin_dpo/margin_mean": 57.36644744873047, + "margin_dpo/margin_std": 95.25784301757812, + "step": 585 + }, + { + "epoch": 0.891912320483749, + "fcm_dpo/beta": 0.008789935149252415, + "fcm_dpo/delta": 0.02721945382654667, + "fcm_dpo/margin": 63.61796188354492, + "fcm_dpo/q_t": 0.3782525360584259, + "grad_norm": 15.488899230957031, + "learning_rate": 1.7908016745981856e-08, + "logits/chosen": 0.717170774936676, + "logits/rejected": 0.6842165589332581, + "logps/chosen": -190.9798126220703, + "logps/ref_chosen": -60.5894660949707, + "logps/ref_rejected": -74.34771728515625, + "logps/rejected": -268.35601806640625, + "loss": 1.0465, + "margin_dpo/margin_mean": 63.61796188354492, + "margin_dpo/margin_std": 90.69212341308594, + "step": 590 + }, + { + "epoch": 0.8994708994708994, + "fcm_dpo/beta": 0.008735476061701775, + "fcm_dpo/delta": -0.010337557643651962, + "fcm_dpo/margin": 67.07391357421875, + "fcm_dpo/q_t": 0.3761887550354004, + "grad_norm": 14.772221565246582, + "learning_rate": 1.553235392451377e-08, + "logits/chosen": 0.7367411255836487, + "logits/rejected": 0.6589676141738892, + "logps/chosen": -176.36756896972656, + "logps/ref_chosen": -54.77838897705078, + "logps/ref_rejected": -78.102783203125, + "logps/rejected": -266.765869140625, + "loss": 1.0433, + "margin_dpo/margin_mean": 67.07390594482422, + "margin_dpo/margin_std": 95.8719482421875, + "step": 595 + }, + { + "epoch": 0.9070294784580499, + "fcm_dpo/beta": 0.008924348279833794, + "fcm_dpo/delta": 0.013378431089222431, + "fcm_dpo/margin": 45.238609313964844, + "fcm_dpo/q_t": 0.41461238265037537, + "grad_norm": 18.25551986694336, + "learning_rate": 1.3320646032487393e-08, + "logits/chosen": 0.7176660299301147, + "logits/rejected": 0.6818990111351013, + "logps/chosen": -193.6077880859375, + "logps/ref_chosen": -58.45500564575195, + "logps/ref_rejected": -70.7367172241211, + "logps/rejected": -251.1281280517578, + "loss": 1.1653, + "margin_dpo/margin_mean": 45.238609313964844, + "margin_dpo/margin_std": 87.94874572753906, + "step": 600 + }, + { + "epoch": 0.9070294784580499, + "eval_fcm_dpo/beta": 0.008908301591873169, + "eval_logits/chosen": 0.7206099629402161, + "eval_logits/rejected": 0.6751406192779541, + "eval_logps/chosen": -205.21878051757812, + "eval_logps/ref_chosen": -74.85946655273438, + "eval_logps/ref_rejected": -79.54898834228516, + "eval_logps/rejected": -265.1909484863281, + "eval_loss": 0.5591413378715515, + "eval_margin_dpo/margin_mean": 55.28264236450195, + "eval_margin_dpo/margin_std": 95.356689453125, + "eval_runtime": 39.0896, + "eval_samples_per_second": 58.916, + "eval_steps_per_second": 1.842, + "step": 600 + }, + { + "epoch": 0.9145880574452003, + "fcm_dpo/beta": 0.00893603079020977, + "fcm_dpo/delta": 0.01746518909931183, + "fcm_dpo/margin": 63.60172653198242, + "fcm_dpo/q_t": 0.37951910495758057, + "grad_norm": 16.666015625, + "learning_rate": 1.1274439638981532e-08, + "logits/chosen": 0.7014644742012024, + "logits/rejected": 0.6582333445549011, + "logps/chosen": -179.68258666992188, + "logps/ref_chosen": -59.87483596801758, + "logps/ref_rejected": -75.75318908691406, + "logps/rejected": -259.16265869140625, + "loss": 1.0544, + "margin_dpo/margin_mean": 63.60172653198242, + "margin_dpo/margin_std": 93.95574951171875, + "step": 605 + }, + { + "epoch": 0.9221466364323507, + "fcm_dpo/beta": 0.008915998041629791, + "fcm_dpo/delta": -0.01860709860920906, + "fcm_dpo/margin": 66.0380859375, + "fcm_dpo/q_t": 0.37500935792922974, + "grad_norm": 14.762502670288086, + "learning_rate": 9.395165583732379e-09, + "logits/chosen": 0.706168532371521, + "logits/rejected": 0.6614619493484497, + "logps/chosen": -186.66229248046875, + "logps/ref_chosen": -60.35883712768555, + "logps/ref_rejected": -81.3543930053711, + "logps/rejected": -273.6959228515625, + "loss": 1.0278, + "margin_dpo/margin_mean": 66.03807830810547, + "margin_dpo/margin_std": 89.66718292236328, + "step": 610 + }, + { + "epoch": 0.9297052154195011, + "fcm_dpo/beta": 0.008840186521410942, + "fcm_dpo/delta": -0.026694372296333313, + "fcm_dpo/margin": 66.6244125366211, + "fcm_dpo/q_t": 0.3726271688938141, + "grad_norm": 15.342317581176758, + "learning_rate": 7.684137976598088e-09, + "logits/chosen": 0.6743055582046509, + "logits/rejected": 0.6356549859046936, + "logps/chosen": -185.5474395751953, + "logps/ref_chosen": -59.17219161987305, + "logps/ref_rejected": -79.92167663574219, + "logps/rejected": -272.9213562011719, + "loss": 1.0255, + "margin_dpo/margin_mean": 66.62440490722656, + "margin_dpo/margin_std": 89.74223327636719, + "step": 615 + }, + { + "epoch": 0.9372637944066515, + "fcm_dpo/beta": 0.00864451751112938, + "fcm_dpo/delta": -0.011452676728367805, + "fcm_dpo/margin": 58.722190856933594, + "fcm_dpo/q_t": 0.39084118604660034, + "grad_norm": 17.209096908569336, + "learning_rate": 6.142553278648238e-09, + "logits/chosen": 0.7176477313041687, + "logits/rejected": 0.6551352739334106, + "logps/chosen": -185.00552368164062, + "logps/ref_chosen": -58.052696228027344, + "logps/ref_rejected": -78.37252807617188, + "logps/rejected": -264.04754638671875, + "loss": 1.0716, + "margin_dpo/margin_mean": 58.722190856933594, + "margin_dpo/margin_std": 86.17276763916016, + "step": 620 + }, + { + "epoch": 0.9448223733938019, + "fcm_dpo/beta": 0.008548585698008537, + "fcm_dpo/delta": -0.0001246035099029541, + "fcm_dpo/margin": 60.6451530456543, + "fcm_dpo/q_t": 0.3894796669483185, + "grad_norm": 14.61771011352539, + "learning_rate": 4.7714894655209174e-09, + "logits/chosen": 0.708177924156189, + "logits/rejected": 0.6277607679367065, + "logps/chosen": -186.0558624267578, + "logps/ref_chosen": -56.957862854003906, + "logps/ref_rejected": -82.68255615234375, + "logps/rejected": -272.4256896972656, + "loss": 1.0748, + "margin_dpo/margin_mean": 60.6451530456543, + "margin_dpo/margin_std": 92.42916870117188, + "step": 625 + }, + { + "epoch": 0.9523809523809523, + "fcm_dpo/beta": 0.008414940908551216, + "fcm_dpo/delta": -0.02683025598526001, + "fcm_dpo/margin": 70.0490951538086, + "fcm_dpo/q_t": 0.3737347424030304, + "grad_norm": 11.857268333435059, + "learning_rate": 3.5719052736323806e-09, + "logits/chosen": 0.7122366428375244, + "logits/rejected": 0.6418401598930359, + "logps/chosen": -179.7769012451172, + "logps/ref_chosen": -56.71510696411133, + "logps/ref_rejected": -82.94544219970703, + "logps/rejected": -276.05633544921875, + "loss": 1.0285, + "margin_dpo/margin_mean": 70.0490951538086, + "margin_dpo/margin_std": 94.82304382324219, + "step": 630 + }, + { + "epoch": 0.9599395313681028, + "fcm_dpo/beta": 0.008062823675572872, + "fcm_dpo/delta": -0.03275930508971214, + "fcm_dpo/margin": 59.115440368652344, + "fcm_dpo/q_t": 0.3975747227668762, + "grad_norm": 13.964070320129395, + "learning_rate": 2.5446395297668287e-09, + "logits/chosen": 0.6974132061004639, + "logits/rejected": 0.6502237319946289, + "logps/chosen": -186.69309997558594, + "logps/ref_chosen": -59.33793258666992, + "logps/ref_rejected": -75.01703643798828, + "logps/rejected": -261.4876403808594, + "loss": 1.1043, + "margin_dpo/margin_mean": 59.115440368652344, + "margin_dpo/margin_std": 93.75061798095703, + "step": 635 + }, + { + "epoch": 0.9674981103552532, + "fcm_dpo/beta": 0.008327251300215721, + "fcm_dpo/delta": 0.06021968647837639, + "fcm_dpo/margin": 62.01350784301758, + "fcm_dpo/q_t": 0.38918977975845337, + "grad_norm": 14.674144744873047, + "learning_rate": 1.690410564514244e-09, + "logits/chosen": 0.6967864036560059, + "logits/rejected": 0.6229372024536133, + "logps/chosen": -191.25723266601562, + "logps/ref_chosen": -58.1605339050293, + "logps/ref_rejected": -79.85365295410156, + "logps/rejected": -274.9638671875, + "loss": 1.0702, + "margin_dpo/margin_mean": 62.01350784301758, + "margin_dpo/margin_std": 92.87417602539062, + "step": 640 + }, + { + "epoch": 0.9750566893424036, + "fcm_dpo/beta": 0.008840223774313927, + "fcm_dpo/delta": 0.05628042295575142, + "fcm_dpo/margin": 54.37908935546875, + "fcm_dpo/q_t": 0.3959693908691406, + "grad_norm": 16.510818481445312, + "learning_rate": 1.0098157099674987e-09, + "logits/chosen": 0.6872873306274414, + "logits/rejected": 0.6607547998428345, + "logps/chosen": -193.90921020507812, + "logps/ref_chosen": -63.45180130004883, + "logps/ref_rejected": -74.18285369873047, + "logps/rejected": -259.01934814453125, + "loss": 1.1021, + "margin_dpo/margin_mean": 54.37909698486328, + "margin_dpo/margin_std": 87.93758392333984, + "step": 645 + }, + { + "epoch": 0.982615268329554, + "fcm_dpo/beta": 0.009017017669975758, + "fcm_dpo/delta": -0.01029270887374878, + "fcm_dpo/margin": 63.77238845825195, + "fcm_dpo/q_t": 0.3787182569503784, + "grad_norm": 15.225814819335938, + "learning_rate": 5.033308820289184e-10, + "logits/chosen": 0.7203370332717896, + "logits/rejected": 0.6512852311134338, + "logps/chosen": -195.11532592773438, + "logps/ref_chosen": -59.75496292114258, + "logps/ref_rejected": -84.31481170654297, + "logps/rejected": -283.4475402832031, + "loss": 1.0611, + "margin_dpo/margin_mean": 63.77238082885742, + "margin_dpo/margin_std": 96.05448913574219, + "step": 650 + }, + { + "epoch": 0.9901738473167044, + "fcm_dpo/beta": 0.008963796310126781, + "fcm_dpo/delta": -0.022582078352570534, + "fcm_dpo/margin": 60.55501174926758, + "fcm_dpo/q_t": 0.3851621747016907, + "grad_norm": 13.021146774291992, + "learning_rate": 1.7131024761923852e-10, + "logits/chosen": 0.7035177946090698, + "logits/rejected": 0.6318515539169312, + "logps/chosen": -185.91603088378906, + "logps/ref_chosen": -57.817848205566406, + "logps/ref_rejected": -79.81755065917969, + "logps/rejected": -268.4707336425781, + "loss": 1.0654, + "margin_dpo/margin_mean": 60.55500411987305, + "margin_dpo/margin_std": 88.59367370605469, + "step": 655 + }, + { + "epoch": 0.9977324263038548, + "fcm_dpo/beta": 0.008747505024075508, + "fcm_dpo/delta": -0.01453787088394165, + "fcm_dpo/margin": 64.36149597167969, + "fcm_dpo/q_t": 0.3801228702068329, + "grad_norm": 15.389237403869629, + "learning_rate": 1.3985977021235829e-11, + "logits/chosen": 0.7586897611618042, + "logits/rejected": 0.6943166255950928, + "logps/chosen": -190.80844116210938, + "logps/ref_chosen": -59.12651443481445, + "logps/ref_rejected": -79.42085266113281, + "logps/rejected": -275.46429443359375, + "loss": 1.0594, + "margin_dpo/margin_mean": 64.36149597167969, + "margin_dpo/margin_std": 96.14913940429688, + "step": 660 + }, + { + "epoch": 0.999244142101285, + "step": 661, + "total_flos": 0.0, + "train_loss": 1.120150500454809, + "train_runtime": 1811.4729, + "train_samples_per_second": 23.371, + "train_steps_per_second": 0.365 + } + ], + "logging_steps": 5, + "max_steps": 661, + "num_input_tokens_seen": 0, + "num_train_epochs": 1, + "save_steps": 50, + "stateful_callbacks": { + "TrainerControl": { + "args": { + "should_epoch_stop": false, + "should_evaluate": false, + "should_log": false, + "should_save": false, + "should_training_stop": false + }, + "attributes": {} + } + }, + "total_flos": 0.0, + "train_batch_size": 8, + "trial_name": null, + "trial_params": null +}