83 lines
3.2 KiB
YAML
83 lines
3.2 KiB
YAML
|
|
model_name: Tucano2-qwen-0.5B-Base
|
||
|
|
results:
|
||
|
|
niah_pt_multikey_1_1024: 0.376
|
||
|
|
niah_pt_multikey_1_1024_stderr: 0.02168382753928621
|
||
|
|
niah_pt_multikey_1_2048: 0.386
|
||
|
|
niah_pt_multikey_1_2048_stderr: 0.021793529219281196
|
||
|
|
niah_pt_multikey_1_4096: 0.356
|
||
|
|
niah_pt_multikey_1_4096_stderr: N/A
|
||
|
|
niah_pt_multikey_1_alias: " - niah_pt_multikey_1"
|
||
|
|
niah_pt_multikey_2_1024: 0.2
|
||
|
|
niah_pt_multikey_2_1024_stderr: 0.01790645924143381
|
||
|
|
niah_pt_multikey_2_2048: 0.086
|
||
|
|
niah_pt_multikey_2_2048_stderr: 0.012550818542716023
|
||
|
|
niah_pt_multikey_2_4096: 0.024
|
||
|
|
niah_pt_multikey_2_4096_stderr: N/A
|
||
|
|
niah_pt_multikey_2_alias: " - niah_pt_multikey_2"
|
||
|
|
niah_pt_multikey_3_1024: 0.236
|
||
|
|
niah_pt_multikey_3_1024_stderr: 0.01900869962208476
|
||
|
|
niah_pt_multikey_3_2048: 0.09
|
||
|
|
niah_pt_multikey_3_2048_stderr: 0.012811255071733842
|
||
|
|
niah_pt_multikey_3_4096: 0.044
|
||
|
|
niah_pt_multikey_3_4096_stderr: N/A
|
||
|
|
niah_pt_multikey_3_alias: " - niah_pt_multikey_3"
|
||
|
|
niah_pt_multiquery_1024: 0.1405
|
||
|
|
niah_pt_multiquery_1024_stderr: 0.010839949677836887
|
||
|
|
niah_pt_multiquery_2048: 0.121
|
||
|
|
niah_pt_multiquery_2048_stderr: 0.009920424872923468
|
||
|
|
niah_pt_multiquery_4096: 0.042
|
||
|
|
niah_pt_multiquery_4096_stderr: N/A
|
||
|
|
niah_pt_multiquery_alias: " - niah_pt_multiquery"
|
||
|
|
niah_pt_multivalue_1024: 0.2165
|
||
|
|
niah_pt_multivalue_1024_stderr: 0.012341398633885907
|
||
|
|
niah_pt_multivalue_2048: 0.1295
|
||
|
|
niah_pt_multivalue_2048_stderr: 0.010243014140249671
|
||
|
|
niah_pt_multivalue_4096: 0.0525
|
||
|
|
niah_pt_multivalue_4096_stderr: N/A
|
||
|
|
niah_pt_multivalue_alias: " - niah_pt_multivalue"
|
||
|
|
niah_pt_single_1_1024: 0.236
|
||
|
|
niah_pt_single_1_1024_stderr: 0.01900869962208476
|
||
|
|
niah_pt_single_1_2048: 0.228
|
||
|
|
niah_pt_single_1_2048_stderr: 0.018781306529363172
|
||
|
|
niah_pt_single_1_4096: 0.172
|
||
|
|
niah_pt_single_1_4096_stderr: N/A
|
||
|
|
niah_pt_single_1_alias: " - niah_pt_single_1"
|
||
|
|
niah_pt_single_2_1024: 0.32
|
||
|
|
niah_pt_single_2_1024_stderr: 0.02088234048876172
|
||
|
|
niah_pt_single_2_2048: 0.374
|
||
|
|
niah_pt_single_2_2048_stderr: 0.021660710347204473
|
||
|
|
niah_pt_single_2_4096: 0.37
|
||
|
|
niah_pt_single_2_4096_stderr: N/A
|
||
|
|
niah_pt_single_2_alias: " - niah_pt_single_2"
|
||
|
|
niah_pt_single_3_1024: 0.604
|
||
|
|
niah_pt_single_3_1024_stderr: 0.021893529941665716
|
||
|
|
niah_pt_single_3_2048: 0.6
|
||
|
|
niah_pt_single_3_2048_stderr: 0.02193084412072858
|
||
|
|
niah_pt_single_3_4096: 0.502
|
||
|
|
niah_pt_single_3_4096_stderr: N/A
|
||
|
|
niah_pt_single_3_alias: " - niah_pt_single_3"
|
||
|
|
ruler_pt_4096: 0.25705757575757576
|
||
|
|
ruler_pt_4096_stderr: N/A
|
||
|
|
ruler_pt_alias: ruler_pt
|
||
|
|
ruler_pt_cwe_1024: 0.5392
|
||
|
|
ruler_pt_cwe_1024_stderr: 0.01332673717935847
|
||
|
|
ruler_pt_cwe_2048: 0.321
|
||
|
|
ruler_pt_cwe_2048_stderr: 0.009951686899430094
|
||
|
|
ruler_pt_cwe_4096: 0.21059999999999998
|
||
|
|
ruler_pt_cwe_4096_stderr: N/A
|
||
|
|
ruler_pt_cwe_alias: " - ruler_pt_cwe"
|
||
|
|
ruler_pt_fwe_1024: 0.5753333333333333
|
||
|
|
ruler_pt_fwe_1024_stderr: 0.013569419559555793
|
||
|
|
ruler_pt_fwe_2048: 0.48533333333333334
|
||
|
|
ruler_pt_fwe_2048_stderr: 0.012767415662313082
|
||
|
|
ruler_pt_fwe_4096: 0.47333333333333333
|
||
|
|
ruler_pt_fwe_4096_stderr: N/A
|
||
|
|
ruler_pt_fwe_alias: " - ruler_pt_fwe"
|
||
|
|
ruler_pt_vt_1024: 0.9272
|
||
|
|
ruler_pt_vt_1024_stderr: 0.008164167272570364
|
||
|
|
ruler_pt_vt_2048: 0.842
|
||
|
|
ruler_pt_vt_2048_stderr: 0.00944936935262479
|
||
|
|
ruler_pt_vt_4096: 0.5812
|
||
|
|
ruler_pt_vt_4096_stderr: N/A
|
||
|
|
ruler_pt_vt_alias: " - ruler_pt_vt"
|