初始化项目,由ModelHub XC社区提供模型
Model: bigscience/bloomz-7b1-p3 Source: Original Platform
This commit is contained in:
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "cb",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.625
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='cb', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "cb",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.08928571428571429
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='cb', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "cb",
|
||||
"template_name": "can we infer",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5892857142857143
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='cb', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='can we infer', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "cb",
|
||||
"template_name": "guaranteed/possible/impossible",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='cb', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='guaranteed/possible/impossible', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "cb",
|
||||
"template_name": "justified in saying",
|
||||
"evaluation": {
|
||||
"accuracy": 0.5357142857142857
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='cb', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='justified in saying', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "copa",
|
||||
"template_name": "C1 or C2? premise, so/because\u2026",
|
||||
"evaluation": {
|
||||
"accuracy": 0.66
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='copa', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='C1 or C2? premise, so/because\u2026', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "copa",
|
||||
"template_name": "C1 or C2? premise, so/because\u2026",
|
||||
"evaluation": {
|
||||
"accuracy": 0.66
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='copa', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='so/because\u2026,validation', target_max_length=256, template_config_name=None, template_name='C1 or C2? premise', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "copa",
|
||||
"template_name": "best_option",
|
||||
"evaluation": {
|
||||
"accuracy": 0.67
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='copa', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='best_option', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "copa",
|
||||
"template_name": "cause_effect",
|
||||
"evaluation": {
|
||||
"accuracy": 0.78
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='copa', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='cause_effect', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "copa",
|
||||
"template_name": "i_am_hesitating",
|
||||
"evaluation": {
|
||||
"accuracy": 0.8
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='copa', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='i_am_hesitating', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "copa",
|
||||
"template_name": "plausible_alternatives",
|
||||
"evaluation": {
|
||||
"accuracy": 0.81
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='copa', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='plausible_alternatives', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "rte",
|
||||
"template_name": "GPT-3 style",
|
||||
"evaluation": {
|
||||
"accuracy": 0.7870036101083032
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='rte', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='GPT-3 style', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "rte",
|
||||
"template_name": "MNLI crowdsource",
|
||||
"evaluation": {
|
||||
"accuracy": 0.7220216606498195
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='rte', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='MNLI crowdsource', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "rte",
|
||||
"template_name": "does it follow that",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6678700361010831
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='rte', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='does it follow that', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "rte",
|
||||
"template_name": "guaranteed true",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6714801444043321
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='rte', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='guaranteed true', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
@@ -0,0 +1,9 @@
|
||||
{
|
||||
"dataset_name": "super_glue",
|
||||
"dataset_config_name": "rte",
|
||||
"template_name": "should assume",
|
||||
"evaluation": {
|
||||
"accuracy": 0.6678700361010831
|
||||
},
|
||||
"arguments": "Namespace(config_name=None, dataset_config_name='rte', dataset_name='super_glue', debug=False, dtype='float16', max_length=2048, model_name_or_path='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000', output_dir='/gpfsscratch/rech/six/commun/experiments/muennighoff/bloomckpt/6b3t0/p31lossseqglobal_step1000/evaluation', pad_to_max_length=False, per_device_eval_batch_size=8, prefixlm=False, split='validation', target_max_length=256, template_config_name=None, template_name='should assume', tokenizer_name=None, use_slow_tokenizer=False)"
|
||||
}
|
||||
Reference in New Issue
Block a user